diff --git "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" --- "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" +++ "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.5506, "train/learning_rate": 9.11104513064133e-05, "train/epoch": 2.8, "train/global_step": 2500, "_runtime": 15588, "_timestamp": 1647609465, "_step": 2500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 62.0, 341.0, 487.0, 90.0, 12.0, 7.0, 5.0, 0.0, 1.0, 1.0], "bins": [-178.49705505371094, -175.31912231445312, -172.1411895751953, -168.9632568359375, -165.78533935546875, -162.60740661621094, -159.42947387695312, -156.2515411376953, -153.0736083984375, -149.8956756591797, -146.71774291992188, -143.53982543945312, -140.3618927001953, -137.1839599609375, -134.0060272216797, -130.82809448242188, -127.6501693725586, -124.47223663330078, -121.2943115234375, -118.11637878417969, -114.93844604492188, -111.76051330566406, -108.58258819580078, -105.40465545654297, -102.22673034667969, -99.04879760742188, -95.8708724975586, -92.69293975830078, -89.51500701904297, -86.33708190917969, -83.15914916992188, -79.98121643066406, -76.80328369140625, -73.62535095214844, -70.44742584228516, -67.26949310302734, -64.09156036376953, -60.913631439208984, -57.73570251464844, -54.557769775390625, -51.37983703613281, -48.201908111572266, -45.02397537231445, -41.846046447753906, -38.668113708496094, -35.49018478393555, -32.312255859375, -29.13432502746582, -25.956396102905273, -22.778465270996094, -19.600536346435547, -16.422605514526367, -13.244674682617188, -10.066743850708008, -6.888814926147461, -3.7108840942382812, -0.5329532623291016, 2.64497709274292, 5.822907447814941, 9.000837326049805, 12.178768157958984, 15.356698989868164, 18.53462791442871, 21.71255874633789, 24.89048957824707]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 6.0, 6.0, 12.0, 16.0, 19.0, 14.0, 15.0, 37.0, 31.0, 51.0, 62.0, 60.0, 89.0, 94.0, 89.0, 71.0, 57.0, 47.0, 43.0, 36.0, 28.0, 27.0, 19.0, 16.0, 10.0, 11.0, 10.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-53.00906753540039, -51.5723762512207, -50.13568115234375, -48.69898986816406, -47.262298583984375, -45.82560729980469, -44.388916015625, -42.95222091674805, -41.51552963256836, -40.07883834838867, -38.64214324951172, -37.20545196533203, -35.768760681152344, -34.332069396972656, -32.89537811279297, -31.458683013916016, -30.021991729736328, -28.58530044555664, -27.14860725402832, -25.7119140625, -24.275222778320312, -22.838531494140625, -21.401838302612305, -19.965145111083984, -18.528453826904297, -17.09176254272461, -15.655069351196289, -14.218377113342285, -12.781684875488281, -11.344992637634277, -9.908300399780273, -8.47160816192627, -7.034912109375, -5.598219871520996, -4.161527633666992, -2.7248353958129883, -1.2881431579589844, 0.14854907989501953, 1.5852413177490234, 3.0219335556030273, 4.458625793457031, 5.895318031311035, 7.332010269165039, 8.768702507019043, 10.205394744873047, 11.64208698272705, 13.078779220581055, 14.515471458435059, 15.952163696289062, 17.38885498046875, 18.82554817199707, 20.26224136352539, 21.698932647705078, 23.135623931884766, 24.572317123413086, 26.009010314941406, 27.445701599121094, 28.88239288330078, 30.3190860748291, 31.755779266357422, 33.19247055053711, 34.6291618347168, 36.06585693359375, 37.50254821777344, 38.939239501953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 11.0, 9.0, 12.0, 11.0, 19.0, 23.0, 22.0, 34.0, 41.0, 50.0, 60.0, 65.0, 73.0, 79.0, 90.0, 84.0, 42.0, 40.0, 46.0, 29.0, 29.0, 23.0, 17.0, 15.0, 20.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.052734375, -1.9895477294921875, -1.926361083984375, -1.8631744384765625, -1.79998779296875, -1.7368011474609375, -1.673614501953125, -1.6104278564453125, -1.5472412109375, -1.4840545654296875, -1.420867919921875, -1.3576812744140625, -1.29449462890625, -1.2313079833984375, -1.168121337890625, -1.1049346923828125, -1.041748046875, -0.9785614013671875, -0.915374755859375, -0.8521881103515625, -0.78900146484375, -0.7258148193359375, -0.662628173828125, -0.5994415283203125, -0.5362548828125, -0.4730682373046875, -0.409881591796875, -0.3466949462890625, -0.28350830078125, -0.2203216552734375, -0.157135009765625, -0.0939483642578125, -0.03076171875, 0.0324249267578125, 0.095611572265625, 0.1587982177734375, 0.22198486328125, 0.2851715087890625, 0.348358154296875, 0.4115447998046875, 0.4747314453125, 0.5379180908203125, 0.601104736328125, 0.6642913818359375, 0.72747802734375, 0.7906646728515625, 0.853851318359375, 0.9170379638671875, 0.980224609375, 1.0434112548828125, 1.106597900390625, 1.1697845458984375, 1.23297119140625, 1.2961578369140625, 1.359344482421875, 1.4225311279296875, 1.4857177734375, 1.5489044189453125, 1.612091064453125, 1.6752777099609375, 1.73846435546875, 1.8016510009765625, 1.864837646484375, 1.9280242919921875, 1.9912109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 6.0, 13.0, 16.0, 17.0, 26.0, 41.0, 54.0, 52.0, 107.0, 148.0, 197.0, 235.0, 347.0, 597.0, 785.0, 1132.0, 1756.0, 2816.0, 5067.0, 10623.0, 34865.0, 390093.0, 3347136.0, 345730.0, 30098.0, 8956.0, 4461.0, 2702.0, 1790.0, 1250.0, 851.0, 643.0, 437.0, 342.0, 247.0, 175.0, 121.0, 104.0, 56.0, 53.0, 35.0, 28.0, 14.0, 24.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-8.421875, -8.1776123046875, -7.933349609375, -7.6890869140625, -7.44482421875, -7.2005615234375, -6.956298828125, -6.7120361328125, -6.4677734375, -6.2235107421875, -5.979248046875, -5.7349853515625, -5.49072265625, -5.2464599609375, -5.002197265625, -4.7579345703125, -4.513671875, -4.2694091796875, -4.025146484375, -3.7808837890625, -3.53662109375, -3.2923583984375, -3.048095703125, -2.8038330078125, -2.5595703125, -2.3153076171875, -2.071044921875, -1.8267822265625, -1.58251953125, -1.3382568359375, -1.093994140625, -0.8497314453125, -0.60546875, -0.3612060546875, -0.116943359375, 0.1273193359375, 0.37158203125, 0.6158447265625, 0.860107421875, 1.1043701171875, 1.3486328125, 1.5928955078125, 1.837158203125, 2.0814208984375, 2.32568359375, 2.5699462890625, 2.814208984375, 3.0584716796875, 3.302734375, 3.5469970703125, 3.791259765625, 4.0355224609375, 4.27978515625, 4.5240478515625, 4.768310546875, 5.0125732421875, 5.2568359375, 5.5010986328125, 5.745361328125, 5.9896240234375, 6.23388671875, 6.4781494140625, 6.722412109375, 6.9666748046875, 7.2109375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 15.0, 7.0, 15.0, 21.0, 36.0, 35.0, 35.0, 68.0, 74.0, 112.0, 123.0, 190.0, 256.0, 322.0, 426.0, 471.0, 459.0, 322.0, 253.0, 204.0, 159.0, 108.0, 76.0, 53.0, 42.0, 35.0, 28.0, 27.0, 20.0, 9.0, 10.0, 10.0, 14.0, 9.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-6.59765625, -6.417236328125, -6.23681640625, -6.056396484375, -5.8759765625, -5.695556640625, -5.51513671875, -5.334716796875, -5.154296875, -4.973876953125, -4.79345703125, -4.613037109375, -4.4326171875, -4.252197265625, -4.07177734375, -3.891357421875, -3.7109375, -3.530517578125, -3.35009765625, -3.169677734375, -2.9892578125, -2.808837890625, -2.62841796875, -2.447998046875, -2.267578125, -2.087158203125, -1.90673828125, -1.726318359375, -1.5458984375, -1.365478515625, -1.18505859375, -1.004638671875, -0.82421875, -0.643798828125, -0.46337890625, -0.282958984375, -0.1025390625, 0.077880859375, 0.25830078125, 0.438720703125, 0.619140625, 0.799560546875, 0.97998046875, 1.160400390625, 1.3408203125, 1.521240234375, 1.70166015625, 1.882080078125, 2.0625, 2.242919921875, 2.42333984375, 2.603759765625, 2.7841796875, 2.964599609375, 3.14501953125, 3.325439453125, 3.505859375, 3.686279296875, 3.86669921875, 4.047119140625, 4.2275390625, 4.407958984375, 4.58837890625, 4.768798828125, 4.94921875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 7.0, 12.0, 30.0, 24.0, 40.0, 39.0, 81.0, 96.0, 149.0, 207.0, 350.0, 671.0, 1529.0, 4016.0, 11722.0, 42448.0, 319935.0, 3333812.0, 410077.0, 48371.0, 12838.0, 4337.0, 1647.0, 744.0, 355.0, 200.0, 141.0, 102.0, 75.0, 56.0, 46.0, 20.0, 23.0, 19.0, 7.0, 15.0, 9.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.375, -13.871337890625, -13.36767578125, -12.864013671875, -12.3603515625, -11.856689453125, -11.35302734375, -10.849365234375, -10.345703125, -9.842041015625, -9.33837890625, -8.834716796875, -8.3310546875, -7.827392578125, -7.32373046875, -6.820068359375, -6.31640625, -5.812744140625, -5.30908203125, -4.805419921875, -4.3017578125, -3.798095703125, -3.29443359375, -2.790771484375, -2.287109375, -1.783447265625, -1.27978515625, -0.776123046875, -0.2724609375, 0.231201171875, 0.73486328125, 1.238525390625, 1.7421875, 2.245849609375, 2.74951171875, 3.253173828125, 3.7568359375, 4.260498046875, 4.76416015625, 5.267822265625, 5.771484375, 6.275146484375, 6.77880859375, 7.282470703125, 7.7861328125, 8.289794921875, 8.79345703125, 9.297119140625, 9.80078125, 10.304443359375, 10.80810546875, 11.311767578125, 11.8154296875, 12.319091796875, 12.82275390625, 13.326416015625, 13.830078125, 14.333740234375, 14.83740234375, 15.341064453125, 15.8447265625, 16.348388671875, 16.85205078125, 17.355712890625, 17.859375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 9.0, 28.0, 46.0, 86.0, 193.0, 206.0, 188.0, 121.0, 66.0, 35.0, 13.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.34196090698242, -51.08407211303711, -49.82617950439453, -48.56829071044922, -47.31039810180664, -46.05250930786133, -44.79461669921875, -43.53672790527344, -42.27883529663086, -41.02094650268555, -39.76305389404297, -38.505165100097656, -37.24727249145508, -35.989383697509766, -34.73149108886719, -33.473602294921875, -32.21571350097656, -30.957822799682617, -29.699932098388672, -28.442041397094727, -27.18415069580078, -25.926259994506836, -24.66836929321289, -23.410480499267578, -22.152587890625, -20.894697189331055, -19.63680648803711, -18.378915786743164, -17.12102508544922, -15.863134384155273, -14.605244636535645, -13.3473539352417, -12.089460372924805, -10.83156967163086, -9.573678970336914, -8.315788269042969, -7.057898044586182, -5.800007343292236, -4.542117118835449, -3.284226417541504, -2.0263357162475586, -0.7684451341629028, 0.48944544792175293, 1.7473359107971191, 3.0052266120910645, 4.26311731338501, 5.521007537841797, 6.778898239135742, 8.036788940429688, 9.294679641723633, 10.552570343017578, 11.810461044311523, 13.068351745605469, 14.326242446899414, 15.584132194519043, 16.842021942138672, 18.09991455078125, 19.357805252075195, 20.61569595336914, 21.873586654663086, 23.13147735595703, 24.389368057250977, 25.647258758544922, 26.905147552490234, 28.16303825378418]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 2.0, 9.0, 7.0, 14.0, 13.0, 17.0, 26.0, 19.0, 29.0, 29.0, 29.0, 26.0, 46.0, 42.0, 51.0, 59.0, 41.0, 44.0, 34.0, 35.0, 51.0, 47.0, 36.0, 37.0, 39.0, 32.0, 32.0, 19.0, 19.0, 23.0, 14.0, 15.0, 16.0, 14.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8236026763916, -20.095436096191406, -19.367267608642578, -18.639101028442383, -17.910932540893555, -17.18276596069336, -16.45459747314453, -15.726430892944336, -14.998263359069824, -14.270095825195312, -13.5419282913208, -12.813760757446289, -12.085594177246094, -11.357425689697266, -10.62925910949707, -9.901091575622559, -9.172924041748047, -8.444756507873535, -7.716588973999023, -6.98842191696167, -6.260254383087158, -5.5320868492126465, -4.803919792175293, -4.075752258300781, -3.3475847244262695, -2.619417190551758, -1.8912498950958252, -1.1630825996398926, -0.43491506576538086, 0.29325246810913086, 1.0214195251464844, 1.749587059020996, 2.477754592895508, 3.2059221267700195, 3.934089422225952, 4.662256717681885, 5.3904242515563965, 6.118591785430908, 6.846758842468262, 7.574926376342773, 8.303093910217285, 9.031261444091797, 9.759428977966309, 10.48759651184082, 11.215763092041016, 11.943931579589844, 12.672098159790039, 13.40026569366455, 14.128433227539062, 14.856600761413574, 15.584768295288086, 16.31293487548828, 17.04110336303711, 17.769269943237305, 18.4974365234375, 19.225605010986328, 19.953773498535156, 20.68194007873535, 21.41010856628418, 22.138275146484375, 22.866443634033203, 23.5946102142334, 24.322776794433594, 25.050945281982422, 25.779111862182617]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 2.0, 20.0, 16.0, 25.0, 27.0, 38.0, 35.0, 41.0, 78.0, 65.0, 64.0, 78.0, 79.0, 69.0, 73.0, 58.0, 46.0, 38.0, 16.0, 24.0, 27.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 7.0, 2.0, 0.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.48828125, -2.412322998046875, -2.33636474609375, -2.260406494140625, -2.1844482421875, -2.108489990234375, -2.03253173828125, -1.956573486328125, -1.880615234375, -1.804656982421875, -1.72869873046875, -1.652740478515625, -1.5767822265625, -1.500823974609375, -1.42486572265625, -1.348907470703125, -1.27294921875, -1.196990966796875, -1.12103271484375, -1.045074462890625, -0.9691162109375, -0.893157958984375, -0.81719970703125, -0.741241455078125, -0.665283203125, -0.589324951171875, -0.51336669921875, -0.437408447265625, -0.3614501953125, -0.285491943359375, -0.20953369140625, -0.133575439453125, -0.0576171875, 0.018341064453125, 0.09429931640625, 0.170257568359375, 0.2462158203125, 0.322174072265625, 0.39813232421875, 0.474090576171875, 0.550048828125, 0.626007080078125, 0.70196533203125, 0.777923583984375, 0.8538818359375, 0.929840087890625, 1.00579833984375, 1.081756591796875, 1.15771484375, 1.233673095703125, 1.30963134765625, 1.385589599609375, 1.4615478515625, 1.537506103515625, 1.61346435546875, 1.689422607421875, 1.765380859375, 1.841339111328125, 1.91729736328125, 1.993255615234375, 2.0692138671875, 2.145172119140625, 2.22113037109375, 2.297088623046875, 2.373046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 23.0, 22.0, 31.0, 52.0, 78.0, 105.0, 180.0, 259.0, 354.0, 529.0, 688.0, 1059.0, 1599.0, 2636.0, 4389.0, 7694.0, 13621.0, 24996.0, 45265.0, 80637.0, 133014.0, 188047.0, 195447.0, 143753.0, 88556.0, 50514.0, 27767.0, 15328.0, 8477.0, 4911.0, 2960.0, 1812.0, 1196.0, 774.0, 536.0, 361.0, 257.0, 167.0, 113.0, 98.0, 74.0, 52.0, 29.0, 27.0, 17.0, 10.0, 4.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2919921875, -0.2831687927246094, -0.27434539794921875, -0.2655220031738281, -0.2566986083984375, -0.24787521362304688, -0.23905181884765625, -0.23022842407226562, -0.221405029296875, -0.21258163452148438, -0.20375823974609375, -0.19493484497070312, -0.1861114501953125, -0.17728805541992188, -0.16846466064453125, -0.15964126586914062, -0.15081787109375, -0.14199447631835938, -0.13317108154296875, -0.12434768676757812, -0.1155242919921875, -0.10670089721679688, -0.09787750244140625, -0.08905410766601562, -0.080230712890625, -0.07140731811523438, -0.06258392333984375, -0.053760528564453125, -0.0449371337890625, -0.036113739013671875, -0.02729034423828125, -0.018466949462890625, -0.0096435546875, -0.000820159912109375, 0.00800323486328125, 0.016826629638671875, 0.0256500244140625, 0.034473419189453125, 0.04329681396484375, 0.052120208740234375, 0.060943603515625, 0.06976699829101562, 0.07859039306640625, 0.08741378784179688, 0.0962371826171875, 0.10506057739257812, 0.11388397216796875, 0.12270736694335938, 0.13153076171875, 0.14035415649414062, 0.14917755126953125, 0.15800094604492188, 0.1668243408203125, 0.17564773559570312, 0.18447113037109375, 0.19329452514648438, 0.202117919921875, 0.21094131469726562, 0.21976470947265625, 0.22858810424804688, 0.2374114990234375, 0.24623489379882812, 0.25505828857421875, 0.2638816833496094, 0.272705078125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 11.0, 10.0, 16.0, 14.0, 13.0, 20.0, 17.0, 28.0, 30.0, 29.0, 20.0, 26.0, 34.0, 24.0, 39.0, 36.0, 40.0, 48.0, 1060.0, 39.0, 27.0, 35.0, 36.0, 40.0, 33.0, 41.0, 33.0, 28.0, 26.0, 20.0, 33.0, 11.0, 14.0, 9.0, 10.0, 17.0, 13.0, 11.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1357421875, -1.0997161865234375, -1.063690185546875, -1.0276641845703125, -0.99163818359375, -0.9556121826171875, -0.919586181640625, -0.8835601806640625, -0.8475341796875, -0.8115081787109375, -0.775482177734375, -0.7394561767578125, -0.70343017578125, -0.6674041748046875, -0.631378173828125, -0.5953521728515625, -0.559326171875, -0.5233001708984375, -0.487274169921875, -0.4512481689453125, -0.41522216796875, -0.3791961669921875, -0.343170166015625, -0.3071441650390625, -0.2711181640625, -0.2350921630859375, -0.199066162109375, -0.1630401611328125, -0.12701416015625, -0.0909881591796875, -0.054962158203125, -0.0189361572265625, 0.01708984375, 0.0531158447265625, 0.089141845703125, 0.1251678466796875, 0.16119384765625, 0.1972198486328125, 0.233245849609375, 0.2692718505859375, 0.3052978515625, 0.3413238525390625, 0.377349853515625, 0.4133758544921875, 0.44940185546875, 0.4854278564453125, 0.521453857421875, 0.5574798583984375, 0.593505859375, 0.6295318603515625, 0.665557861328125, 0.7015838623046875, 0.73760986328125, 0.7736358642578125, 0.809661865234375, 0.8456878662109375, 0.8817138671875, 0.9177398681640625, 0.953765869140625, 0.9897918701171875, 1.02581787109375, 1.0618438720703125, 1.097869873046875, 1.1338958740234375, 1.169921875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 5.0, 10.0, 15.0, 16.0, 35.0, 35.0, 43.0, 83.0, 113.0, 145.0, 248.0, 364.0, 508.0, 822.0, 1220.0, 1913.0, 3056.0, 4442.0, 7054.0, 11041.0, 17590.0, 27370.0, 43739.0, 67281.0, 106313.0, 189804.0, 657179.0, 516995.0, 167609.0, 97890.0, 63127.0, 40447.0, 25543.0, 16287.0, 10240.0, 6479.0, 4113.0, 2757.0, 1777.0, 1139.0, 731.0, 502.0, 349.0, 198.0, 155.0, 110.0, 76.0, 51.0, 34.0, 25.0, 24.0, 13.0, 7.0, 5.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.08447265625, -0.0817403793334961, -0.07900810241699219, -0.07627582550048828, -0.07354354858398438, -0.07081127166748047, -0.06807899475097656, -0.06534671783447266, -0.06261444091796875, -0.059882164001464844, -0.05714988708496094, -0.05441761016845703, -0.051685333251953125, -0.04895305633544922, -0.04622077941894531, -0.043488502502441406, -0.0407562255859375, -0.038023948669433594, -0.03529167175292969, -0.03255939483642578, -0.029827117919921875, -0.02709484100341797, -0.024362564086914062, -0.021630287170410156, -0.01889801025390625, -0.016165733337402344, -0.013433456420898438, -0.010701179504394531, -0.007968902587890625, -0.005236625671386719, -0.0025043487548828125, 0.00022792816162109375, 0.002960205078125, 0.005692481994628906, 0.008424758911132812, 0.011157035827636719, 0.013889312744140625, 0.01662158966064453, 0.019353866577148438, 0.022086143493652344, 0.02481842041015625, 0.027550697326660156, 0.030282974243164062, 0.03301525115966797, 0.035747528076171875, 0.03847980499267578, 0.04121208190917969, 0.043944358825683594, 0.0466766357421875, 0.049408912658691406, 0.05214118957519531, 0.05487346649169922, 0.057605743408203125, 0.06033802032470703, 0.06307029724121094, 0.06580257415771484, 0.06853485107421875, 0.07126712799072266, 0.07399940490722656, 0.07673168182373047, 0.07946395874023438, 0.08219623565673828, 0.08492851257324219, 0.0876607894897461, 0.09039306640625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 7.0, 10.0, 8.0, 14.0, 24.0, 26.0, 32.0, 31.0, 35.0, 41.0, 53.0, 70.0, 58.0, 51.0, 78.0, 68.0, 63.0, 59.0, 46.0, 39.0, 27.0, 20.0, 16.0, 15.0, 16.0, 15.0, 12.0, 7.0, 3.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0450439453125, -0.04358816146850586, -0.04213237762451172, -0.04067659378051758, -0.03922080993652344, -0.0377650260925293, -0.036309242248535156, -0.034853458404541016, -0.033397674560546875, -0.031941890716552734, -0.030486106872558594, -0.029030323028564453, -0.027574539184570312, -0.026118755340576172, -0.02466297149658203, -0.02320718765258789, -0.02175140380859375, -0.02029561996459961, -0.01883983612060547, -0.017384052276611328, -0.015928268432617188, -0.014472484588623047, -0.013016700744628906, -0.011560916900634766, -0.010105133056640625, -0.008649349212646484, -0.007193565368652344, -0.005737781524658203, -0.0042819976806640625, -0.002826213836669922, -0.0013704299926757812, 8.535385131835938e-05, 0.0015411376953125, 0.0029969215393066406, 0.004452705383300781, 0.005908489227294922, 0.0073642730712890625, 0.008820056915283203, 0.010275840759277344, 0.011731624603271484, 0.013187408447265625, 0.014643192291259766, 0.016098976135253906, 0.017554759979248047, 0.019010543823242188, 0.020466327667236328, 0.02192211151123047, 0.02337789535522461, 0.02483367919921875, 0.02628946304321289, 0.02774524688720703, 0.029201030731201172, 0.030656814575195312, 0.03211259841918945, 0.033568382263183594, 0.035024166107177734, 0.036479949951171875, 0.037935733795166016, 0.039391517639160156, 0.0408473014831543, 0.04230308532714844, 0.04375886917114258, 0.04521465301513672, 0.04667043685913086, 0.048126220703125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 7.0, 4.0, 3.0, 6.0, 7.0, 5.0, 9.0, 13.0, 14.0, 24.0, 19.0, 20.0, 29.0, 43.0, 54.0, 69.0, 79.0, 117.0, 129.0, 177.0, 258.0, 426.0, 1265.0, 901618.0, 141941.0, 847.0, 334.0, 275.0, 184.0, 109.0, 84.0, 79.0, 55.0, 42.0, 42.0, 34.0, 24.0, 22.0, 18.0, 15.0, 11.0, 6.0, 6.0, 9.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.85009765625, -0.8225860595703125, -0.795074462890625, -0.7675628662109375, -0.74005126953125, -0.7125396728515625, -0.685028076171875, -0.6575164794921875, -0.6300048828125, -0.6024932861328125, -0.574981689453125, -0.5474700927734375, -0.51995849609375, -0.4924468994140625, -0.464935302734375, -0.4374237060546875, -0.409912109375, -0.3824005126953125, -0.354888916015625, -0.3273773193359375, -0.29986572265625, -0.2723541259765625, -0.244842529296875, -0.2173309326171875, -0.1898193359375, -0.1623077392578125, -0.134796142578125, -0.1072845458984375, -0.07977294921875, -0.0522613525390625, -0.024749755859375, 0.0027618408203125, 0.0302734375, 0.0577850341796875, 0.085296630859375, 0.1128082275390625, 0.14031982421875, 0.1678314208984375, 0.195343017578125, 0.2228546142578125, 0.2503662109375, 0.2778778076171875, 0.305389404296875, 0.3329010009765625, 0.36041259765625, 0.3879241943359375, 0.415435791015625, 0.4429473876953125, 0.470458984375, 0.4979705810546875, 0.525482177734375, 0.5529937744140625, 0.58050537109375, 0.6080169677734375, 0.635528564453125, 0.6630401611328125, 0.6905517578125, 0.7180633544921875, 0.745574951171875, 0.7730865478515625, 0.80059814453125, 0.8281097412109375, 0.855621337890625, 0.8831329345703125, 0.91064453125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 13.0, 968.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203166961669922, -3.134596586227417, -3.066026210784912, -2.9974558353424072, -2.9288854598999023, -2.8603150844573975, -2.7917447090148926, -2.723174571990967, -2.654603958129883, -2.586033582687378, -2.517463207244873, -2.448892831802368, -2.3803224563598633, -2.3117520809173584, -2.2431817054748535, -2.1746115684509277, -2.106041193008423, -2.037470817565918, -1.968900442123413, -1.9003300666809082, -1.8317596912384033, -1.7631893157958984, -1.694619059562683, -1.6260486841201782, -1.5574783086776733, -1.4889079332351685, -1.4203375577926636, -1.3517671823501587, -1.2831969261169434, -1.2146265506744385, -1.1460561752319336, -1.0774857997894287, -1.0089151859283447, -0.9403448104858398, -0.871774435043335, -0.8032041192054749, -0.73463374376297, -0.6660633683204651, -0.597493052482605, -0.5289226770401001, -0.4603523015975952, -0.39178192615509033, -0.32321158051490784, -0.25464123487472534, -0.18607085943222046, -0.11750048398971558, -0.04893013834953308, 0.019640207290649414, 0.0882105827331543, 0.15678094327449799, 0.22535130381584167, 0.29392164945602417, 0.36249202489852905, 0.43106240034103394, 0.49963274598121643, 0.5682030916213989, 0.6367734670639038, 0.7053438425064087, 0.7739142179489136, 0.8424845337867737, 0.9110549092292786, 0.9796252846717834, 1.0481956005096436, 1.1167659759521484, 1.1853363513946533]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 7.0, 20.0, 20.0, 28.0, 33.0, 27.0, 53.0, 58.0, 70.0, 70.0, 68.0, 67.0, 63.0, 66.0, 69.0, 47.0, 45.0, 59.0, 30.0, 25.0, 16.0, 15.0, 12.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27271538972854614, -0.2627987563610077, -0.25288212299346924, -0.2429654747247696, -0.23304882645606995, -0.2231321930885315, -0.21321555972099304, -0.2032989263534546, -0.19338227808475494, -0.1834656447172165, -0.17354899644851685, -0.1636323630809784, -0.15371572971343994, -0.1437990814447403, -0.13388244807720184, -0.1239658072590828, -0.11404916644096375, -0.1041325256228447, -0.09421588480472565, -0.0842992514371872, -0.07438261061906815, -0.0644659698009491, -0.054549332708120346, -0.044632695615291595, -0.034716054797172546, -0.024799415841698647, -0.014882776886224747, -0.004966137930750847, 0.004950501024723053, 0.014867141842842102, 0.024783778935670853, 0.0347004160284996, 0.04461705684661865, 0.0545336976647377, 0.06445033848285675, 0.0743669718503952, 0.08428361266851425, 0.0942002534866333, 0.10411688685417175, 0.1140335276722908, 0.12395016849040985, 0.1338668018579483, 0.14378345012664795, 0.1537000834941864, 0.16361671686172485, 0.1735333651304245, 0.18344999849796295, 0.1933666467666626, 0.20328328013420105, 0.2131999135017395, 0.22311656177043915, 0.2330331951379776, 0.24294984340667725, 0.2528664767742157, 0.26278311014175415, 0.2726997435092926, 0.28261637687683105, 0.2925330102443695, 0.30244964361190796, 0.3123663067817688, 0.32228294014930725, 0.3321995735168457, 0.34211620688438416, 0.3520328402519226, 0.36194950342178345]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 10.0, 5.0, 9.0, 9.0, 13.0, 26.0, 28.0, 30.0, 39.0, 48.0, 68.0, 77.0, 73.0, 88.0, 77.0, 68.0, 63.0, 37.0, 48.0, 40.0, 26.0, 29.0, 18.0, 16.0, 7.0, 8.0, 10.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.365234375, -2.290771484375, -2.21630859375, -2.141845703125, -2.0673828125, -1.992919921875, -1.91845703125, -1.843994140625, -1.76953125, -1.695068359375, -1.62060546875, -1.546142578125, -1.4716796875, -1.397216796875, -1.32275390625, -1.248291015625, -1.173828125, -1.099365234375, -1.02490234375, -0.950439453125, -0.8759765625, -0.801513671875, -0.72705078125, -0.652587890625, -0.578125, -0.503662109375, -0.42919921875, -0.354736328125, -0.2802734375, -0.205810546875, -0.13134765625, -0.056884765625, 0.017578125, 0.092041015625, 0.16650390625, 0.240966796875, 0.3154296875, 0.389892578125, 0.46435546875, 0.538818359375, 0.61328125, 0.687744140625, 0.76220703125, 0.836669921875, 0.9111328125, 0.985595703125, 1.06005859375, 1.134521484375, 1.208984375, 1.283447265625, 1.35791015625, 1.432373046875, 1.5068359375, 1.581298828125, 1.65576171875, 1.730224609375, 1.8046875, 1.879150390625, 1.95361328125, 2.028076171875, 2.1025390625, 2.177001953125, 2.25146484375, 2.325927734375, 2.400390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 8.0, 16.0, 13.0, 14.0, 13.0, 22.0, 24.0, 35.0, 59.0, 48.0, 74.0, 93.0, 163.0, 223.0, 310.0, 528.0, 938.0, 1627.0, 3390.0, 8018.0, 25251.0, 112247.0, 486594.0, 319107.0, 62311.0, 15780.0, 5585.0, 2524.0, 1325.0, 760.0, 466.0, 278.0, 181.0, 129.0, 85.0, 72.0, 56.0, 41.0, 33.0, 25.0, 21.0, 9.0, 15.0, 11.0, 12.0, 10.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-5.796875, -5.61468505859375, -5.4324951171875, -5.25030517578125, -5.068115234375, -4.88592529296875, -4.7037353515625, -4.52154541015625, -4.33935546875, -4.15716552734375, -3.9749755859375, -3.79278564453125, -3.610595703125, -3.42840576171875, -3.2462158203125, -3.06402587890625, -2.8818359375, -2.69964599609375, -2.5174560546875, -2.33526611328125, -2.153076171875, -1.97088623046875, -1.7886962890625, -1.60650634765625, -1.42431640625, -1.24212646484375, -1.0599365234375, -0.87774658203125, -0.695556640625, -0.51336669921875, -0.3311767578125, -0.14898681640625, 0.033203125, 0.21539306640625, 0.3975830078125, 0.57977294921875, 0.761962890625, 0.94415283203125, 1.1263427734375, 1.30853271484375, 1.49072265625, 1.67291259765625, 1.8551025390625, 2.03729248046875, 2.219482421875, 2.40167236328125, 2.5838623046875, 2.76605224609375, 2.9482421875, 3.13043212890625, 3.3126220703125, 3.49481201171875, 3.677001953125, 3.85919189453125, 4.0413818359375, 4.22357177734375, 4.40576171875, 4.58795166015625, 4.7701416015625, 4.95233154296875, 5.134521484375, 5.31671142578125, 5.4989013671875, 5.68109130859375, 5.86328125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 10.0, 10.0, 9.0, 6.0, 22.0, 22.0, 25.0, 28.0, 39.0, 36.0, 37.0, 41.0, 53.0, 118.0, 191.0, 1410.0, 291.0, 165.0, 95.0, 60.0, 50.0, 49.0, 41.0, 27.0, 42.0, 36.0, 20.0, 18.0, 17.0, 12.0, 9.0, 6.0, 3.0, 11.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.6851806640625, -6.487548828125, -6.2899169921875, -6.09228515625, -5.8946533203125, -5.697021484375, -5.4993896484375, -5.3017578125, -5.1041259765625, -4.906494140625, -4.7088623046875, -4.51123046875, -4.3135986328125, -4.115966796875, -3.9183349609375, -3.720703125, -3.5230712890625, -3.325439453125, -3.1278076171875, -2.93017578125, -2.7325439453125, -2.534912109375, -2.3372802734375, -2.1396484375, -1.9420166015625, -1.744384765625, -1.5467529296875, -1.34912109375, -1.1514892578125, -0.953857421875, -0.7562255859375, -0.55859375, -0.3609619140625, -0.163330078125, 0.0343017578125, 0.23193359375, 0.4295654296875, 0.627197265625, 0.8248291015625, 1.0224609375, 1.2200927734375, 1.417724609375, 1.6153564453125, 1.81298828125, 2.0106201171875, 2.208251953125, 2.4058837890625, 2.603515625, 2.8011474609375, 2.998779296875, 3.1964111328125, 3.39404296875, 3.5916748046875, 3.789306640625, 3.9869384765625, 4.1845703125, 4.3822021484375, 4.579833984375, 4.7774658203125, 4.97509765625, 5.1727294921875, 5.370361328125, 5.5679931640625, 5.765625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 13.0, 14.0, 13.0, 21.0, 21.0, 25.0, 34.0, 30.0, 40.0, 32.0, 59.0, 111.0, 294.0, 1398.0, 270807.0, 2868173.0, 3746.0, 419.0, 132.0, 54.0, 39.0, 40.0, 29.0, 24.0, 21.0, 17.0, 18.0, 11.0, 11.0, 8.0, 5.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.6875, -23.869140625, -23.05078125, -22.232421875, -21.4140625, -20.595703125, -19.77734375, -18.958984375, -18.140625, -17.322265625, -16.50390625, -15.685546875, -14.8671875, -14.048828125, -13.23046875, -12.412109375, -11.59375, -10.775390625, -9.95703125, -9.138671875, -8.3203125, -7.501953125, -6.68359375, -5.865234375, -5.046875, -4.228515625, -3.41015625, -2.591796875, -1.7734375, -0.955078125, -0.13671875, 0.681640625, 1.5, 2.318359375, 3.13671875, 3.955078125, 4.7734375, 5.591796875, 6.41015625, 7.228515625, 8.046875, 8.865234375, 9.68359375, 10.501953125, 11.3203125, 12.138671875, 12.95703125, 13.775390625, 14.59375, 15.412109375, 16.23046875, 17.048828125, 17.8671875, 18.685546875, 19.50390625, 20.322265625, 21.140625, 21.958984375, 22.77734375, 23.595703125, 24.4140625, 25.232421875, 26.05078125, 26.869140625, 27.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [799.0, 220.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1745572090148926, 0.7899472713470459, 4.754451751708984, 8.718955993652344, 12.683460235595703, 16.647966384887695, 20.612470626831055, 24.576974868774414, 28.541479110717773, 32.505985260009766, 36.470489501953125, 40.434993743896484, 44.399497985839844, 48.3640022277832, 52.32850646972656, 56.29301071166992, 60.25751495361328, 64.2220230102539, 68.1865234375, 72.15103149414062, 76.11553192138672, 80.08003997802734, 84.04454040527344, 88.00904846191406, 91.97354888916016, 95.93805694580078, 99.90255737304688, 103.8670654296875, 107.8315658569336, 111.79607391357422, 115.76057434082031, 119.72508239746094, 123.68958282470703, 127.65409088134766, 131.61859130859375, 135.58309936523438, 139.547607421875, 143.51210021972656, 147.4766082763672, 151.4411163330078, 155.40562438964844, 159.37013244628906, 163.3346405029297, 167.29913330078125, 171.26364135742188, 175.2281494140625, 179.19265747070312, 183.1571502685547, 187.1216583251953, 191.08616638183594, 195.05067443847656, 199.01516723632812, 202.97967529296875, 206.94418334960938, 210.90869140625, 214.87318420410156, 218.8376922607422, 222.8022003173828, 226.76670837402344, 230.731201171875, 234.69570922851562, 238.66021728515625, 242.62472534179688, 246.58921813964844, 250.55372619628906]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 3.0, 9.0, 6.0, 8.0, 10.0, 18.0, 16.0, 17.0, 20.0, 16.0, 26.0, 26.0, 20.0, 32.0, 30.0, 23.0, 41.0, 32.0, 32.0, 24.0, 38.0, 43.0, 49.0, 47.0, 33.0, 34.0, 37.0, 38.0, 27.0, 26.0, 26.0, 29.0, 25.0, 19.0, 16.0, 21.0, 18.0, 6.0, 9.0, 13.0, 3.0, 6.0, 1.0, 7.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0], "bins": [-17.81157875061035, -17.274394989013672, -16.737211227416992, -16.20002555847168, -15.662841796875, -15.12565803527832, -14.58847427368164, -14.051290512084961, -13.514105796813965, -12.976922035217285, -12.439737319946289, -11.90255355834961, -11.36536979675293, -10.828185081481934, -10.291001319885254, -9.753816604614258, -9.216632843017578, -8.679449081420898, -8.142264366149902, -7.605080604553223, -7.067896366119385, -6.530712127685547, -5.993528366088867, -5.456344127655029, -4.919159889221191, -4.3819756507873535, -3.8447916507720947, -3.307607650756836, -2.770423412322998, -2.23323917388916, -1.6960551738739014, -1.1588711738586426, -0.6216869354248047, -0.08450281620025635, 0.452681303024292, 0.9898654222488403, 1.5270495414733887, 2.0642337799072266, 2.6014177799224854, 3.138601779937744, 3.675786018371582, 4.21297025680542, 4.750154495239258, 5.2873382568359375, 5.824522495269775, 6.361706733703613, 6.898890495300293, 7.436074733734131, 7.973258972167969, 8.510442733764648, 9.047627449035645, 9.584811210632324, 10.12199592590332, 10.6591796875, 11.19636344909668, 11.73354721069336, 12.270731925964355, 12.807915687561035, 13.345100402832031, 13.882284164428711, 14.41946792602539, 14.956652641296387, 15.493836402893066, 16.031021118164062, 16.568204879760742]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 9.0, 11.0, 13.0, 23.0, 20.0, 29.0, 38.0, 38.0, 50.0, 62.0, 57.0, 69.0, 76.0, 78.0, 73.0, 63.0, 57.0, 46.0, 39.0, 24.0, 17.0, 17.0, 17.0, 12.0, 13.0, 6.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.373779296875, -2.29638671875, -2.218994140625, -2.1416015625, -2.064208984375, -1.98681640625, -1.909423828125, -1.83203125, -1.754638671875, -1.67724609375, -1.599853515625, -1.5224609375, -1.445068359375, -1.36767578125, -1.290283203125, -1.212890625, -1.135498046875, -1.05810546875, -0.980712890625, -0.9033203125, -0.825927734375, -0.74853515625, -0.671142578125, -0.59375, -0.516357421875, -0.43896484375, -0.361572265625, -0.2841796875, -0.206787109375, -0.12939453125, -0.052001953125, 0.025390625, 0.102783203125, 0.18017578125, 0.257568359375, 0.3349609375, 0.412353515625, 0.48974609375, 0.567138671875, 0.64453125, 0.721923828125, 0.79931640625, 0.876708984375, 0.9541015625, 1.031494140625, 1.10888671875, 1.186279296875, 1.263671875, 1.341064453125, 1.41845703125, 1.495849609375, 1.5732421875, 1.650634765625, 1.72802734375, 1.805419921875, 1.8828125, 1.960205078125, 2.03759765625, 2.114990234375, 2.1923828125, 2.269775390625, 2.34716796875, 2.424560546875, 2.501953125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 10.0, 20.0, 25.0, 24.0, 41.0, 57.0, 74.0, 93.0, 170.0, 201.0, 317.0, 497.0, 854.0, 1394.0, 2638.0, 5949.0, 19532.0, 225744.0, 3661363.0, 244643.0, 18873.0, 5368.0, 2493.0, 1360.0, 861.0, 538.0, 362.0, 243.0, 188.0, 107.0, 87.0, 52.0, 32.0, 19.0, 12.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.390625, -12.009521484375, -11.62841796875, -11.247314453125, -10.8662109375, -10.485107421875, -10.10400390625, -9.722900390625, -9.341796875, -8.960693359375, -8.57958984375, -8.198486328125, -7.8173828125, -7.436279296875, -7.05517578125, -6.674072265625, -6.29296875, -5.911865234375, -5.53076171875, -5.149658203125, -4.7685546875, -4.387451171875, -4.00634765625, -3.625244140625, -3.244140625, -2.863037109375, -2.48193359375, -2.100830078125, -1.7197265625, -1.338623046875, -0.95751953125, -0.576416015625, -0.1953125, 0.185791015625, 0.56689453125, 0.947998046875, 1.3291015625, 1.710205078125, 2.09130859375, 2.472412109375, 2.853515625, 3.234619140625, 3.61572265625, 3.996826171875, 4.3779296875, 4.759033203125, 5.14013671875, 5.521240234375, 5.90234375, 6.283447265625, 6.66455078125, 7.045654296875, 7.4267578125, 7.807861328125, 8.18896484375, 8.570068359375, 8.951171875, 9.332275390625, 9.71337890625, 10.094482421875, 10.4755859375, 10.856689453125, 11.23779296875, 11.618896484375, 12.0]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 11.0, 5.0, 7.0, 12.0, 20.0, 37.0, 30.0, 50.0, 75.0, 138.0, 208.0, 345.0, 543.0, 693.0, 668.0, 442.0, 278.0, 169.0, 114.0, 79.0, 44.0, 42.0, 25.0, 14.0, 7.0, 8.0, 8.0, 1.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.75103759765625, -5.4747314453125, -5.19842529296875, -4.922119140625, -4.64581298828125, -4.3695068359375, -4.09320068359375, -3.81689453125, -3.54058837890625, -3.2642822265625, -2.98797607421875, -2.711669921875, -2.43536376953125, -2.1590576171875, -1.88275146484375, -1.6064453125, -1.33013916015625, -1.0538330078125, -0.77752685546875, -0.501220703125, -0.22491455078125, 0.0513916015625, 0.32769775390625, 0.60400390625, 0.88031005859375, 1.1566162109375, 1.43292236328125, 1.709228515625, 1.98553466796875, 2.2618408203125, 2.53814697265625, 2.814453125, 3.09075927734375, 3.3670654296875, 3.64337158203125, 3.919677734375, 4.19598388671875, 4.4722900390625, 4.74859619140625, 5.02490234375, 5.30120849609375, 5.5775146484375, 5.85382080078125, 6.130126953125, 6.40643310546875, 6.6827392578125, 6.95904541015625, 7.2353515625, 7.51165771484375, 7.7879638671875, 8.06427001953125, 8.340576171875, 8.61688232421875, 8.8931884765625, 9.16949462890625, 9.44580078125, 9.72210693359375, 9.9984130859375, 10.27471923828125, 10.551025390625, 10.82733154296875, 11.1036376953125, 11.37994384765625, 11.65625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 10.0, 9.0, 29.0, 28.0, 63.0, 166.0, 330.0, 657.0, 1409.0, 3201.0, 7237.0, 18603.0, 56246.0, 363438.0, 3029828.0, 602316.0, 73241.0, 21918.0, 8650.0, 3655.0, 1665.0, 788.0, 395.0, 202.0, 92.0, 60.0, 30.0, 10.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.477783203125, -10.03369140625, -9.589599609375, -9.1455078125, -8.701416015625, -8.25732421875, -7.813232421875, -7.369140625, -6.925048828125, -6.48095703125, -6.036865234375, -5.5927734375, -5.148681640625, -4.70458984375, -4.260498046875, -3.81640625, -3.372314453125, -2.92822265625, -2.484130859375, -2.0400390625, -1.595947265625, -1.15185546875, -0.707763671875, -0.263671875, 0.180419921875, 0.62451171875, 1.068603515625, 1.5126953125, 1.956787109375, 2.40087890625, 2.844970703125, 3.2890625, 3.733154296875, 4.17724609375, 4.621337890625, 5.0654296875, 5.509521484375, 5.95361328125, 6.397705078125, 6.841796875, 7.285888671875, 7.72998046875, 8.174072265625, 8.6181640625, 9.062255859375, 9.50634765625, 9.950439453125, 10.39453125, 10.838623046875, 11.28271484375, 11.726806640625, 12.1708984375, 12.614990234375, 13.05908203125, 13.503173828125, 13.947265625, 14.391357421875, 14.83544921875, 15.279541015625, 15.7236328125, 16.167724609375, 16.61181640625, 17.055908203125, 17.5]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 7.0, 10.0, 9.0, 24.0, 41.0, 68.0, 86.0, 126.0, 129.0, 145.0, 127.0, 74.0, 49.0, 46.0, 29.0, 8.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.53968048095703, -42.44634246826172, -41.35300827026367, -40.259674072265625, -39.16633605957031, -38.072998046875, -36.97966384887695, -35.886329650878906, -34.792991638183594, -33.69965362548828, -32.606319427490234, -31.512983322143555, -30.419647216796875, -29.326311111450195, -28.232975006103516, -27.139638900756836, -26.046302795410156, -24.952966690063477, -23.859630584716797, -22.766294479370117, -21.672958374023438, -20.579622268676758, -19.486286163330078, -18.3929500579834, -17.29961395263672, -16.20627784729004, -15.11294174194336, -14.01960563659668, -12.92626953125, -11.83293342590332, -10.73959732055664, -9.646261215209961, -8.552923202514648, -7.459587097167969, -6.366250991821289, -5.272914886474609, -4.17957878112793, -3.08624267578125, -1.9929065704345703, -0.8995704650878906, 0.19376564025878906, 1.2871017456054688, 2.3804378509521484, 3.473773956298828, 4.567110061645508, 5.6604461669921875, 6.753782272338867, 7.847118377685547, 8.940454483032227, 10.033790588378906, 11.127126693725586, 12.220462799072266, 13.313798904418945, 14.407135009765625, 15.500471115112305, 16.593807220458984, 17.687143325805664, 18.780479431152344, 19.873815536499023, 20.967151641845703, 22.060487747192383, 23.153823852539062, 24.247159957885742, 25.340496063232422, 26.4338321685791]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 2.0, 4.0, 10.0, 18.0, 10.0, 8.0, 22.0, 22.0, 17.0, 22.0, 42.0, 36.0, 42.0, 50.0, 44.0, 41.0, 38.0, 51.0, 45.0, 32.0, 51.0, 52.0, 40.0, 50.0, 24.0, 35.0, 24.0, 25.0, 22.0, 23.0, 12.0, 12.0, 18.0, 8.0, 7.0, 4.0, 7.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.514572143554688, -21.813264846801758, -21.111957550048828, -20.4106502532959, -19.70934295654297, -19.00803565979004, -18.30672836303711, -17.60542106628418, -16.90411376953125, -16.20280647277832, -15.50149917602539, -14.800191879272461, -14.098884582519531, -13.397577285766602, -12.696269989013672, -11.994962692260742, -11.293656349182129, -10.5923490524292, -9.89104175567627, -9.18973445892334, -8.48842716217041, -7.7871198654174805, -7.085813045501709, -6.384505748748779, -5.68319845199585, -4.98189115524292, -4.28058385848999, -3.5792768001556396, -2.87796950340271, -2.1766622066497803, -1.4753551483154297, -0.7740478515625, -0.07274055480957031, 0.6285666823387146, 1.3298739194869995, 2.0311810970306396, 2.7324883937835693, 3.433795690536499, 4.13510274887085, 4.836410045623779, 5.537717342376709, 6.239024639129639, 6.940331935882568, 7.64163875579834, 8.34294605255127, 9.0442533493042, 9.745560646057129, 10.446867942810059, 11.148175239562988, 11.849482536315918, 12.550789833068848, 13.252097129821777, 13.953404426574707, 14.654711723327637, 15.35601806640625, 16.05732536315918, 16.75863265991211, 17.45993995666504, 18.16124725341797, 18.8625545501709, 19.563861846923828, 20.265169143676758, 20.966476440429688, 21.667783737182617, 22.369091033935547]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 8.0, 19.0, 23.0, 15.0, 34.0, 27.0, 35.0, 53.0, 47.0, 59.0, 74.0, 50.0, 75.0, 57.0, 61.0, 53.0, 48.0, 50.0, 38.0, 28.0, 20.0, 22.0, 18.0, 12.0, 14.0, 4.0, 5.0, 4.0, 6.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.28350830078125, -2.2076416015625, -2.13177490234375, -2.055908203125, -1.98004150390625, -1.9041748046875, -1.82830810546875, -1.75244140625, -1.67657470703125, -1.6007080078125, -1.52484130859375, -1.448974609375, -1.37310791015625, -1.2972412109375, -1.22137451171875, -1.1455078125, -1.06964111328125, -0.9937744140625, -0.91790771484375, -0.842041015625, -0.76617431640625, -0.6903076171875, -0.61444091796875, -0.53857421875, -0.46270751953125, -0.3868408203125, -0.31097412109375, -0.235107421875, -0.15924072265625, -0.0833740234375, -0.00750732421875, 0.068359375, 0.14422607421875, 0.2200927734375, 0.29595947265625, 0.371826171875, 0.44769287109375, 0.5235595703125, 0.59942626953125, 0.67529296875, 0.75115966796875, 0.8270263671875, 0.90289306640625, 0.978759765625, 1.05462646484375, 1.1304931640625, 1.20635986328125, 1.2822265625, 1.35809326171875, 1.4339599609375, 1.50982666015625, 1.585693359375, 1.66156005859375, 1.7374267578125, 1.81329345703125, 1.88916015625, 1.96502685546875, 2.0408935546875, 2.11676025390625, 2.192626953125, 2.26849365234375, 2.3443603515625, 2.42022705078125, 2.49609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 11.0, 19.0, 30.0, 27.0, 50.0, 66.0, 110.0, 156.0, 233.0, 388.0, 666.0, 1260.0, 2572.0, 7066.0, 26771.0, 141302.0, 502101.0, 290828.0, 54975.0, 11991.0, 3944.0, 1734.0, 861.0, 532.0, 307.0, 176.0, 111.0, 81.0, 53.0, 33.0, 24.0, 17.0, 10.0, 8.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.1953125, -1.1627655029296875, -1.130218505859375, -1.0976715087890625, -1.06512451171875, -1.0325775146484375, -1.000030517578125, -0.9674835205078125, -0.9349365234375, -0.9023895263671875, -0.869842529296875, -0.8372955322265625, -0.80474853515625, -0.7722015380859375, -0.739654541015625, -0.7071075439453125, -0.674560546875, -0.6420135498046875, -0.609466552734375, -0.5769195556640625, -0.54437255859375, -0.5118255615234375, -0.479278564453125, -0.4467315673828125, -0.4141845703125, -0.3816375732421875, -0.349090576171875, -0.3165435791015625, -0.28399658203125, -0.2514495849609375, -0.218902587890625, -0.1863555908203125, -0.15380859375, -0.1212615966796875, -0.088714599609375, -0.0561676025390625, -0.02362060546875, 0.0089263916015625, 0.041473388671875, 0.0740203857421875, 0.1065673828125, 0.1391143798828125, 0.171661376953125, 0.2042083740234375, 0.23675537109375, 0.2693023681640625, 0.301849365234375, 0.3343963623046875, 0.366943359375, 0.3994903564453125, 0.432037353515625, 0.4645843505859375, 0.49713134765625, 0.5296783447265625, 0.562225341796875, 0.5947723388671875, 0.6273193359375, 0.6598663330078125, 0.692413330078125, 0.7249603271484375, 0.75750732421875, 0.7900543212890625, 0.822601318359375, 0.8551483154296875, 0.8876953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 13.0, 9.0, 11.0, 17.0, 13.0, 19.0, 17.0, 20.0, 28.0, 28.0, 33.0, 31.0, 42.0, 44.0, 52.0, 46.0, 36.0, 47.0, 1061.0, 39.0, 46.0, 43.0, 40.0, 30.0, 41.0, 21.0, 25.0, 25.0, 16.0, 29.0, 22.0, 9.0, 14.0, 17.0, 13.0, 10.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2377166748046875, -1.195159912109375, -1.1526031494140625, -1.11004638671875, -1.0674896240234375, -1.024932861328125, -0.9823760986328125, -0.9398193359375, -0.8972625732421875, -0.854705810546875, -0.8121490478515625, -0.76959228515625, -0.7270355224609375, -0.684478759765625, -0.6419219970703125, -0.599365234375, -0.5568084716796875, -0.514251708984375, -0.4716949462890625, -0.42913818359375, -0.3865814208984375, -0.344024658203125, -0.3014678955078125, -0.2589111328125, -0.2163543701171875, -0.173797607421875, -0.1312408447265625, -0.08868408203125, -0.0461273193359375, -0.003570556640625, 0.0389862060546875, 0.08154296875, 0.1240997314453125, 0.166656494140625, 0.2092132568359375, 0.25177001953125, 0.2943267822265625, 0.336883544921875, 0.3794403076171875, 0.4219970703125, 0.4645538330078125, 0.507110595703125, 0.5496673583984375, 0.59222412109375, 0.6347808837890625, 0.677337646484375, 0.7198944091796875, 0.762451171875, 0.8050079345703125, 0.847564697265625, 0.8901214599609375, 0.93267822265625, 0.9752349853515625, 1.017791748046875, 1.0603485107421875, 1.1029052734375, 1.1454620361328125, 1.188018798828125, 1.2305755615234375, 1.27313232421875, 1.3156890869140625, 1.358245849609375, 1.4008026123046875, 1.443359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 9.0, 9.0, 13.0, 16.0, 22.0, 25.0, 44.0, 69.0, 113.0, 208.0, 319.0, 679.0, 1485.0, 4044.0, 17240.0, 100425.0, 1280772.0, 593801.0, 77804.0, 13838.0, 3545.0, 1259.0, 569.0, 319.0, 171.0, 105.0, 71.0, 37.0, 25.0, 24.0, 17.0, 16.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.453125, -0.438934326171875, -0.42474365234375, -0.410552978515625, -0.3963623046875, -0.382171630859375, -0.36798095703125, -0.353790283203125, -0.339599609375, -0.325408935546875, -0.31121826171875, -0.297027587890625, -0.2828369140625, -0.268646240234375, -0.25445556640625, -0.240264892578125, -0.22607421875, -0.211883544921875, -0.19769287109375, -0.183502197265625, -0.1693115234375, -0.155120849609375, -0.14093017578125, -0.126739501953125, -0.112548828125, -0.098358154296875, -0.08416748046875, -0.069976806640625, -0.0557861328125, -0.041595458984375, -0.02740478515625, -0.013214111328125, 0.0009765625, 0.015167236328125, 0.02935791015625, 0.043548583984375, 0.0577392578125, 0.071929931640625, 0.08612060546875, 0.100311279296875, 0.114501953125, 0.128692626953125, 0.14288330078125, 0.157073974609375, 0.1712646484375, 0.185455322265625, 0.19964599609375, 0.213836669921875, 0.22802734375, 0.242218017578125, 0.25640869140625, 0.270599365234375, 0.2847900390625, 0.298980712890625, 0.31317138671875, 0.327362060546875, 0.341552734375, 0.355743408203125, 0.36993408203125, 0.384124755859375, 0.3983154296875, 0.412506103515625, 0.42669677734375, 0.440887451171875, 0.455078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 13.0, 20.0, 24.0, 39.0, 69.0, 290.0, 315.0, 89.0, 37.0, 20.0, 20.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0994873046875, -0.0961771011352539, -0.09286689758300781, -0.08955669403076172, -0.08624649047851562, -0.08293628692626953, -0.07962608337402344, -0.07631587982177734, -0.07300567626953125, -0.06969547271728516, -0.06638526916503906, -0.06307506561279297, -0.059764862060546875, -0.05645465850830078, -0.05314445495605469, -0.049834251403808594, -0.0465240478515625, -0.043213844299316406, -0.03990364074707031, -0.03659343719482422, -0.033283233642578125, -0.02997303009033203, -0.026662826538085938, -0.023352622985839844, -0.02004241943359375, -0.016732215881347656, -0.013422012329101562, -0.010111808776855469, -0.006801605224609375, -0.0034914016723632812, -0.0001811981201171875, 0.0031290054321289062, 0.006439208984375, 0.009749412536621094, 0.013059616088867188, 0.01636981964111328, 0.019680023193359375, 0.02299022674560547, 0.026300430297851562, 0.029610633850097656, 0.03292083740234375, 0.036231040954589844, 0.03954124450683594, 0.04285144805908203, 0.046161651611328125, 0.04947185516357422, 0.05278205871582031, 0.056092262268066406, 0.0594024658203125, 0.0627126693725586, 0.06602287292480469, 0.06933307647705078, 0.07264328002929688, 0.07595348358154297, 0.07926368713378906, 0.08257389068603516, 0.08588409423828125, 0.08919429779052734, 0.09250450134277344, 0.09581470489501953, 0.09912490844726562, 0.10243511199951172, 0.10574531555175781, 0.1090555191040039, 0.11236572265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 0.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 5.0, 5.0, 7.0, 2.0, 7.0, 7.0, 6.0, 9.0, 16.0, 12.0, 26.0, 46.0, 87.0, 117.0, 238.0, 2897.0, 990870.0, 52775.0, 898.0, 195.0, 98.0, 68.0, 28.0, 21.0, 9.0, 12.0, 11.0, 9.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7333984375, -1.6752777099609375, -1.617156982421875, -1.5590362548828125, -1.50091552734375, -1.4427947998046875, -1.384674072265625, -1.3265533447265625, -1.2684326171875, -1.2103118896484375, -1.152191162109375, -1.0940704345703125, -1.03594970703125, -0.9778289794921875, -0.919708251953125, -0.8615875244140625, -0.803466796875, -0.7453460693359375, -0.687225341796875, -0.6291046142578125, -0.57098388671875, -0.5128631591796875, -0.454742431640625, -0.3966217041015625, -0.3385009765625, -0.2803802490234375, -0.222259521484375, -0.1641387939453125, -0.10601806640625, -0.0478973388671875, 0.010223388671875, 0.0683441162109375, 0.12646484375, 0.1845855712890625, 0.242706298828125, 0.3008270263671875, 0.35894775390625, 0.4170684814453125, 0.475189208984375, 0.5333099365234375, 0.5914306640625, 0.6495513916015625, 0.707672119140625, 0.7657928466796875, 0.82391357421875, 0.8820343017578125, 0.940155029296875, 0.9982757568359375, 1.056396484375, 1.1145172119140625, 1.172637939453125, 1.2307586669921875, 1.28887939453125, 1.3470001220703125, 1.405120849609375, 1.4632415771484375, 1.5213623046875, 1.5794830322265625, 1.637603759765625, 1.6957244873046875, 1.75384521484375, 1.8119659423828125, 1.870086669921875, 1.9282073974609375, 1.986328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 45.0, 626.0, 334.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.3595519065856934, -2.3187954425811768, -2.27803897857666, -2.2372825145721436, -2.196526050567627, -2.1557698249816895, -2.115013360977173, -2.0742568969726562, -2.0335004329681396, -1.992743968963623, -1.9519875049591064, -1.9112311601638794, -1.8704746961593628, -1.8297182321548462, -1.7889617681503296, -1.7482054233551025, -1.707448959350586, -1.6666924953460693, -1.6259360313415527, -1.5851796865463257, -1.544423222541809, -1.5036667585372925, -1.4629102945327759, -1.4221539497375488, -1.3813973665237427, -1.340640902519226, -1.2998844385147095, -1.2591280937194824, -1.2183716297149658, -1.1776151657104492, -1.1368587017059326, -1.096102237701416, -1.055345892906189, -1.0145894289016724, -0.9738330245018005, -0.9330765604972839, -0.8923201560974121, -0.8515636920928955, -0.8108072280883789, -0.7700508236885071, -0.7292944192886353, -0.6885379552841187, -0.6477815508842468, -0.6070250868797302, -0.5662686824798584, -0.5255122184753418, -0.4847557842731476, -0.44399935007095337, -0.40324288606643677, -0.36248645186424255, -0.32173001766204834, -0.28097355365753174, -0.24021713435649872, -0.1994607001543045, -0.1587042510509491, -0.11794781684875488, -0.07719139754772186, -0.03643495962023735, 0.004321478307247162, 0.04507791996002197, 0.08583435416221619, 0.1265907883644104, 0.1673472374677658, 0.20810367166996002, 0.24886010587215424]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 4.0, 7.0, 4.0, 11.0, 14.0, 12.0, 5.0, 24.0, 22.0, 19.0, 30.0, 22.0, 33.0, 43.0, 40.0, 48.0, 48.0, 50.0, 52.0, 57.0, 42.0, 49.0, 52.0, 35.0, 43.0, 38.0, 32.0, 34.0, 24.0, 25.0, 24.0, 14.0, 10.0, 11.0, 12.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11557161808013916, -0.11079752445220947, -0.10602343082427979, -0.1012493371963501, -0.09647524356842041, -0.09170114994049072, -0.08692705631256104, -0.08215296268463135, -0.07737886905670166, -0.07260477542877197, -0.06783068180084229, -0.0630565881729126, -0.05828249454498291, -0.05350840091705322, -0.048734307289123535, -0.04396021366119385, -0.03918612003326416, -0.03441202640533447, -0.029637932777404785, -0.024863839149475098, -0.02008974552154541, -0.015315651893615723, -0.010541558265686035, -0.005767464637756348, -0.0009933710098266602, 0.0037807226181030273, 0.008554816246032715, 0.013328909873962402, 0.01810300350189209, 0.022877097129821777, 0.027651190757751465, 0.03242528438568115, 0.03719937801361084, 0.04197347164154053, 0.046747565269470215, 0.0515216588973999, 0.05629575252532959, 0.06106984615325928, 0.06584393978118896, 0.07061803340911865, 0.07539212703704834, 0.08016622066497803, 0.08494031429290771, 0.0897144079208374, 0.09448850154876709, 0.09926259517669678, 0.10403668880462646, 0.10881078243255615, 0.11358487606048584, 0.11835896968841553, 0.12313306331634521, 0.1279071569442749, 0.1326812505722046, 0.13745534420013428, 0.14222943782806396, 0.14700353145599365, 0.15177762508392334, 0.15655171871185303, 0.16132581233978271, 0.1660999059677124, 0.1708739995956421, 0.17564809322357178, 0.18042218685150146, 0.18519628047943115, 0.18997037410736084]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 9.0, 14.0, 13.0, 22.0, 26.0, 35.0, 46.0, 41.0, 68.0, 74.0, 74.0, 85.0, 61.0, 64.0, 61.0, 49.0, 47.0, 43.0, 27.0, 31.0, 17.0, 24.0, 7.0, 3.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.545867919921875, -2.46282958984375, -2.379791259765625, -2.2967529296875, -2.213714599609375, -2.13067626953125, -2.047637939453125, -1.964599609375, -1.881561279296875, -1.79852294921875, -1.715484619140625, -1.6324462890625, -1.549407958984375, -1.46636962890625, -1.383331298828125, -1.30029296875, -1.217254638671875, -1.13421630859375, -1.051177978515625, -0.9681396484375, -0.885101318359375, -0.80206298828125, -0.719024658203125, -0.635986328125, -0.552947998046875, -0.46990966796875, -0.386871337890625, -0.3038330078125, -0.220794677734375, -0.13775634765625, -0.054718017578125, 0.0283203125, 0.111358642578125, 0.19439697265625, 0.277435302734375, 0.3604736328125, 0.443511962890625, 0.52655029296875, 0.609588623046875, 0.692626953125, 0.775665283203125, 0.85870361328125, 0.941741943359375, 1.0247802734375, 1.107818603515625, 1.19085693359375, 1.273895263671875, 1.35693359375, 1.439971923828125, 1.52301025390625, 1.606048583984375, 1.6890869140625, 1.772125244140625, 1.85516357421875, 1.938201904296875, 2.021240234375, 2.104278564453125, 2.18731689453125, 2.270355224609375, 2.3533935546875, 2.436431884765625, 2.51947021484375, 2.602508544921875, 2.685546875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 12.0, 14.0, 15.0, 31.0, 42.0, 65.0, 102.0, 168.0, 347.0, 700.0, 1670.0, 4482.0, 14318.0, 54233.0, 199878.0, 421385.0, 251030.0, 71934.0, 18783.0, 5599.0, 2015.0, 848.0, 371.0, 200.0, 128.0, 64.0, 39.0, 27.0, 24.0, 13.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.72021484375, -2.6416015625, -2.56298828125, -2.484375, -2.40576171875, -2.3271484375, -2.24853515625, -2.169921875, -2.09130859375, -2.0126953125, -1.93408203125, -1.85546875, -1.77685546875, -1.6982421875, -1.61962890625, -1.541015625, -1.46240234375, -1.3837890625, -1.30517578125, -1.2265625, -1.14794921875, -1.0693359375, -0.99072265625, -0.912109375, -0.83349609375, -0.7548828125, -0.67626953125, -0.59765625, -0.51904296875, -0.4404296875, -0.36181640625, -0.283203125, -0.20458984375, -0.1259765625, -0.04736328125, 0.03125, 0.10986328125, 0.1884765625, 0.26708984375, 0.345703125, 0.42431640625, 0.5029296875, 0.58154296875, 0.66015625, 0.73876953125, 0.8173828125, 0.89599609375, 0.974609375, 1.05322265625, 1.1318359375, 1.21044921875, 1.2890625, 1.36767578125, 1.4462890625, 1.52490234375, 1.603515625, 1.68212890625, 1.7607421875, 1.83935546875, 1.91796875, 1.99658203125, 2.0751953125, 2.15380859375, 2.232421875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 9.0, 4.0, 5.0, 11.0, 6.0, 9.0, 15.0, 9.0, 18.0, 26.0, 26.0, 42.0, 32.0, 28.0, 34.0, 42.0, 45.0, 74.0, 153.0, 400.0, 1449.0, 159.0, 69.0, 40.0, 38.0, 46.0, 36.0, 29.0, 23.0, 22.0, 25.0, 21.0, 17.0, 21.0, 15.0, 9.0, 11.0, 10.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.59765625, -7.35272216796875, -7.1077880859375, -6.86285400390625, -6.617919921875, -6.37298583984375, -6.1280517578125, -5.88311767578125, -5.63818359375, -5.39324951171875, -5.1483154296875, -4.90338134765625, -4.658447265625, -4.41351318359375, -4.1685791015625, -3.92364501953125, -3.6787109375, -3.43377685546875, -3.1888427734375, -2.94390869140625, -2.698974609375, -2.45404052734375, -2.2091064453125, -1.96417236328125, -1.71923828125, -1.47430419921875, -1.2293701171875, -0.98443603515625, -0.739501953125, -0.49456787109375, -0.2496337890625, -0.00469970703125, 0.240234375, 0.48516845703125, 0.7301025390625, 0.97503662109375, 1.219970703125, 1.46490478515625, 1.7098388671875, 1.95477294921875, 2.19970703125, 2.44464111328125, 2.6895751953125, 2.93450927734375, 3.179443359375, 3.42437744140625, 3.6693115234375, 3.91424560546875, 4.1591796875, 4.40411376953125, 4.6490478515625, 4.89398193359375, 5.138916015625, 5.38385009765625, 5.6287841796875, 5.87371826171875, 6.11865234375, 6.36358642578125, 6.6085205078125, 6.85345458984375, 7.098388671875, 7.34332275390625, 7.5882568359375, 7.83319091796875, 8.078125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 8.0, 8.0, 17.0, 19.0, 16.0, 20.0, 22.0, 27.0, 21.0, 42.0, 47.0, 83.0, 165.0, 310.0, 846.0, 7815.0, 2794744.0, 337824.0, 2417.0, 557.0, 243.0, 112.0, 66.0, 41.0, 33.0, 41.0, 34.0, 18.0, 14.0, 12.0, 13.0, 11.0, 5.0, 9.0, 6.0, 3.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.0, -15.5267333984375, -15.053466796875, -14.5802001953125, -14.10693359375, -13.6336669921875, -13.160400390625, -12.6871337890625, -12.2138671875, -11.7406005859375, -11.267333984375, -10.7940673828125, -10.32080078125, -9.8475341796875, -9.374267578125, -8.9010009765625, -8.427734375, -7.9544677734375, -7.481201171875, -7.0079345703125, -6.53466796875, -6.0614013671875, -5.588134765625, -5.1148681640625, -4.6416015625, -4.1683349609375, -3.695068359375, -3.2218017578125, -2.74853515625, -2.2752685546875, -1.802001953125, -1.3287353515625, -0.85546875, -0.3822021484375, 0.091064453125, 0.5643310546875, 1.03759765625, 1.5108642578125, 1.984130859375, 2.4573974609375, 2.9306640625, 3.4039306640625, 3.877197265625, 4.3504638671875, 4.82373046875, 5.2969970703125, 5.770263671875, 6.2435302734375, 6.716796875, 7.1900634765625, 7.663330078125, 8.1365966796875, 8.60986328125, 9.0831298828125, 9.556396484375, 10.0296630859375, 10.5029296875, 10.9761962890625, 11.449462890625, 11.9227294921875, 12.39599609375, 12.8692626953125, 13.342529296875, 13.8157958984375, 14.2890625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 20.0, 843.0, 155.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.227604866027832, -4.560506820678711, -1.8934087753295898, 0.7736892700195312, 3.4407873153686523, 6.107885360717773, 8.774983406066895, 11.4420804977417, 14.109179496765137, 16.776277542114258, 19.443374633789062, 22.1104736328125, 24.777572631835938, 27.444669723510742, 30.111766815185547, 32.778865814208984, 35.44596481323242, 38.11306381225586, 40.78015899658203, 43.44725799560547, 46.114356994628906, 48.781455993652344, 51.44855499267578, 54.11565017700195, 56.78274917602539, 59.44984817504883, 62.116943359375, 64.78404235839844, 67.45114135742188, 70.11824035644531, 72.78533935546875, 75.45243835449219, 78.11953735351562, 80.78663635253906, 83.4537353515625, 86.12083435058594, 88.78793334960938, 91.45502471923828, 94.12212371826172, 96.78922271728516, 99.4563217163086, 102.12342071533203, 104.79051971435547, 107.4576187133789, 110.12471008300781, 112.79180908203125, 115.45890808105469, 118.12600708007812, 120.79310607910156, 123.460205078125, 126.12730407714844, 128.79440307617188, 131.4615020751953, 134.12860107421875, 136.7957000732422, 139.46279907226562, 142.1298828125, 144.79698181152344, 147.46408081054688, 150.1311798095703, 152.79827880859375, 155.4653778076172, 158.13247680664062, 160.799560546875, 163.4666748046875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 5.0, 7.0, 4.0, 4.0, 5.0, 12.0, 13.0, 17.0, 26.0, 30.0, 29.0, 35.0, 36.0, 25.0, 37.0, 37.0, 42.0, 39.0, 51.0, 42.0, 37.0, 47.0, 35.0, 34.0, 34.0, 33.0, 34.0, 29.0, 27.0, 21.0, 27.0, 14.0, 22.0, 18.0, 17.0, 10.0, 9.0, 6.0, 13.0, 2.0, 4.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.892179489135742, -23.12891387939453, -22.365650177001953, -21.602386474609375, -20.839120864868164, -20.075855255126953, -19.312591552734375, -18.549327850341797, -17.786062240600586, -17.022796630859375, -16.259532928466797, -15.496268272399902, -14.733003616333008, -13.969738960266113, -13.206474304199219, -12.443209648132324, -11.67994499206543, -10.916680335998535, -10.15341567993164, -9.390151023864746, -8.626886367797852, -7.863621711730957, -7.1003570556640625, -6.337092399597168, -5.573827743530273, -4.810563087463379, -4.047298431396484, -3.28403377532959, -2.5207691192626953, -1.7575044631958008, -0.9942398071289062, -0.23097515106201172, 0.5322914123535156, 1.2955560684204102, 2.0588207244873047, 2.822085380554199, 3.5853500366210938, 4.348614692687988, 5.111879348754883, 5.875144004821777, 6.638408660888672, 7.401673316955566, 8.164937973022461, 8.928202629089355, 9.69146728515625, 10.454731941223145, 11.217996597290039, 11.981261253356934, 12.744525909423828, 13.507790565490723, 14.271055221557617, 15.034319877624512, 15.797584533691406, 16.560848236083984, 17.324113845825195, 18.087379455566406, 18.850643157958984, 19.613906860351562, 20.377172470092773, 21.140438079833984, 21.903701782226562, 22.66696548461914, 23.43023109436035, 24.193496704101562, 24.95676040649414]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 10.0, 11.0, 7.0, 11.0, 21.0, 25.0, 31.0, 25.0, 55.0, 58.0, 64.0, 55.0, 69.0, 63.0, 67.0, 51.0, 52.0, 45.0, 55.0, 46.0, 26.0, 22.0, 28.0, 11.0, 15.0, 16.0, 8.0, 8.0, 3.0, 7.0, 0.0, 5.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.560546875, -2.482177734375, -2.40380859375, -2.325439453125, -2.2470703125, -2.168701171875, -2.09033203125, -2.011962890625, -1.93359375, -1.855224609375, -1.77685546875, -1.698486328125, -1.6201171875, -1.541748046875, -1.46337890625, -1.385009765625, -1.306640625, -1.228271484375, -1.14990234375, -1.071533203125, -0.9931640625, -0.914794921875, -0.83642578125, -0.758056640625, -0.6796875, -0.601318359375, -0.52294921875, -0.444580078125, -0.3662109375, -0.287841796875, -0.20947265625, -0.131103515625, -0.052734375, 0.025634765625, 0.10400390625, 0.182373046875, 0.2607421875, 0.339111328125, 0.41748046875, 0.495849609375, 0.57421875, 0.652587890625, 0.73095703125, 0.809326171875, 0.8876953125, 0.966064453125, 1.04443359375, 1.122802734375, 1.201171875, 1.279541015625, 1.35791015625, 1.436279296875, 1.5146484375, 1.593017578125, 1.67138671875, 1.749755859375, 1.828125, 1.906494140625, 1.98486328125, 2.063232421875, 2.1416015625, 2.219970703125, 2.29833984375, 2.376708984375, 2.455078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 2.0, 10.0, 14.0, 18.0, 33.0, 34.0, 60.0, 87.0, 120.0, 170.0, 261.0, 394.0, 645.0, 1038.0, 1950.0, 4315.0, 13351.0, 86669.0, 3221698.0, 813786.0, 34229.0, 8011.0, 3159.0, 1689.0, 922.0, 553.0, 360.0, 248.0, 144.0, 97.0, 80.0, 37.0, 28.0, 17.0, 14.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.625, -13.221923828125, -12.81884765625, -12.415771484375, -12.0126953125, -11.609619140625, -11.20654296875, -10.803466796875, -10.400390625, -9.997314453125, -9.59423828125, -9.191162109375, -8.7880859375, -8.385009765625, -7.98193359375, -7.578857421875, -7.17578125, -6.772705078125, -6.36962890625, -5.966552734375, -5.5634765625, -5.160400390625, -4.75732421875, -4.354248046875, -3.951171875, -3.548095703125, -3.14501953125, -2.741943359375, -2.3388671875, -1.935791015625, -1.53271484375, -1.129638671875, -0.7265625, -0.323486328125, 0.07958984375, 0.482666015625, 0.8857421875, 1.288818359375, 1.69189453125, 2.094970703125, 2.498046875, 2.901123046875, 3.30419921875, 3.707275390625, 4.1103515625, 4.513427734375, 4.91650390625, 5.319580078125, 5.72265625, 6.125732421875, 6.52880859375, 6.931884765625, 7.3349609375, 7.738037109375, 8.14111328125, 8.544189453125, 8.947265625, 9.350341796875, 9.75341796875, 10.156494140625, 10.5595703125, 10.962646484375, 11.36572265625, 11.768798828125, 12.171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 4.0, 9.0, 17.0, 14.0, 21.0, 27.0, 32.0, 38.0, 43.0, 63.0, 84.0, 118.0, 174.0, 259.0, 385.0, 508.0, 486.0, 464.0, 366.0, 251.0, 185.0, 136.0, 100.0, 51.0, 43.0, 38.0, 32.0, 21.0, 16.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.90234375, -5.70172119140625, -5.5010986328125, -5.30047607421875, -5.099853515625, -4.89923095703125, -4.6986083984375, -4.49798583984375, -4.29736328125, -4.09674072265625, -3.8961181640625, -3.69549560546875, -3.494873046875, -3.29425048828125, -3.0936279296875, -2.89300537109375, -2.6923828125, -2.49176025390625, -2.2911376953125, -2.09051513671875, -1.889892578125, -1.68927001953125, -1.4886474609375, -1.28802490234375, -1.08740234375, -0.88677978515625, -0.6861572265625, -0.48553466796875, -0.284912109375, -0.08428955078125, 0.1163330078125, 0.31695556640625, 0.517578125, 0.71820068359375, 0.9188232421875, 1.11944580078125, 1.320068359375, 1.52069091796875, 1.7213134765625, 1.92193603515625, 2.12255859375, 2.32318115234375, 2.5238037109375, 2.72442626953125, 2.925048828125, 3.12567138671875, 3.3262939453125, 3.52691650390625, 3.7275390625, 3.92816162109375, 4.1287841796875, 4.32940673828125, 4.530029296875, 4.73065185546875, 4.9312744140625, 5.13189697265625, 5.33251953125, 5.53314208984375, 5.7337646484375, 5.93438720703125, 6.135009765625, 6.33563232421875, 6.5362548828125, 6.73687744140625, 6.9375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 11.0, 13.0, 11.0, 23.0, 49.0, 56.0, 77.0, 110.0, 139.0, 238.0, 341.0, 500.0, 819.0, 1186.0, 1890.0, 2870.0, 4911.0, 7961.0, 14139.0, 27974.0, 69920.0, 276687.0, 1687007.0, 1686566.0, 277865.0, 69256.0, 28252.0, 14054.0, 8033.0, 4805.0, 2973.0, 1937.0, 1173.0, 815.0, 500.0, 322.0, 236.0, 177.0, 110.0, 79.0, 70.0, 53.0, 31.0, 12.0, 6.0, 15.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.453125, -9.15771484375, -8.8623046875, -8.56689453125, -8.271484375, -7.97607421875, -7.6806640625, -7.38525390625, -7.08984375, -6.79443359375, -6.4990234375, -6.20361328125, -5.908203125, -5.61279296875, -5.3173828125, -5.02197265625, -4.7265625, -4.43115234375, -4.1357421875, -3.84033203125, -3.544921875, -3.24951171875, -2.9541015625, -2.65869140625, -2.36328125, -2.06787109375, -1.7724609375, -1.47705078125, -1.181640625, -0.88623046875, -0.5908203125, -0.29541015625, 0.0, 0.29541015625, 0.5908203125, 0.88623046875, 1.181640625, 1.47705078125, 1.7724609375, 2.06787109375, 2.36328125, 2.65869140625, 2.9541015625, 3.24951171875, 3.544921875, 3.84033203125, 4.1357421875, 4.43115234375, 4.7265625, 5.02197265625, 5.3173828125, 5.61279296875, 5.908203125, 6.20361328125, 6.4990234375, 6.79443359375, 7.08984375, 7.38525390625, 7.6806640625, 7.97607421875, 8.271484375, 8.56689453125, 8.8623046875, 9.15771484375, 9.453125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 6.0, 9.0, 8.0, 7.0, 18.0, 18.0, 40.0, 32.0, 61.0, 92.0, 125.0, 114.0, 120.0, 83.0, 62.0, 53.0, 55.0, 27.0, 19.0, 14.0, 17.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-49.129119873046875, -48.05461502075195, -46.980106353759766, -45.905601501464844, -44.83109664916992, -43.756591796875, -42.68208312988281, -41.60757827758789, -40.53307342529297, -39.45856857299805, -38.38405990600586, -37.30955505371094, -36.235050201416016, -35.160545349121094, -34.086036682128906, -33.011531829833984, -31.937023162841797, -30.862516403198242, -29.78801155090332, -28.713504791259766, -27.638999938964844, -26.56449317932129, -25.489986419677734, -24.415481567382812, -23.340974807739258, -22.266468048095703, -21.19196319580078, -20.117456436157227, -19.042949676513672, -17.96844482421875, -16.893938064575195, -15.819432258605957, -14.744930267333984, -13.670424461364746, -12.595918655395508, -11.521411895751953, -10.446906089782715, -9.372400283813477, -8.297893524169922, -7.223387718200684, -6.148881912231445, -5.074376106262207, -3.9998698234558105, -2.925363779067993, -1.8508577346801758, -0.7763519287109375, 0.298154354095459, 1.3726606369018555, 2.4471664428710938, 3.521672487258911, 4.5961785316467285, 5.670684814453125, 6.745190620422363, 7.819696426391602, 8.894203186035156, 9.968708992004395, 11.043214797973633, 12.117720603942871, 13.19222640991211, 14.266733169555664, 15.341238975524902, 16.41574478149414, 17.490251541137695, 18.56475830078125, 19.639263153076172]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 9.0, 6.0, 8.0, 6.0, 12.0, 4.0, 9.0, 12.0, 18.0, 17.0, 29.0, 19.0, 34.0, 35.0, 36.0, 24.0, 38.0, 31.0, 41.0, 26.0, 34.0, 36.0, 40.0, 33.0, 46.0, 47.0, 35.0, 31.0, 27.0, 38.0, 33.0, 32.0, 22.0, 21.0, 21.0, 22.0, 15.0, 15.0, 12.0, 7.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.63003921508789, -20.947994232177734, -20.265947341918945, -19.58390235900879, -18.901857376098633, -18.219810485839844, -17.537765502929688, -16.85572052001953, -16.173675537109375, -15.491629600524902, -14.809584617614746, -14.127538681030273, -13.445493698120117, -12.763447761535645, -12.081401824951172, -11.399356842041016, -10.717309951782227, -10.035264015197754, -9.353219032287598, -8.671173095703125, -7.9891276359558105, -7.307082176208496, -6.625036239624023, -5.942990779876709, -5.2609453201293945, -4.57889986038208, -3.8968541622161865, -3.214808464050293, -2.5327630043029785, -1.850717544555664, -1.1686716079711914, -0.48662614822387695, 0.1954174041748047, 0.8774629831314087, 1.5595085620880127, 2.2415542602539062, 2.9235997200012207, 3.605645179748535, 4.287691116333008, 4.969736576080322, 5.651782035827637, 6.333827495574951, 7.015872955322266, 7.697918891906738, 8.379964828491211, 9.062009811401367, 9.74405574798584, 10.426101684570312, 11.108146667480469, 11.790192604064941, 12.472237586975098, 13.15428352355957, 13.836328506469727, 14.5183744430542, 15.200420379638672, 15.882465362548828, 16.564510345458984, 17.24655532836914, 17.92860221862793, 18.610647201538086, 19.292692184448242, 19.97473907470703, 20.656784057617188, 21.338829040527344, 22.020875930786133]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 6.0, 11.0, 20.0, 20.0, 20.0, 29.0, 35.0, 38.0, 48.0, 56.0, 44.0, 55.0, 75.0, 50.0, 66.0, 49.0, 51.0, 35.0, 41.0, 47.0, 38.0, 26.0, 23.0, 21.0, 11.0, 6.0, 13.0, 13.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.828125, -2.748443603515625, -2.66876220703125, -2.589080810546875, -2.5093994140625, -2.429718017578125, -2.35003662109375, -2.270355224609375, -2.190673828125, -2.110992431640625, -2.03131103515625, -1.951629638671875, -1.8719482421875, -1.792266845703125, -1.71258544921875, -1.632904052734375, -1.55322265625, -1.473541259765625, -1.39385986328125, -1.314178466796875, -1.2344970703125, -1.154815673828125, -1.07513427734375, -0.995452880859375, -0.915771484375, -0.836090087890625, -0.75640869140625, -0.676727294921875, -0.5970458984375, -0.517364501953125, -0.43768310546875, -0.358001708984375, -0.2783203125, -0.198638916015625, -0.11895751953125, -0.039276123046875, 0.0404052734375, 0.120086669921875, 0.19976806640625, 0.279449462890625, 0.359130859375, 0.438812255859375, 0.51849365234375, 0.598175048828125, 0.6778564453125, 0.757537841796875, 0.83721923828125, 0.916900634765625, 0.99658203125, 1.076263427734375, 1.15594482421875, 1.235626220703125, 1.3153076171875, 1.394989013671875, 1.47467041015625, 1.554351806640625, 1.634033203125, 1.713714599609375, 1.79339599609375, 1.873077392578125, 1.9527587890625, 2.032440185546875, 2.11212158203125, 2.191802978515625, 2.271484375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 11.0, 8.0, 22.0, 30.0, 34.0, 49.0, 73.0, 117.0, 164.0, 240.0, 413.0, 696.0, 1115.0, 1933.0, 3454.0, 6559.0, 12000.0, 23638.0, 47165.0, 94086.0, 170815.0, 245568.0, 202318.0, 115449.0, 59180.0, 29941.0, 15138.0, 8017.0, 4268.0, 2474.0, 1379.0, 797.0, 484.0, 283.0, 204.0, 125.0, 100.0, 60.0, 35.0, 38.0, 19.0, 17.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.453369140625, -0.43990325927734375, -0.4264373779296875, -0.41297149658203125, -0.399505615234375, -0.38603973388671875, -0.3725738525390625, -0.35910797119140625, -0.34564208984375, -0.33217620849609375, -0.3187103271484375, -0.30524444580078125, -0.291778564453125, -0.27831268310546875, -0.2648468017578125, -0.25138092041015625, -0.2379150390625, -0.22444915771484375, -0.2109832763671875, -0.19751739501953125, -0.184051513671875, -0.17058563232421875, -0.1571197509765625, -0.14365386962890625, -0.13018798828125, -0.11672210693359375, -0.1032562255859375, -0.08979034423828125, -0.076324462890625, -0.06285858154296875, -0.0493927001953125, -0.03592681884765625, -0.0224609375, -0.00899505615234375, 0.0044708251953125, 0.01793670654296875, 0.031402587890625, 0.04486846923828125, 0.0583343505859375, 0.07180023193359375, 0.08526611328125, 0.09873199462890625, 0.1121978759765625, 0.12566375732421875, 0.139129638671875, 0.15259552001953125, 0.1660614013671875, 0.17952728271484375, 0.1929931640625, 0.20645904541015625, 0.2199249267578125, 0.23339080810546875, 0.246856689453125, 0.26032257080078125, 0.2737884521484375, 0.28725433349609375, 0.30072021484375, 0.31418609619140625, 0.3276519775390625, 0.34111785888671875, 0.354583740234375, 0.36804962158203125, 0.3815155029296875, 0.39498138427734375, 0.408447265625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 6.0, 15.0, 21.0, 20.0, 15.0, 17.0, 29.0, 28.0, 33.0, 34.0, 40.0, 47.0, 38.0, 42.0, 28.0, 42.0, 1063.0, 42.0, 41.0, 36.0, 45.0, 35.0, 41.0, 29.0, 31.0, 29.0, 23.0, 21.0, 17.0, 19.0, 16.0, 9.0, 7.0, 3.0, 6.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3192291259765625, -1.274200439453125, -1.2291717529296875, -1.18414306640625, -1.1391143798828125, -1.094085693359375, -1.0490570068359375, -1.0040283203125, -0.9589996337890625, -0.913970947265625, -0.8689422607421875, -0.82391357421875, -0.7788848876953125, -0.733856201171875, -0.6888275146484375, -0.643798828125, -0.5987701416015625, -0.553741455078125, -0.5087127685546875, -0.46368408203125, -0.4186553955078125, -0.373626708984375, -0.3285980224609375, -0.2835693359375, -0.2385406494140625, -0.193511962890625, -0.1484832763671875, -0.10345458984375, -0.0584259033203125, -0.013397216796875, 0.0316314697265625, 0.07666015625, 0.1216888427734375, 0.166717529296875, 0.2117462158203125, 0.25677490234375, 0.3018035888671875, 0.346832275390625, 0.3918609619140625, 0.4368896484375, 0.4819183349609375, 0.526947021484375, 0.5719757080078125, 0.61700439453125, 0.6620330810546875, 0.707061767578125, 0.7520904541015625, 0.797119140625, 0.8421478271484375, 0.887176513671875, 0.9322052001953125, 0.97723388671875, 1.0222625732421875, 1.067291259765625, 1.1123199462890625, 1.1573486328125, 1.2023773193359375, 1.247406005859375, 1.2924346923828125, 1.33746337890625, 1.3824920654296875, 1.427520751953125, 1.4725494384765625, 1.517578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 7.0, 9.0, 8.0, 9.0, 12.0, 15.0, 26.0, 43.0, 48.0, 82.0, 111.0, 153.0, 263.0, 409.0, 626.0, 914.0, 1483.0, 2403.0, 3903.0, 6148.0, 10424.0, 17600.0, 30307.0, 52536.0, 90079.0, 155803.0, 643495.0, 699659.0, 159343.0, 91371.0, 53695.0, 30845.0, 18008.0, 10555.0, 6296.0, 3887.0, 2369.0, 1485.0, 930.0, 568.0, 391.0, 256.0, 163.0, 109.0, 72.0, 79.0, 50.0, 22.0, 21.0, 9.0, 11.0, 9.0, 6.0, 2.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.1326904296875, -0.12841224670410156, -0.12413406372070312, -0.11985588073730469, -0.11557769775390625, -0.11129951477050781, -0.10702133178710938, -0.10274314880371094, -0.0984649658203125, -0.09418678283691406, -0.08990859985351562, -0.08563041687011719, -0.08135223388671875, -0.07707405090332031, -0.07279586791992188, -0.06851768493652344, -0.064239501953125, -0.05996131896972656, -0.055683135986328125, -0.05140495300292969, -0.04712677001953125, -0.04284858703613281, -0.038570404052734375, -0.03429222106933594, -0.0300140380859375, -0.025735855102539062, -0.021457672119140625, -0.017179489135742188, -0.01290130615234375, -0.008623123168945312, -0.004344940185546875, -6.67572021484375e-05, 0.00421142578125, 0.008489608764648438, 0.012767791748046875, 0.017045974731445312, 0.02132415771484375, 0.025602340698242188, 0.029880523681640625, 0.03415870666503906, 0.0384368896484375, 0.04271507263183594, 0.046993255615234375, 0.05127143859863281, 0.05554962158203125, 0.05982780456542969, 0.06410598754882812, 0.06838417053222656, 0.072662353515625, 0.07694053649902344, 0.08121871948242188, 0.08549690246582031, 0.08977508544921875, 0.09405326843261719, 0.09833145141601562, 0.10260963439941406, 0.1068878173828125, 0.11116600036621094, 0.11544418334960938, 0.11972236633300781, 0.12400054931640625, 0.1282787322998047, 0.13255691528320312, 0.13683509826660156, 0.14111328125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 13.0, 33.0, 38.0, 73.0, 102.0, 173.0, 212.0, 136.0, 66.0, 54.0, 28.0, 19.0, 7.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.097900390625, -0.09546136856079102, -0.09302234649658203, -0.09058332443237305, -0.08814430236816406, -0.08570528030395508, -0.0832662582397461, -0.08082723617553711, -0.07838821411132812, -0.07594919204711914, -0.07351016998291016, -0.07107114791870117, -0.06863212585449219, -0.0661931037902832, -0.06375408172607422, -0.061315059661865234, -0.05887603759765625, -0.056437015533447266, -0.05399799346923828, -0.0515589714050293, -0.04911994934082031, -0.04668092727661133, -0.044241905212402344, -0.04180288314819336, -0.039363861083984375, -0.03692483901977539, -0.034485816955566406, -0.03204679489135742, -0.029607772827148438, -0.027168750762939453, -0.02472972869873047, -0.022290706634521484, -0.0198516845703125, -0.017412662506103516, -0.014973640441894531, -0.012534618377685547, -0.010095596313476562, -0.007656574249267578, -0.005217552185058594, -0.0027785301208496094, -0.000339508056640625, 0.0020995140075683594, 0.004538536071777344, 0.006977558135986328, 0.009416580200195312, 0.011855602264404297, 0.014294624328613281, 0.016733646392822266, 0.01917266845703125, 0.021611690521240234, 0.02405071258544922, 0.026489734649658203, 0.028928756713867188, 0.03136777877807617, 0.033806800842285156, 0.03624582290649414, 0.038684844970703125, 0.04112386703491211, 0.043562889099121094, 0.04600191116333008, 0.04844093322753906, 0.05087995529174805, 0.05331897735595703, 0.055757999420166016, 0.058197021484375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 2.0, 5.0, 3.0, 8.0, 5.0, 14.0, 13.0, 39.0, 50.0, 95.0, 208.0, 561.0, 5578.0, 1026558.0, 14068.0, 820.0, 268.0, 109.0, 65.0, 25.0, 17.0, 12.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.130645751953125, -1.08648681640625, -1.042327880859375, -0.9981689453125, -0.954010009765625, -0.90985107421875, -0.865692138671875, -0.821533203125, -0.777374267578125, -0.73321533203125, -0.689056396484375, -0.6448974609375, -0.600738525390625, -0.55657958984375, -0.512420654296875, -0.46826171875, -0.424102783203125, -0.37994384765625, -0.335784912109375, -0.2916259765625, -0.247467041015625, -0.20330810546875, -0.159149169921875, -0.114990234375, -0.070831298828125, -0.02667236328125, 0.017486572265625, 0.0616455078125, 0.105804443359375, 0.14996337890625, 0.194122314453125, 0.23828125, 0.282440185546875, 0.32659912109375, 0.370758056640625, 0.4149169921875, 0.459075927734375, 0.50323486328125, 0.547393798828125, 0.591552734375, 0.635711669921875, 0.67987060546875, 0.724029541015625, 0.7681884765625, 0.812347412109375, 0.85650634765625, 0.900665283203125, 0.94482421875, 0.988983154296875, 1.03314208984375, 1.077301025390625, 1.1214599609375, 1.165618896484375, 1.20977783203125, 1.253936767578125, 1.298095703125, 1.342254638671875, 1.38641357421875, 1.430572509765625, 1.4747314453125, 1.518890380859375, 1.56304931640625, 1.607208251953125, 1.6513671875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 12.0, 38.0, 269.0, 554.0, 116.0, 20.0, 5.0], "bins": [-1.0177274942398071, -1.0008455514907837, -0.9839636087417603, -0.9670816659927368, -0.9501997232437134, -0.9333177804946899, -0.9164358377456665, -0.8995538949966431, -0.8826719522476196, -0.8657900094985962, -0.8489080667495728, -0.8320261240005493, -0.8151441812515259, -0.7982622385025024, -0.781380295753479, -0.7644983530044556, -0.7476164102554321, -0.7307344675064087, -0.7138525247573853, -0.6969705820083618, -0.6800886392593384, -0.6632066965103149, -0.6463247537612915, -0.6294428110122681, -0.6125608682632446, -0.5956789255142212, -0.5787969827651978, -0.5619150400161743, -0.5450330972671509, -0.5281511545181274, -0.511269211769104, -0.49438726902008057, -0.47750529646873474, -0.4606233537197113, -0.44374141097068787, -0.42685946822166443, -0.409977525472641, -0.39309558272361755, -0.3762136399745941, -0.3593316972255707, -0.34244975447654724, -0.3255678117275238, -0.30868586897850037, -0.29180392622947693, -0.2749219834804535, -0.25804004073143005, -0.24115809798240662, -0.22427615523338318, -0.20739421248435974, -0.1905122697353363, -0.17363032698631287, -0.15674838423728943, -0.139866441488266, -0.12298449873924255, -0.10610255599021912, -0.08922061324119568, -0.07233867794275284, -0.0554567351937294, -0.03857479244470596, -0.021692849695682526, -0.004810906946659088, 0.01207103580236435, 0.028952978551387787, 0.045834921300411224, 0.06271686404943466]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 0.0, 4.0, 10.0, 11.0, 8.0, 6.0, 12.0, 18.0, 11.0, 29.0, 22.0, 26.0, 43.0, 34.0, 47.0, 35.0, 31.0, 46.0, 42.0, 54.0, 48.0, 44.0, 41.0, 40.0, 36.0, 33.0, 33.0, 35.0, 31.0, 32.0, 21.0, 22.0, 16.0, 21.0, 15.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06644558906555176, -0.06441766023635864, -0.062389735132455826, -0.06036181002855301, -0.058333881199359894, -0.05630595237016678, -0.05427802726626396, -0.052250102162361145, -0.05022217333316803, -0.048194244503974915, -0.0461663194000721, -0.04413839429616928, -0.042110465466976166, -0.04008253663778305, -0.038054611533880234, -0.03602668642997742, -0.0339987576007843, -0.031970828771591187, -0.02994290366768837, -0.027914976701140404, -0.025887049734592438, -0.023859122768044472, -0.021831195801496506, -0.01980326883494854, -0.017775341868400574, -0.015747414901852608, -0.013719487935304642, -0.011691560968756676, -0.00966363400220871, -0.007635707035660744, -0.005607780069112778, -0.0035798531025648117, -0.0015519261360168457, 0.0004760008305311203, 0.0025039277970790863, 0.004531854763627052, 0.006559781730175018, 0.008587708696722984, 0.01061563566327095, 0.012643562629818916, 0.014671489596366882, 0.01669941656291485, 0.018727343529462814, 0.02075527049601078, 0.022783197462558746, 0.024811124429106712, 0.02683905139565468, 0.028866978362202644, 0.03089490532875061, 0.032922834157943726, 0.03495075926184654, 0.03697868436574936, 0.039006613194942474, 0.04103454202413559, 0.043062467128038406, 0.04509039223194122, 0.04711832106113434, 0.049146249890327454, 0.05117417499423027, 0.05320210009813309, 0.0552300289273262, 0.05725795775651932, 0.059285882860422134, 0.06131380796432495, 0.06334173679351807]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 8.0, 9.0, 10.0, 8.0, 17.0, 17.0, 20.0, 29.0, 39.0, 39.0, 44.0, 40.0, 60.0, 55.0, 54.0, 59.0, 60.0, 60.0, 62.0, 50.0, 52.0, 29.0, 25.0, 33.0, 19.0, 21.0, 15.0, 17.0, 9.0, 10.0, 4.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.82421875, -2.744659423828125, -2.66510009765625, -2.585540771484375, -2.5059814453125, -2.426422119140625, -2.34686279296875, -2.267303466796875, -2.187744140625, -2.108184814453125, -2.02862548828125, -1.949066162109375, -1.8695068359375, -1.789947509765625, -1.71038818359375, -1.630828857421875, -1.55126953125, -1.471710205078125, -1.39215087890625, -1.312591552734375, -1.2330322265625, -1.153472900390625, -1.07391357421875, -0.994354248046875, -0.914794921875, -0.835235595703125, -0.75567626953125, -0.676116943359375, -0.5965576171875, -0.516998291015625, -0.43743896484375, -0.357879638671875, -0.2783203125, -0.198760986328125, -0.11920166015625, -0.039642333984375, 0.0399169921875, 0.119476318359375, 0.19903564453125, 0.278594970703125, 0.358154296875, 0.437713623046875, 0.51727294921875, 0.596832275390625, 0.6763916015625, 0.755950927734375, 0.83551025390625, 0.915069580078125, 0.99462890625, 1.074188232421875, 1.15374755859375, 1.233306884765625, 1.3128662109375, 1.392425537109375, 1.47198486328125, 1.551544189453125, 1.631103515625, 1.710662841796875, 1.79022216796875, 1.869781494140625, 1.9493408203125, 2.028900146484375, 2.10845947265625, 2.188018798828125, 2.267578125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 17.0, 16.0, 26.0, 38.0, 51.0, 65.0, 118.0, 180.0, 308.0, 511.0, 791.0, 1482.0, 2746.0, 5376.0, 11050.0, 23535.0, 54683.0, 136559.0, 324166.0, 284285.0, 115303.0, 47107.0, 20349.0, 9428.0, 4685.0, 2460.0, 1286.0, 749.0, 416.0, 269.0, 162.0, 108.0, 55.0, 43.0, 27.0, 25.0, 21.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.935546875, -1.8729248046875, -1.810302734375, -1.7476806640625, -1.68505859375, -1.6224365234375, -1.559814453125, -1.4971923828125, -1.4345703125, -1.3719482421875, -1.309326171875, -1.2467041015625, -1.18408203125, -1.1214599609375, -1.058837890625, -0.9962158203125, -0.93359375, -0.8709716796875, -0.808349609375, -0.7457275390625, -0.68310546875, -0.6204833984375, -0.557861328125, -0.4952392578125, -0.4326171875, -0.3699951171875, -0.307373046875, -0.2447509765625, -0.18212890625, -0.1195068359375, -0.056884765625, 0.0057373046875, 0.068359375, 0.1309814453125, 0.193603515625, 0.2562255859375, 0.31884765625, 0.3814697265625, 0.444091796875, 0.5067138671875, 0.5693359375, 0.6319580078125, 0.694580078125, 0.7572021484375, 0.81982421875, 0.8824462890625, 0.945068359375, 1.0076904296875, 1.0703125, 1.1329345703125, 1.195556640625, 1.2581787109375, 1.32080078125, 1.3834228515625, 1.446044921875, 1.5086669921875, 1.5712890625, 1.6339111328125, 1.696533203125, 1.7591552734375, 1.82177734375, 1.8843994140625, 1.947021484375, 2.0096435546875, 2.072265625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 10.0, 11.0, 11.0, 15.0, 8.0, 19.0, 13.0, 32.0, 23.0, 18.0, 37.0, 37.0, 46.0, 32.0, 38.0, 45.0, 74.0, 188.0, 1473.0, 351.0, 112.0, 77.0, 44.0, 31.0, 31.0, 40.0, 25.0, 16.0, 25.0, 22.0, 18.0, 18.0, 13.0, 8.0, 13.0, 7.0, 6.0, 5.0, 5.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.94140625, -6.70843505859375, -6.4754638671875, -6.24249267578125, -6.009521484375, -5.77655029296875, -5.5435791015625, -5.31060791015625, -5.07763671875, -4.84466552734375, -4.6116943359375, -4.37872314453125, -4.145751953125, -3.91278076171875, -3.6798095703125, -3.44683837890625, -3.2138671875, -2.98089599609375, -2.7479248046875, -2.51495361328125, -2.281982421875, -2.04901123046875, -1.8160400390625, -1.58306884765625, -1.35009765625, -1.11712646484375, -0.8841552734375, -0.65118408203125, -0.418212890625, -0.18524169921875, 0.0477294921875, 0.28070068359375, 0.513671875, 0.74664306640625, 0.9796142578125, 1.21258544921875, 1.445556640625, 1.67852783203125, 1.9114990234375, 2.14447021484375, 2.37744140625, 2.61041259765625, 2.8433837890625, 3.07635498046875, 3.309326171875, 3.54229736328125, 3.7752685546875, 4.00823974609375, 4.2412109375, 4.47418212890625, 4.7071533203125, 4.94012451171875, 5.173095703125, 5.40606689453125, 5.6390380859375, 5.87200927734375, 6.10498046875, 6.33795166015625, 6.5709228515625, 6.80389404296875, 7.036865234375, 7.26983642578125, 7.5028076171875, 7.73577880859375, 7.96875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 7.0, 8.0, 13.0, 4.0, 12.0, 10.0, 9.0, 27.0, 20.0, 28.0, 40.0, 50.0, 77.0, 120.0, 206.0, 409.0, 1062.0, 4832.0, 111716.0, 2917300.0, 102875.0, 4668.0, 1062.0, 437.0, 211.0, 121.0, 85.0, 65.0, 35.0, 27.0, 27.0, 20.0, 18.0, 13.0, 14.0, 7.0, 10.0, 13.0, 5.0, 4.0, 11.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.6015625, -12.2362060546875, -11.870849609375, -11.5054931640625, -11.14013671875, -10.7747802734375, -10.409423828125, -10.0440673828125, -9.6787109375, -9.3133544921875, -8.947998046875, -8.5826416015625, -8.21728515625, -7.8519287109375, -7.486572265625, -7.1212158203125, -6.755859375, -6.3905029296875, -6.025146484375, -5.6597900390625, -5.29443359375, -4.9290771484375, -4.563720703125, -4.1983642578125, -3.8330078125, -3.4676513671875, -3.102294921875, -2.7369384765625, -2.37158203125, -2.0062255859375, -1.640869140625, -1.2755126953125, -0.91015625, -0.5447998046875, -0.179443359375, 0.1859130859375, 0.55126953125, 0.9166259765625, 1.281982421875, 1.6473388671875, 2.0126953125, 2.3780517578125, 2.743408203125, 3.1087646484375, 3.47412109375, 3.8394775390625, 4.204833984375, 4.5701904296875, 4.935546875, 5.3009033203125, 5.666259765625, 6.0316162109375, 6.39697265625, 6.7623291015625, 7.127685546875, 7.4930419921875, 7.8583984375, 8.2237548828125, 8.589111328125, 8.9544677734375, 9.31982421875, 9.6851806640625, 10.050537109375, 10.4158935546875, 10.78125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 18.0, 237.0, 579.0, 175.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1631927490234375, -4.3653244972229, -2.5674564838409424, -0.7695884704589844, 1.0282797813415527, 2.82614803314209, 4.624015808105469, 6.421884536743164, 8.219752311706543, 10.017620086669922, 11.815488815307617, 13.613356590270996, 15.411224365234375, 17.20909309387207, 19.006961822509766, 20.804828643798828, 22.602697372436523, 24.40056610107422, 26.19843292236328, 27.996301651000977, 29.794170379638672, 31.592037200927734, 33.38990783691406, 35.187774658203125, 36.98564147949219, 38.78350830078125, 40.58137893676758, 42.37924575805664, 44.1771125793457, 45.97498321533203, 47.772850036621094, 49.570716857910156, 51.368587493896484, 53.16645431518555, 54.964324951171875, 56.76219177246094, 58.56005859375, 60.35792922973633, 62.15579605102539, 63.95366668701172, 65.75153350830078, 67.54940032958984, 69.3472671508789, 71.1451416015625, 72.94300842285156, 74.74087524414062, 76.53874206542969, 78.33660888671875, 80.13447570800781, 81.93234252929688, 83.73020935058594, 85.528076171875, 87.3259506225586, 89.12381744384766, 90.92168426513672, 92.71955108642578, 94.51742553710938, 96.31529235839844, 98.1131591796875, 99.91102600097656, 101.70890045166016, 103.50676727294922, 105.30463409423828, 107.10250091552734, 108.9003677368164]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 12.0, 12.0, 17.0, 13.0, 15.0, 20.0, 27.0, 29.0, 39.0, 46.0, 37.0, 51.0, 44.0, 49.0, 38.0, 49.0, 52.0, 41.0, 51.0, 39.0, 34.0, 41.0, 35.0, 34.0, 21.0, 22.0, 19.0, 20.0, 20.0, 19.0, 4.0, 14.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.071189880371094, -29.090368270874023, -28.109548568725586, -27.128726959228516, -26.147907257080078, -25.167085647583008, -24.18626594543457, -23.2054443359375, -22.224624633789062, -21.243803024291992, -20.262983322143555, -19.282161712646484, -18.301342010498047, -17.320520401000977, -16.33970069885254, -15.358879089355469, -14.378058433532715, -13.397237777709961, -12.416417121887207, -11.435596466064453, -10.4547758102417, -9.473955154418945, -8.493133544921875, -7.512313365936279, -6.531492710113525, -5.5506720542907715, -4.569851398468018, -3.5890305042266846, -2.6082098484039307, -1.6273889541625977, -0.6465682983398438, 0.33425235748291016, 1.315073013305664, 2.295893669128418, 3.276714324951172, 4.257534980773926, 5.23835563659668, 6.219176769256592, 7.199997425079346, 8.180818557739258, 9.161638259887695, 10.14245891571045, 11.123279571533203, 12.104100227355957, 13.084920883178711, 14.065742492675781, 15.046562194824219, 16.02738380432129, 17.00820541381836, 17.98902702331543, 18.969846725463867, 19.950668334960938, 20.931488037109375, 21.912309646606445, 22.893129348754883, 23.873950958251953, 24.85477066040039, 25.83559226989746, 26.8164119720459, 27.79723358154297, 28.778053283691406, 29.758874893188477, 30.739694595336914, 31.720516204833984, 32.70133590698242]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 5.0, 5.0, 10.0, 12.0, 18.0, 17.0, 29.0, 16.0, 30.0, 54.0, 63.0, 42.0, 51.0, 59.0, 58.0, 75.0, 69.0, 57.0, 47.0, 48.0, 48.0, 29.0, 24.0, 34.0, 19.0, 16.0, 8.0, 9.0, 11.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.07421875, -2.986602783203125, -2.89898681640625, -2.811370849609375, -2.7237548828125, -2.636138916015625, -2.54852294921875, -2.460906982421875, -2.373291015625, -2.285675048828125, -2.19805908203125, -2.110443115234375, -2.0228271484375, -1.935211181640625, -1.84759521484375, -1.759979248046875, -1.67236328125, -1.584747314453125, -1.49713134765625, -1.409515380859375, -1.3218994140625, -1.234283447265625, -1.14666748046875, -1.059051513671875, -0.971435546875, -0.883819580078125, -0.79620361328125, -0.708587646484375, -0.6209716796875, -0.533355712890625, -0.44573974609375, -0.358123779296875, -0.2705078125, -0.182891845703125, -0.09527587890625, -0.007659912109375, 0.0799560546875, 0.167572021484375, 0.25518798828125, 0.342803955078125, 0.430419921875, 0.518035888671875, 0.60565185546875, 0.693267822265625, 0.7808837890625, 0.868499755859375, 0.95611572265625, 1.043731689453125, 1.13134765625, 1.218963623046875, 1.30657958984375, 1.394195556640625, 1.4818115234375, 1.569427490234375, 1.65704345703125, 1.744659423828125, 1.832275390625, 1.919891357421875, 2.00750732421875, 2.095123291015625, 2.1827392578125, 2.270355224609375, 2.35797119140625, 2.445587158203125, 2.533203125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 3.0, 10.0, 11.0, 16.0, 20.0, 25.0, 21.0, 41.0, 48.0, 79.0, 103.0, 142.0, 192.0, 230.0, 419.0, 559.0, 878.0, 1456.0, 2711.0, 5585.0, 12975.0, 42369.0, 375638.0, 3240248.0, 440014.0, 45870.0, 12754.0, 5336.0, 2602.0, 1434.0, 871.0, 548.0, 354.0, 260.0, 139.0, 101.0, 69.0, 51.0, 32.0, 22.0, 12.0, 17.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.421875, -10.13653564453125, -9.8511962890625, -9.56585693359375, -9.280517578125, -8.99517822265625, -8.7098388671875, -8.42449951171875, -8.13916015625, -7.85382080078125, -7.5684814453125, -7.28314208984375, -6.997802734375, -6.71246337890625, -6.4271240234375, -6.14178466796875, -5.8564453125, -5.57110595703125, -5.2857666015625, -5.00042724609375, -4.715087890625, -4.42974853515625, -4.1444091796875, -3.85906982421875, -3.57373046875, -3.28839111328125, -3.0030517578125, -2.71771240234375, -2.432373046875, -2.14703369140625, -1.8616943359375, -1.57635498046875, -1.291015625, -1.00567626953125, -0.7203369140625, -0.43499755859375, -0.149658203125, 0.13568115234375, 0.4210205078125, 0.70635986328125, 0.99169921875, 1.27703857421875, 1.5623779296875, 1.84771728515625, 2.133056640625, 2.41839599609375, 2.7037353515625, 2.98907470703125, 3.2744140625, 3.55975341796875, 3.8450927734375, 4.13043212890625, 4.415771484375, 4.70111083984375, 4.9864501953125, 5.27178955078125, 5.55712890625, 5.84246826171875, 6.1278076171875, 6.41314697265625, 6.698486328125, 6.98382568359375, 7.2691650390625, 7.55450439453125, 7.83984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 10.0, 2.0, 13.0, 6.0, 9.0, 13.0, 14.0, 26.0, 23.0, 30.0, 43.0, 53.0, 65.0, 110.0, 150.0, 211.0, 276.0, 353.0, 466.0, 522.0, 427.0, 347.0, 236.0, 188.0, 121.0, 85.0, 65.0, 46.0, 43.0, 24.0, 22.0, 12.0, 9.0, 6.0, 10.0, 10.0, 10.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.359375, -6.1680908203125, -5.976806640625, -5.7855224609375, -5.59423828125, -5.4029541015625, -5.211669921875, -5.0203857421875, -4.8291015625, -4.6378173828125, -4.446533203125, -4.2552490234375, -4.06396484375, -3.8726806640625, -3.681396484375, -3.4901123046875, -3.298828125, -3.1075439453125, -2.916259765625, -2.7249755859375, -2.53369140625, -2.3424072265625, -2.151123046875, -1.9598388671875, -1.7685546875, -1.5772705078125, -1.385986328125, -1.1947021484375, -1.00341796875, -0.8121337890625, -0.620849609375, -0.4295654296875, -0.23828125, -0.0469970703125, 0.144287109375, 0.3355712890625, 0.52685546875, 0.7181396484375, 0.909423828125, 1.1007080078125, 1.2919921875, 1.4832763671875, 1.674560546875, 1.8658447265625, 2.05712890625, 2.2484130859375, 2.439697265625, 2.6309814453125, 2.822265625, 3.0135498046875, 3.204833984375, 3.3961181640625, 3.58740234375, 3.7786865234375, 3.969970703125, 4.1612548828125, 4.3525390625, 4.5438232421875, 4.735107421875, 4.9263916015625, 5.11767578125, 5.3089599609375, 5.500244140625, 5.6915283203125, 5.8828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 10.0, 30.0, 62.0, 62.0, 105.0, 181.0, 240.0, 420.0, 690.0, 1023.0, 1599.0, 2631.0, 4347.0, 7584.0, 14106.0, 30104.0, 81874.0, 362587.0, 1977363.0, 1363136.0, 232703.0, 60639.0, 24381.0, 11984.0, 6530.0, 3713.0, 2324.0, 1399.0, 843.0, 588.0, 347.0, 223.0, 159.0, 98.0, 76.0, 40.0, 26.0, 12.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.703125, -8.4117431640625, -8.120361328125, -7.8289794921875, -7.53759765625, -7.2462158203125, -6.954833984375, -6.6634521484375, -6.3720703125, -6.0806884765625, -5.789306640625, -5.4979248046875, -5.20654296875, -4.9151611328125, -4.623779296875, -4.3323974609375, -4.041015625, -3.7496337890625, -3.458251953125, -3.1668701171875, -2.87548828125, -2.5841064453125, -2.292724609375, -2.0013427734375, -1.7099609375, -1.4185791015625, -1.127197265625, -0.8358154296875, -0.54443359375, -0.2530517578125, 0.038330078125, 0.3297119140625, 0.62109375, 0.9124755859375, 1.203857421875, 1.4952392578125, 1.78662109375, 2.0780029296875, 2.369384765625, 2.6607666015625, 2.9521484375, 3.2435302734375, 3.534912109375, 3.8262939453125, 4.11767578125, 4.4090576171875, 4.700439453125, 4.9918212890625, 5.283203125, 5.5745849609375, 5.865966796875, 6.1573486328125, 6.44873046875, 6.7401123046875, 7.031494140625, 7.3228759765625, 7.6142578125, 7.9056396484375, 8.197021484375, 8.4884033203125, 8.77978515625, 9.0711669921875, 9.362548828125, 9.6539306640625, 9.9453125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 16.0, 23.0, 38.0, 52.0, 78.0, 107.0, 141.0, 130.0, 132.0, 103.0, 60.0, 47.0, 23.0, 18.0, 13.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.48488235473633, -39.05975341796875, -37.63462829589844, -36.20949935913086, -34.78437423706055, -33.35924530029297, -31.934118270874023, -30.508991241455078, -29.083864212036133, -27.658737182617188, -26.233610153198242, -24.808483123779297, -23.38335418701172, -21.958229064941406, -20.533100128173828, -19.107973098754883, -17.682846069335938, -16.257719039916992, -14.832592010498047, -13.407464027404785, -11.98233699798584, -10.557209968566895, -9.132081985473633, -7.7069549560546875, -6.281827926635742, -4.856700897216797, -3.4315733909606934, -2.00644588470459, -0.5813188552856445, 0.8438081741333008, 2.2689361572265625, 3.694063186645508, 5.1191864013671875, 6.544313430786133, 7.969440937042236, 9.39456844329834, 10.819695472717285, 12.24482250213623, 13.669950485229492, 15.095077514648438, 16.520204544067383, 17.945331573486328, 19.370458602905273, 20.79558563232422, 22.220714569091797, 23.64583969116211, 25.070968627929688, 26.496095657348633, 27.921222686767578, 29.346349716186523, 30.77147674560547, 32.19660568237305, 33.62173080444336, 35.04685974121094, 36.47198486328125, 37.89711380004883, 39.322242736816406, 40.747371673583984, 42.1724967956543, 43.597625732421875, 45.02275085449219, 46.447879791259766, 47.873008728027344, 49.298133850097656, 50.72325897216797]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 3.0, 19.0, 15.0, 21.0, 11.0, 15.0, 19.0, 18.0, 20.0, 28.0, 23.0, 25.0, 26.0, 41.0, 40.0, 30.0, 39.0, 44.0, 33.0, 27.0, 34.0, 38.0, 40.0, 36.0, 34.0, 28.0, 31.0, 32.0, 27.0, 20.0, 24.0, 24.0, 15.0, 22.0, 11.0, 16.0, 13.0, 10.0, 9.0, 3.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.371700286865234, -18.7717342376709, -18.171768188476562, -17.571802139282227, -16.97183609008789, -16.371870040893555, -15.771903038024902, -15.171936988830566, -14.57197093963623, -13.972004890441895, -13.372038841247559, -12.772072792053223, -12.17210578918457, -11.572139739990234, -10.972173690795898, -10.372207641601562, -9.772241592407227, -9.17227554321289, -8.572309494018555, -7.9723429679870605, -7.372376918792725, -6.772410869598389, -6.1724443435668945, -5.572478294372559, -4.972512245178223, -4.372546195983887, -3.7725799083709717, -3.1726136207580566, -2.5726475715637207, -1.9726815223693848, -1.3727152347564697, -0.7727489471435547, -0.17278480529785156, 0.4271813631057739, 1.0271475315093994, 1.627113699913025, 2.2270798683166504, 2.8270459175109863, 3.4270122051239014, 4.026978492736816, 4.626944541931152, 5.226910591125488, 5.826876640319824, 6.426843166351318, 7.026809215545654, 7.62677526473999, 8.226741790771484, 8.82670783996582, 9.426673889160156, 10.026639938354492, 10.626605987548828, 11.226572036743164, 11.8265380859375, 12.426504135131836, 13.026471138000488, 13.626437187194824, 14.22640323638916, 14.826369285583496, 15.426335334777832, 16.026302337646484, 16.62626838684082, 17.226234436035156, 17.826200485229492, 18.426166534423828, 19.026132583618164]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 4.0, 6.0, 10.0, 12.0, 13.0, 19.0, 17.0, 22.0, 25.0, 40.0, 45.0, 52.0, 46.0, 48.0, 50.0, 60.0, 54.0, 74.0, 65.0, 58.0, 54.0, 35.0, 36.0, 25.0, 23.0, 24.0, 24.0, 13.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.189453125, -3.0986328125, -3.0078125, -2.9169921875, -2.826171875, -2.7353515625, -2.64453125, -2.5537109375, -2.462890625, -2.3720703125, -2.28125, -2.1904296875, -2.099609375, -2.0087890625, -1.91796875, -1.8271484375, -1.736328125, -1.6455078125, -1.5546875, -1.4638671875, -1.373046875, -1.2822265625, -1.19140625, -1.1005859375, -1.009765625, -0.9189453125, -0.828125, -0.7373046875, -0.646484375, -0.5556640625, -0.46484375, -0.3740234375, -0.283203125, -0.1923828125, -0.1015625, -0.0107421875, 0.080078125, 0.1708984375, 0.26171875, 0.3525390625, 0.443359375, 0.5341796875, 0.625, 0.7158203125, 0.806640625, 0.8974609375, 0.98828125, 1.0791015625, 1.169921875, 1.2607421875, 1.3515625, 1.4423828125, 1.533203125, 1.6240234375, 1.71484375, 1.8056640625, 1.896484375, 1.9873046875, 2.078125, 2.1689453125, 2.259765625, 2.3505859375, 2.44140625, 2.5322265625, 2.623046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 15.0, 28.0, 42.0, 51.0, 76.0, 119.0, 159.0, 219.0, 309.0, 445.0, 658.0, 932.0, 1532.0, 2533.0, 5168.0, 12807.0, 37582.0, 126014.0, 356166.0, 333919.0, 112623.0, 33751.0, 11686.0, 4796.0, 2451.0, 1390.0, 945.0, 642.0, 440.0, 343.0, 219.0, 141.0, 98.0, 64.0, 47.0, 38.0, 29.0, 22.0, 7.0, 11.0, 10.0, 3.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330078125, -0.8051986694335938, -0.7773895263671875, -0.7495803833007812, -0.721771240234375, -0.6939620971679688, -0.6661529541015625, -0.6383438110351562, -0.61053466796875, -0.5827255249023438, -0.5549163818359375, -0.5271072387695312, -0.499298095703125, -0.47148895263671875, -0.4436798095703125, -0.41587066650390625, -0.3880615234375, -0.36025238037109375, -0.3324432373046875, -0.30463409423828125, -0.276824951171875, -0.24901580810546875, -0.2212066650390625, -0.19339752197265625, -0.16558837890625, -0.13777923583984375, -0.1099700927734375, -0.08216094970703125, -0.054351806640625, -0.02654266357421875, 0.0012664794921875, 0.02907562255859375, 0.056884765625, 0.08469390869140625, 0.1125030517578125, 0.14031219482421875, 0.168121337890625, 0.19593048095703125, 0.2237396240234375, 0.25154876708984375, 0.27935791015625, 0.30716705322265625, 0.3349761962890625, 0.36278533935546875, 0.390594482421875, 0.41840362548828125, 0.4462127685546875, 0.47402191162109375, 0.5018310546875, 0.5296401977539062, 0.5574493408203125, 0.5852584838867188, 0.613067626953125, 0.6408767700195312, 0.6686859130859375, 0.6964950561523438, 0.72430419921875, 0.7521133422851562, 0.7799224853515625, 0.8077316284179688, 0.835540771484375, 0.8633499145507812, 0.8911590576171875, 0.9189682006835938, 0.94677734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 9.0, 6.0, 6.0, 12.0, 15.0, 21.0, 15.0, 30.0, 36.0, 17.0, 39.0, 37.0, 63.0, 51.0, 45.0, 48.0, 1073.0, 46.0, 61.0, 40.0, 51.0, 40.0, 35.0, 37.0, 39.0, 31.0, 29.0, 23.0, 11.0, 18.0, 6.0, 4.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.16796875, -2.10772705078125, -2.0474853515625, -1.98724365234375, -1.927001953125, -1.86676025390625, -1.8065185546875, -1.74627685546875, -1.68603515625, -1.62579345703125, -1.5655517578125, -1.50531005859375, -1.445068359375, -1.38482666015625, -1.3245849609375, -1.26434326171875, -1.2041015625, -1.14385986328125, -1.0836181640625, -1.02337646484375, -0.963134765625, -0.90289306640625, -0.8426513671875, -0.78240966796875, -0.72216796875, -0.66192626953125, -0.6016845703125, -0.54144287109375, -0.481201171875, -0.42095947265625, -0.3607177734375, -0.30047607421875, -0.240234375, -0.17999267578125, -0.1197509765625, -0.05950927734375, 0.000732421875, 0.06097412109375, 0.1212158203125, 0.18145751953125, 0.24169921875, 0.30194091796875, 0.3621826171875, 0.42242431640625, 0.482666015625, 0.54290771484375, 0.6031494140625, 0.66339111328125, 0.7236328125, 0.78387451171875, 0.8441162109375, 0.90435791015625, 0.964599609375, 1.02484130859375, 1.0850830078125, 1.14532470703125, 1.20556640625, 1.26580810546875, 1.3260498046875, 1.38629150390625, 1.446533203125, 1.50677490234375, 1.5670166015625, 1.62725830078125, 1.6875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 12.0, 32.0, 37.0, 79.0, 136.0, 274.0, 547.0, 1247.0, 3223.0, 9989.0, 36664.0, 163265.0, 1365255.0, 400915.0, 85237.0, 20432.0, 5977.0, 2075.0, 841.0, 389.0, 204.0, 115.0, 67.0, 27.0, 24.0, 9.0, 6.0, 4.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.52392578125, -0.5104179382324219, -0.49691009521484375, -0.4834022521972656, -0.4698944091796875, -0.4563865661621094, -0.44287872314453125, -0.4293708801269531, -0.415863037109375, -0.4023551940917969, -0.38884735107421875, -0.3753395080566406, -0.3618316650390625, -0.3483238220214844, -0.33481597900390625, -0.3213081359863281, -0.30780029296875, -0.2942924499511719, -0.28078460693359375, -0.2672767639160156, -0.2537689208984375, -0.24026107788085938, -0.22675323486328125, -0.21324539184570312, -0.199737548828125, -0.18622970581054688, -0.17272186279296875, -0.15921401977539062, -0.1457061767578125, -0.13219833374023438, -0.11869049072265625, -0.10518264770507812, -0.0916748046875, -0.07816696166992188, -0.06465911865234375, -0.051151275634765625, -0.0376434326171875, -0.024135589599609375, -0.01062774658203125, 0.002880096435546875, 0.016387939453125, 0.029895782470703125, 0.04340362548828125, 0.056911468505859375, 0.0704193115234375, 0.08392715454101562, 0.09743499755859375, 0.11094284057617188, 0.12445068359375, 0.13795852661132812, 0.15146636962890625, 0.16497421264648438, 0.1784820556640625, 0.19198989868164062, 0.20549774169921875, 0.21900558471679688, 0.232513427734375, 0.24602127075195312, 0.25952911376953125, 0.2730369567871094, 0.2865447998046875, 0.3000526428222656, 0.31356048583984375, 0.3270683288574219, 0.340576171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 10.0, 11.0, 16.0, 39.0, 58.0, 125.0, 302.0, 203.0, 77.0, 42.0, 21.0, 14.0, 9.0, 3.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12810325622558594, -0.12363815307617188, -0.11917304992675781, -0.11470794677734375, -0.11024284362792969, -0.10577774047851562, -0.10131263732910156, -0.0968475341796875, -0.09238243103027344, -0.08791732788085938, -0.08345222473144531, -0.07898712158203125, -0.07452201843261719, -0.07005691528320312, -0.06559181213378906, -0.061126708984375, -0.05666160583496094, -0.052196502685546875, -0.04773139953613281, -0.04326629638671875, -0.03880119323730469, -0.034336090087890625, -0.029870986938476562, -0.0254058837890625, -0.020940780639648438, -0.016475677490234375, -0.012010574340820312, -0.00754547119140625, -0.0030803680419921875, 0.001384735107421875, 0.0058498382568359375, 0.01031494140625, 0.014780044555664062, 0.019245147705078125, 0.023710250854492188, 0.02817535400390625, 0.03264045715332031, 0.037105560302734375, 0.04157066345214844, 0.0460357666015625, 0.05050086975097656, 0.054965972900390625, 0.05943107604980469, 0.06389617919921875, 0.06836128234863281, 0.07282638549804688, 0.07729148864746094, 0.081756591796875, 0.08622169494628906, 0.09068679809570312, 0.09515190124511719, 0.09961700439453125, 0.10408210754394531, 0.10854721069335938, 0.11301231384277344, 0.1174774169921875, 0.12194252014160156, 0.12640762329101562, 0.1308727264404297, 0.13533782958984375, 0.1398029327392578, 0.14426803588867188, 0.14873313903808594, 0.1531982421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 4.0, 7.0, 13.0, 11.0, 6.0, 8.0, 9.0, 19.0, 20.0, 20.0, 28.0, 40.0, 40.0, 56.0, 89.0, 191.0, 665.0, 5964.0, 895583.0, 140441.0, 4326.0, 507.0, 149.0, 85.0, 47.0, 38.0, 34.0, 24.0, 14.0, 10.0, 12.0, 12.0, 14.0, 8.0, 9.0, 3.0, 14.0, 3.0, 6.0, 7.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.78515625, -1.727447509765625, -1.66973876953125, -1.612030029296875, -1.5543212890625, -1.496612548828125, -1.43890380859375, -1.381195068359375, -1.323486328125, -1.265777587890625, -1.20806884765625, -1.150360107421875, -1.0926513671875, -1.034942626953125, -0.97723388671875, -0.919525146484375, -0.86181640625, -0.804107666015625, -0.74639892578125, -0.688690185546875, -0.6309814453125, -0.573272705078125, -0.51556396484375, -0.457855224609375, -0.400146484375, -0.342437744140625, -0.28472900390625, -0.227020263671875, -0.1693115234375, -0.111602783203125, -0.05389404296875, 0.003814697265625, 0.0615234375, 0.119232177734375, 0.17694091796875, 0.234649658203125, 0.2923583984375, 0.350067138671875, 0.40777587890625, 0.465484619140625, 0.523193359375, 0.580902099609375, 0.63861083984375, 0.696319580078125, 0.7540283203125, 0.811737060546875, 0.86944580078125, 0.927154541015625, 0.98486328125, 1.042572021484375, 1.10028076171875, 1.157989501953125, 1.2156982421875, 1.273406982421875, 1.33111572265625, 1.388824462890625, 1.446533203125, 1.504241943359375, 1.56195068359375, 1.619659423828125, 1.6773681640625, 1.735076904296875, 1.79278564453125, 1.850494384765625, 1.908203125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 85.0, 830.0, 90.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.312405586242676, -3.25169038772583, -3.1909751892089844, -3.1302599906921387, -3.069544792175293, -3.0088295936584473, -2.9481143951416016, -2.8873989582061768, -2.826683759689331, -2.7659685611724854, -2.7052533626556396, -2.644538164138794, -2.5838229656219482, -2.5231075286865234, -2.4623923301696777, -2.401677131652832, -2.3409619331359863, -2.2802467346191406, -2.219531536102295, -2.158816337585449, -2.0981011390686035, -2.037385940551758, -1.9766706228256226, -1.9159554243087769, -1.8552403450012207, -1.794525146484375, -1.7338099479675293, -1.6730947494506836, -1.6123794317245483, -1.5516642332077026, -1.490949034690857, -1.4302338361740112, -1.3695183992385864, -1.3088032007217407, -1.248088002204895, -1.1873726844787598, -1.126657485961914, -1.0659422874450684, -1.0052270889282227, -0.944511890411377, -0.8837966322898865, -0.8230814337730408, -0.7623661756515503, -0.7016509771347046, -0.6409357786178589, -0.5802205204963684, -0.5195053219795227, -0.4587900936603546, -0.3980748653411865, -0.33735963702201843, -0.27664440870285034, -0.21592921018600464, -0.15521398186683655, -0.09449875354766846, -0.033783555030822754, 0.026931673288345337, 0.08764690160751343, 0.14836212992668152, 0.20907734334468842, 0.2697925567626953, 0.3305077850818634, 0.3912230134010315, 0.4519382119178772, 0.5126534700393677, 0.5733686685562134]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 7.0, 9.0, 8.0, 15.0, 11.0, 13.0, 27.0, 19.0, 21.0, 26.0, 32.0, 30.0, 37.0, 42.0, 37.0, 41.0, 43.0, 52.0, 44.0, 45.0, 53.0, 30.0, 35.0, 41.0, 49.0, 27.0, 39.0, 22.0, 28.0, 24.0, 9.0, 19.0, 9.0, 14.0, 10.0, 9.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20820069313049316, -0.20022165775299072, -0.19224262237548828, -0.18426358699798584, -0.1762845516204834, -0.16830551624298096, -0.1603264957666397, -0.15234746038913727, -0.14436842501163483, -0.13638938963413239, -0.12841035425662994, -0.1204313263297081, -0.11245229095220566, -0.10447325557470322, -0.09649422764778137, -0.08851519227027893, -0.08053615689277649, -0.07255712151527405, -0.0645780861377716, -0.05659905821084976, -0.04862002283334732, -0.04064098745584488, -0.032661955803632736, -0.024682924151420593, -0.016703888773918152, -0.00872485525906086, -0.0007458217442035675, 0.007233211770653725, 0.015212245285511017, 0.023191280663013458, 0.0311703123152256, 0.039149343967437744, 0.047128379344940186, 0.05510741472244263, 0.06308645009994507, 0.07106547802686691, 0.07904451340436935, 0.0870235487818718, 0.09500257670879364, 0.10298161208629608, 0.11096064746379852, 0.11893968284130096, 0.1269187182188034, 0.13489775359630585, 0.1428767740726471, 0.15085580945014954, 0.15883484482765198, 0.16681388020515442, 0.17479291558265686, 0.1827719509601593, 0.19075098633766174, 0.19873002171516418, 0.20670905709266663, 0.21468809247016907, 0.22266711294651031, 0.23064614832401276, 0.2386251837015152, 0.24660421907901764, 0.2545832395553589, 0.26256227493286133, 0.27054131031036377, 0.2785203456878662, 0.28649938106536865, 0.2944784164428711, 0.30245745182037354]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 4.0, 10.0, 17.0, 12.0, 15.0, 16.0, 19.0, 29.0, 41.0, 45.0, 50.0, 52.0, 49.0, 63.0, 58.0, 63.0, 65.0, 71.0, 48.0, 35.0, 36.0, 44.0, 26.0, 14.0, 39.0, 13.0, 12.0, 12.0, 7.0, 6.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.20703125, -3.115753173828125, -3.02447509765625, -2.933197021484375, -2.8419189453125, -2.750640869140625, -2.65936279296875, -2.568084716796875, -2.476806640625, -2.385528564453125, -2.29425048828125, -2.202972412109375, -2.1116943359375, -2.020416259765625, -1.92913818359375, -1.837860107421875, -1.74658203125, -1.655303955078125, -1.56402587890625, -1.472747802734375, -1.3814697265625, -1.290191650390625, -1.19891357421875, -1.107635498046875, -1.016357421875, -0.925079345703125, -0.83380126953125, -0.742523193359375, -0.6512451171875, -0.559967041015625, -0.46868896484375, -0.377410888671875, -0.2861328125, -0.194854736328125, -0.10357666015625, -0.012298583984375, 0.0789794921875, 0.170257568359375, 0.26153564453125, 0.352813720703125, 0.444091796875, 0.535369873046875, 0.62664794921875, 0.717926025390625, 0.8092041015625, 0.900482177734375, 0.99176025390625, 1.083038330078125, 1.17431640625, 1.265594482421875, 1.35687255859375, 1.448150634765625, 1.5394287109375, 1.630706787109375, 1.72198486328125, 1.813262939453125, 1.904541015625, 1.995819091796875, 2.08709716796875, 2.178375244140625, 2.2696533203125, 2.360931396484375, 2.45220947265625, 2.543487548828125, 2.634765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 10.0, 13.0, 20.0, 29.0, 41.0, 69.0, 114.0, 191.0, 302.0, 524.0, 847.0, 1506.0, 2860.0, 5233.0, 9992.0, 19761.0, 40236.0, 82778.0, 165972.0, 264770.0, 219617.0, 118463.0, 57311.0, 28091.0, 13885.0, 7216.0, 3903.0, 1981.0, 1171.0, 680.0, 339.0, 229.0, 149.0, 93.0, 45.0, 31.0, 21.0, 22.0, 13.0, 4.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2169036865234375, -1.175994873046875, -1.1350860595703125, -1.09417724609375, -1.0532684326171875, -1.012359619140625, -0.9714508056640625, -0.9305419921875, -0.8896331787109375, -0.848724365234375, -0.8078155517578125, -0.76690673828125, -0.7259979248046875, -0.685089111328125, -0.6441802978515625, -0.603271484375, -0.5623626708984375, -0.521453857421875, -0.4805450439453125, -0.43963623046875, -0.3987274169921875, -0.357818603515625, -0.3169097900390625, -0.2760009765625, -0.2350921630859375, -0.194183349609375, -0.1532745361328125, -0.11236572265625, -0.0714569091796875, -0.030548095703125, 0.0103607177734375, 0.05126953125, 0.0921783447265625, 0.133087158203125, 0.1739959716796875, 0.21490478515625, 0.2558135986328125, 0.296722412109375, 0.3376312255859375, 0.3785400390625, 0.4194488525390625, 0.460357666015625, 0.5012664794921875, 0.54217529296875, 0.5830841064453125, 0.623992919921875, 0.6649017333984375, 0.705810546875, 0.7467193603515625, 0.787628173828125, 0.8285369873046875, 0.86944580078125, 0.9103546142578125, 0.951263427734375, 0.9921722412109375, 1.0330810546875, 1.0739898681640625, 1.114898681640625, 1.1558074951171875, 1.19671630859375, 1.2376251220703125, 1.278533935546875, 1.3194427490234375, 1.3603515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 9.0, 6.0, 17.0, 13.0, 12.0, 18.0, 13.0, 31.0, 33.0, 32.0, 29.0, 42.0, 25.0, 32.0, 54.0, 64.0, 117.0, 1491.0, 428.0, 138.0, 61.0, 47.0, 48.0, 40.0, 37.0, 25.0, 32.0, 25.0, 17.0, 14.0, 18.0, 12.0, 7.0, 9.0, 11.0, 7.0, 7.0, 11.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.46875, -9.190185546875, -8.91162109375, -8.633056640625, -8.3544921875, -8.075927734375, -7.79736328125, -7.518798828125, -7.240234375, -6.961669921875, -6.68310546875, -6.404541015625, -6.1259765625, -5.847412109375, -5.56884765625, -5.290283203125, -5.01171875, -4.733154296875, -4.45458984375, -4.176025390625, -3.8974609375, -3.618896484375, -3.34033203125, -3.061767578125, -2.783203125, -2.504638671875, -2.22607421875, -1.947509765625, -1.6689453125, -1.390380859375, -1.11181640625, -0.833251953125, -0.5546875, -0.276123046875, 0.00244140625, 0.281005859375, 0.5595703125, 0.838134765625, 1.11669921875, 1.395263671875, 1.673828125, 1.952392578125, 2.23095703125, 2.509521484375, 2.7880859375, 3.066650390625, 3.34521484375, 3.623779296875, 3.90234375, 4.180908203125, 4.45947265625, 4.738037109375, 5.0166015625, 5.295166015625, 5.57373046875, 5.852294921875, 6.130859375, 6.409423828125, 6.68798828125, 6.966552734375, 7.2451171875, 7.523681640625, 7.80224609375, 8.080810546875, 8.359375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 8.0, 7.0, 11.0, 11.0, 6.0, 14.0, 16.0, 14.0, 16.0, 26.0, 38.0, 54.0, 82.0, 133.0, 183.0, 396.0, 1254.0, 10417.0, 1363460.0, 1755330.0, 11867.0, 1264.0, 432.0, 201.0, 115.0, 80.0, 51.0, 44.0, 44.0, 29.0, 7.0, 20.0, 15.0, 13.0, 13.0, 7.0, 7.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.9140625, -11.5172119140625, -11.120361328125, -10.7235107421875, -10.32666015625, -9.9298095703125, -9.532958984375, -9.1361083984375, -8.7392578125, -8.3424072265625, -7.945556640625, -7.5487060546875, -7.15185546875, -6.7550048828125, -6.358154296875, -5.9613037109375, -5.564453125, -5.1676025390625, -4.770751953125, -4.3739013671875, -3.97705078125, -3.5802001953125, -3.183349609375, -2.7864990234375, -2.3896484375, -1.9927978515625, -1.595947265625, -1.1990966796875, -0.80224609375, -0.4053955078125, -0.008544921875, 0.3883056640625, 0.78515625, 1.1820068359375, 1.578857421875, 1.9757080078125, 2.37255859375, 2.7694091796875, 3.166259765625, 3.5631103515625, 3.9599609375, 4.3568115234375, 4.753662109375, 5.1505126953125, 5.54736328125, 5.9442138671875, 6.341064453125, 6.7379150390625, 7.134765625, 7.5316162109375, 7.928466796875, 8.3253173828125, 8.72216796875, 9.1190185546875, 9.515869140625, 9.9127197265625, 10.3095703125, 10.7064208984375, 11.103271484375, 11.5001220703125, 11.89697265625, 12.2938232421875, 12.690673828125, 13.0875244140625, 13.484375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [150.0, 824.0, 44.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.514115810394287, -1.1807615756988525, 2.152592658996582, 5.485947132110596, 8.81930160522461, 12.152654647827148, 15.48600959777832, 18.81936264038086, 22.15271759033203, 25.486072540283203, 28.819425582885742, 32.15277862548828, 35.48613357543945, 38.819488525390625, 42.1528434753418, 45.48619842529297, 48.81955337524414, 52.15290832519531, 55.486263275146484, 58.819618225097656, 62.15296936035156, 65.486328125, 68.8196792602539, 72.15303039550781, 75.48638916015625, 78.81974029541016, 82.1530990600586, 85.4864501953125, 88.81980895996094, 92.15316009521484, 95.48651123046875, 98.81986999511719, 102.1532211303711, 105.486572265625, 108.81993103027344, 112.15328216552734, 115.48664093017578, 118.81999206542969, 122.15335083007812, 125.48670196533203, 128.82005310058594, 132.15341186523438, 135.48675537109375, 138.8201141357422, 142.15347290039062, 145.48681640625, 148.82017517089844, 152.15353393554688, 155.4868927001953, 158.82025146484375, 162.15359497070312, 165.48695373535156, 168.8203125, 172.15365600585938, 175.4870147705078, 178.82037353515625, 182.15371704101562, 185.48707580566406, 188.82041931152344, 192.15377807617188, 195.4871368408203, 198.82049560546875, 202.15383911132812, 205.48719787597656, 208.820556640625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 5.0, 6.0, 8.0, 10.0, 5.0, 11.0, 11.0, 24.0, 13.0, 21.0, 19.0, 12.0, 28.0, 28.0, 30.0, 30.0, 44.0, 33.0, 41.0, 45.0, 50.0, 40.0, 31.0, 48.0, 42.0, 51.0, 42.0, 44.0, 24.0, 39.0, 20.0, 24.0, 25.0, 17.0, 18.0, 15.0, 11.0, 10.0, 12.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.02629470825195, -31.104158401489258, -30.18202018737793, -29.259883880615234, -28.33774757385254, -27.41560935974121, -26.493473052978516, -25.571334838867188, -24.649198532104492, -23.727062225341797, -22.80492401123047, -21.882787704467773, -20.960651397705078, -20.03851318359375, -19.116376876831055, -18.19424057006836, -17.27210235595703, -16.349966049194336, -15.427828788757324, -14.505691528320312, -13.5835542678833, -12.661417007446289, -11.739280700683594, -10.817143440246582, -9.895008087158203, -8.972870826721191, -8.050734519958496, -7.128597259521484, -6.206459999084473, -5.284323215484619, -4.362186431884766, -3.440049171447754, -2.517911911010742, -1.5957748889923096, -0.6736379861831665, 0.24849891662597656, 1.1706359386444092, 2.092772960662842, 3.0149097442626953, 3.937047004699707, 4.8591837882995605, 5.781320571899414, 6.703457832336426, 7.625594615936279, 8.547731399536133, 9.469868659973145, 10.392005920410156, 11.314142227172852, 12.236279487609863, 13.158416748046875, 14.08055305480957, 15.002690315246582, 15.924827575683594, 16.84696388244629, 17.769100189208984, 18.691238403320312, 19.613374710083008, 20.535511016845703, 21.45764923095703, 22.379785537719727, 23.301921844482422, 24.22406005859375, 25.146196365356445, 26.06833267211914, 26.99047088623047]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 14.0, 10.0, 17.0, 18.0, 27.0, 35.0, 36.0, 41.0, 55.0, 51.0, 57.0, 74.0, 52.0, 78.0, 56.0, 64.0, 43.0, 53.0, 41.0, 25.0, 30.0, 21.0, 18.0, 15.0, 6.0, 5.0, 10.0, 5.0, 6.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.4296875, -3.333465576171875, -3.23724365234375, -3.141021728515625, -3.0447998046875, -2.948577880859375, -2.85235595703125, -2.756134033203125, -2.659912109375, -2.563690185546875, -2.46746826171875, -2.371246337890625, -2.2750244140625, -2.178802490234375, -2.08258056640625, -1.986358642578125, -1.89013671875, -1.793914794921875, -1.69769287109375, -1.601470947265625, -1.5052490234375, -1.409027099609375, -1.31280517578125, -1.216583251953125, -1.120361328125, -1.024139404296875, -0.92791748046875, -0.831695556640625, -0.7354736328125, -0.639251708984375, -0.54302978515625, -0.446807861328125, -0.3505859375, -0.254364013671875, -0.15814208984375, -0.061920166015625, 0.0343017578125, 0.130523681640625, 0.22674560546875, 0.322967529296875, 0.419189453125, 0.515411376953125, 0.61163330078125, 0.707855224609375, 0.8040771484375, 0.900299072265625, 0.99652099609375, 1.092742919921875, 1.18896484375, 1.285186767578125, 1.38140869140625, 1.477630615234375, 1.5738525390625, 1.670074462890625, 1.76629638671875, 1.862518310546875, 1.958740234375, 2.054962158203125, 2.15118408203125, 2.247406005859375, 2.3436279296875, 2.439849853515625, 2.53607177734375, 2.632293701171875, 2.728515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 15.0, 21.0, 28.0, 32.0, 55.0, 63.0, 106.0, 149.0, 269.0, 372.0, 718.0, 1372.0, 2944.0, 7574.0, 26969.0, 319520.0, 3481040.0, 312787.0, 26582.0, 7360.0, 2964.0, 1429.0, 772.0, 415.0, 241.0, 172.0, 87.0, 64.0, 40.0, 34.0, 17.0, 16.0, 5.0, 5.0, 10.0, 0.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.921875, -12.5772705078125, -12.232666015625, -11.8880615234375, -11.54345703125, -11.1988525390625, -10.854248046875, -10.5096435546875, -10.1650390625, -9.8204345703125, -9.475830078125, -9.1312255859375, -8.78662109375, -8.4420166015625, -8.097412109375, -7.7528076171875, -7.408203125, -7.0635986328125, -6.718994140625, -6.3743896484375, -6.02978515625, -5.6851806640625, -5.340576171875, -4.9959716796875, -4.6513671875, -4.3067626953125, -3.962158203125, -3.6175537109375, -3.27294921875, -2.9283447265625, -2.583740234375, -2.2391357421875, -1.89453125, -1.5499267578125, -1.205322265625, -0.8607177734375, -0.51611328125, -0.1715087890625, 0.173095703125, 0.5177001953125, 0.8623046875, 1.2069091796875, 1.551513671875, 1.8961181640625, 2.24072265625, 2.5853271484375, 2.929931640625, 3.2745361328125, 3.619140625, 3.9637451171875, 4.308349609375, 4.6529541015625, 4.99755859375, 5.3421630859375, 5.686767578125, 6.0313720703125, 6.3759765625, 6.7205810546875, 7.065185546875, 7.4097900390625, 7.75439453125, 8.0989990234375, 8.443603515625, 8.7882080078125, 9.1328125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 3.0, 5.0, 9.0, 9.0, 13.0, 20.0, 27.0, 31.0, 42.0, 73.0, 103.0, 165.0, 243.0, 375.0, 574.0, 628.0, 602.0, 391.0, 251.0, 179.0, 106.0, 70.0, 53.0, 31.0, 16.0, 16.0, 13.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.7763671875, -7.529296875, -7.2822265625, -7.03515625, -6.7880859375, -6.541015625, -6.2939453125, -6.046875, -5.7998046875, -5.552734375, -5.3056640625, -5.05859375, -4.8115234375, -4.564453125, -4.3173828125, -4.0703125, -3.8232421875, -3.576171875, -3.3291015625, -3.08203125, -2.8349609375, -2.587890625, -2.3408203125, -2.09375, -1.8466796875, -1.599609375, -1.3525390625, -1.10546875, -0.8583984375, -0.611328125, -0.3642578125, -0.1171875, 0.1298828125, 0.376953125, 0.6240234375, 0.87109375, 1.1181640625, 1.365234375, 1.6123046875, 1.859375, 2.1064453125, 2.353515625, 2.6005859375, 2.84765625, 3.0947265625, 3.341796875, 3.5888671875, 3.8359375, 4.0830078125, 4.330078125, 4.5771484375, 4.82421875, 5.0712890625, 5.318359375, 5.5654296875, 5.8125, 6.0595703125, 6.306640625, 6.5537109375, 6.80078125, 7.0478515625, 7.294921875, 7.5419921875, 7.7890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 11.0, 17.0, 30.0, 29.0, 61.0, 86.0, 111.0, 203.0, 300.0, 440.0, 673.0, 1117.0, 1770.0, 2790.0, 4886.0, 9201.0, 19526.0, 52595.0, 226103.0, 1407561.0, 1999877.0, 346244.0, 71669.0, 23945.0, 10811.0, 5778.0, 3234.0, 1947.0, 1164.0, 726.0, 470.0, 297.0, 214.0, 137.0, 80.0, 46.0, 38.0, 29.0, 20.0, 11.0, 13.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.640625, -8.353759765625, -8.06689453125, -7.780029296875, -7.4931640625, -7.206298828125, -6.91943359375, -6.632568359375, -6.345703125, -6.058837890625, -5.77197265625, -5.485107421875, -5.1982421875, -4.911376953125, -4.62451171875, -4.337646484375, -4.05078125, -3.763916015625, -3.47705078125, -3.190185546875, -2.9033203125, -2.616455078125, -2.32958984375, -2.042724609375, -1.755859375, -1.468994140625, -1.18212890625, -0.895263671875, -0.6083984375, -0.321533203125, -0.03466796875, 0.252197265625, 0.5390625, 0.825927734375, 1.11279296875, 1.399658203125, 1.6865234375, 1.973388671875, 2.26025390625, 2.547119140625, 2.833984375, 3.120849609375, 3.40771484375, 3.694580078125, 3.9814453125, 4.268310546875, 4.55517578125, 4.842041015625, 5.12890625, 5.415771484375, 5.70263671875, 5.989501953125, 6.2763671875, 6.563232421875, 6.85009765625, 7.136962890625, 7.423828125, 7.710693359375, 7.99755859375, 8.284423828125, 8.5712890625, 8.858154296875, 9.14501953125, 9.431884765625, 9.71875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 7.0, 23.0, 38.0, 81.0, 142.0, 222.0, 210.0, 136.0, 83.0, 33.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.362571716308594, -49.126522064208984, -46.890472412109375, -44.654422760009766, -42.418373107910156, -40.18232345581055, -37.94627380371094, -35.71022415161133, -33.47417449951172, -31.23812484741211, -29.0020751953125, -26.76602554321289, -24.52997589111328, -22.293926239013672, -20.057876586914062, -17.821826934814453, -15.585777282714844, -13.349727630615234, -11.113677978515625, -8.877628326416016, -6.641578674316406, -4.405529022216797, -2.1694793701171875, 0.06657028198242188, 2.3026199340820312, 4.538669586181641, 6.77471923828125, 9.01076889038086, 11.246818542480469, 13.482868194580078, 15.718917846679688, 17.954967498779297, 20.191017150878906, 22.427066802978516, 24.663116455078125, 26.899166107177734, 29.135215759277344, 31.371265411376953, 33.60731506347656, 35.84336471557617, 38.07941436767578, 40.31546401977539, 42.551513671875, 44.78756332397461, 47.02361297607422, 49.25966262817383, 51.49571228027344, 53.73176193237305, 55.967811584472656, 58.203861236572266, 60.439910888671875, 62.675960540771484, 64.9120101928711, 67.14805603027344, 69.38410949707031, 71.62016296386719, 73.85620880126953, 76.09225463867188, 78.32830810546875, 80.56436157226562, 82.80040740966797, 85.03645324707031, 87.27250671386719, 89.50856018066406, 91.7446060180664]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 10.0, 9.0, 16.0, 10.0, 19.0, 18.0, 19.0, 14.0, 28.0, 29.0, 16.0, 32.0, 34.0, 30.0, 35.0, 32.0, 22.0, 26.0, 43.0, 41.0, 40.0, 43.0, 43.0, 47.0, 37.0, 36.0, 24.0, 28.0, 25.0, 24.0, 25.0, 20.0, 17.0, 16.0, 14.0, 10.0, 5.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-18.91483497619629, -18.304473876953125, -17.694114685058594, -17.08375358581543, -16.4733943939209, -15.863033294677734, -15.252673149108887, -14.642313003540039, -14.031951904296875, -13.421591758728027, -12.81123161315918, -12.200870513916016, -11.590510368347168, -10.98015022277832, -10.369790077209473, -9.759429931640625, -9.149069786071777, -8.53870964050293, -7.928349018096924, -7.317988872528076, -6.70762825012207, -6.097268104553223, -5.486907958984375, -4.876547336578369, -4.2661871910095215, -3.6558268070220947, -3.045466423034668, -2.4351062774658203, -1.8247458934783936, -1.2143855094909668, -0.6040253639221191, 0.006335258483886719, 0.6166954040527344, 1.2270557880401611, 1.8374160528182983, 2.4477763175964355, 3.0581367015838623, 3.668497085571289, 4.278857231140137, 4.889217853546143, 5.49957799911499, 6.109938144683838, 6.720298767089844, 7.330658912658691, 7.941019058227539, 8.551380157470703, 9.161739349365234, 9.772100448608398, 10.382460594177246, 10.992820739746094, 11.603180885314941, 12.213541030883789, 12.823902130126953, 13.4342622756958, 14.044622421264648, 14.654983520507812, 15.265342712402344, 15.875702857971191, 16.48606300354004, 17.096424102783203, 17.706783294677734, 18.3171443939209, 18.927505493164062, 19.537864685058594, 20.148225784301758]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 14.0, 8.0, 13.0, 20.0, 27.0, 30.0, 26.0, 47.0, 44.0, 42.0, 39.0, 50.0, 64.0, 59.0, 50.0, 58.0, 61.0, 57.0, 50.0, 35.0, 33.0, 24.0, 32.0, 17.0, 16.0, 11.0, 11.0, 9.0, 12.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.2578125, -3.16693115234375, -3.0760498046875, -2.98516845703125, -2.894287109375, -2.80340576171875, -2.7125244140625, -2.62164306640625, -2.53076171875, -2.43988037109375, -2.3489990234375, -2.25811767578125, -2.167236328125, -2.07635498046875, -1.9854736328125, -1.89459228515625, -1.8037109375, -1.71282958984375, -1.6219482421875, -1.53106689453125, -1.440185546875, -1.34930419921875, -1.2584228515625, -1.16754150390625, -1.07666015625, -0.98577880859375, -0.8948974609375, -0.80401611328125, -0.713134765625, -0.62225341796875, -0.5313720703125, -0.44049072265625, -0.349609375, -0.25872802734375, -0.1678466796875, -0.07696533203125, 0.013916015625, 0.10479736328125, 0.1956787109375, 0.28656005859375, 0.37744140625, 0.46832275390625, 0.5592041015625, 0.65008544921875, 0.740966796875, 0.83184814453125, 0.9227294921875, 1.01361083984375, 1.1044921875, 1.19537353515625, 1.2862548828125, 1.37713623046875, 1.468017578125, 1.55889892578125, 1.6497802734375, 1.74066162109375, 1.83154296875, 1.92242431640625, 2.0133056640625, 2.10418701171875, 2.195068359375, 2.28594970703125, 2.3768310546875, 2.46771240234375, 2.55859375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 21.0, 20.0, 32.0, 48.0, 79.0, 122.0, 182.0, 285.0, 464.0, 699.0, 1166.0, 1882.0, 3182.0, 5323.0, 9202.0, 16091.0, 27456.0, 47664.0, 81019.0, 133160.0, 190868.0, 192461.0, 136966.0, 83297.0, 49046.0, 28094.0, 16165.0, 9541.0, 5532.0, 3213.0, 2023.0, 1181.0, 752.0, 489.0, 255.0, 183.0, 137.0, 82.0, 56.0, 28.0, 22.0, 19.0, 8.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.467529296875, -0.45378875732421875, -0.4400482177734375, -0.42630767822265625, -0.412567138671875, -0.39882659912109375, -0.3850860595703125, -0.37134552001953125, -0.35760498046875, -0.34386444091796875, -0.3301239013671875, -0.31638336181640625, -0.302642822265625, -0.28890228271484375, -0.2751617431640625, -0.26142120361328125, -0.2476806640625, -0.23394012451171875, -0.2201995849609375, -0.20645904541015625, -0.192718505859375, -0.17897796630859375, -0.1652374267578125, -0.15149688720703125, -0.13775634765625, -0.12401580810546875, -0.1102752685546875, -0.09653472900390625, -0.082794189453125, -0.06905364990234375, -0.0553131103515625, -0.04157257080078125, -0.02783203125, -0.01409149169921875, -0.0003509521484375, 0.01338958740234375, 0.027130126953125, 0.04087066650390625, 0.0546112060546875, 0.06835174560546875, 0.08209228515625, 0.09583282470703125, 0.1095733642578125, 0.12331390380859375, 0.137054443359375, 0.15079498291015625, 0.1645355224609375, 0.17827606201171875, 0.1920166015625, 0.20575714111328125, 0.2194976806640625, 0.23323822021484375, 0.246978759765625, 0.26071929931640625, 0.2744598388671875, 0.28820037841796875, 0.30194091796875, 0.31568145751953125, 0.3294219970703125, 0.34316253662109375, 0.356903076171875, 0.37064361572265625, 0.3843841552734375, 0.39812469482421875, 0.411865234375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 6.0, 8.0, 9.0, 13.0, 13.0, 14.0, 14.0, 14.0, 14.0, 18.0, 20.0, 28.0, 26.0, 28.0, 30.0, 39.0, 40.0, 42.0, 31.0, 41.0, 39.0, 1055.0, 26.0, 47.0, 33.0, 40.0, 31.0, 29.0, 34.0, 32.0, 25.0, 24.0, 38.0, 15.0, 12.0, 18.0, 11.0, 10.0, 5.0, 13.0, 10.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.611328125, -1.5611419677734375, -1.510955810546875, -1.4607696533203125, -1.41058349609375, -1.3603973388671875, -1.310211181640625, -1.2600250244140625, -1.2098388671875, -1.1596527099609375, -1.109466552734375, -1.0592803955078125, -1.00909423828125, -0.9589080810546875, -0.908721923828125, -0.8585357666015625, -0.808349609375, -0.7581634521484375, -0.707977294921875, -0.6577911376953125, -0.60760498046875, -0.5574188232421875, -0.507232666015625, -0.4570465087890625, -0.4068603515625, -0.3566741943359375, -0.306488037109375, -0.2563018798828125, -0.20611572265625, -0.1559295654296875, -0.105743408203125, -0.0555572509765625, -0.00537109375, 0.0448150634765625, 0.095001220703125, 0.1451873779296875, 0.19537353515625, 0.2455596923828125, 0.295745849609375, 0.3459320068359375, 0.3961181640625, 0.4463043212890625, 0.496490478515625, 0.5466766357421875, 0.59686279296875, 0.6470489501953125, 0.697235107421875, 0.7474212646484375, 0.797607421875, 0.8477935791015625, 0.897979736328125, 0.9481658935546875, 0.99835205078125, 1.0485382080078125, 1.098724365234375, 1.1489105224609375, 1.1990966796875, 1.2492828369140625, 1.299468994140625, 1.3496551513671875, 1.39984130859375, 1.4500274658203125, 1.500213623046875, 1.5503997802734375, 1.6005859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 11.0, 17.0, 20.0, 36.0, 51.0, 75.0, 111.0, 171.0, 264.0, 436.0, 688.0, 1048.0, 1732.0, 2829.0, 4803.0, 8222.0, 14320.0, 25015.0, 44022.0, 77783.0, 137977.0, 368330.0, 984133.0, 188676.0, 101576.0, 57349.0, 32410.0, 18637.0, 10671.0, 6277.0, 3646.0, 2134.0, 1338.0, 881.0, 500.0, 321.0, 202.0, 126.0, 90.0, 60.0, 43.0, 30.0, 17.0, 16.0, 9.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1781005859375, -0.1725749969482422, -0.16704940795898438, -0.16152381896972656, -0.15599822998046875, -0.15047264099121094, -0.14494705200195312, -0.1394214630126953, -0.1338958740234375, -0.1283702850341797, -0.12284469604492188, -0.11731910705566406, -0.11179351806640625, -0.10626792907714844, -0.10074234008789062, -0.09521675109863281, -0.089691162109375, -0.08416557312011719, -0.07863998413085938, -0.07311439514160156, -0.06758880615234375, -0.06206321716308594, -0.056537628173828125, -0.05101203918457031, -0.0454864501953125, -0.03996086120605469, -0.034435272216796875, -0.028909683227539062, -0.02338409423828125, -0.017858505249023438, -0.012332916259765625, -0.0068073272705078125, -0.00128173828125, 0.0042438507080078125, 0.009769439697265625, 0.015295028686523438, 0.02082061767578125, 0.026346206665039062, 0.031871795654296875, 0.03739738464355469, 0.0429229736328125, 0.04844856262207031, 0.053974151611328125, 0.05949974060058594, 0.06502532958984375, 0.07055091857910156, 0.07607650756835938, 0.08160209655761719, 0.087127685546875, 0.09265327453613281, 0.09817886352539062, 0.10370445251464844, 0.10923004150390625, 0.11475563049316406, 0.12028121948242188, 0.1258068084716797, 0.1313323974609375, 0.1368579864501953, 0.14238357543945312, 0.14790916442871094, 0.15343475341796875, 0.15896034240722656, 0.16448593139648438, 0.1700115203857422, 0.175537109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 11.0, 21.0, 64.0, 105.0, 157.0, 206.0, 163.0, 111.0, 61.0, 29.0, 12.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.0623931884765625, -0.060211181640625, -0.0580291748046875, -0.05584716796875, -0.0536651611328125, -0.051483154296875, -0.0493011474609375, -0.047119140625, -0.0449371337890625, -0.042755126953125, -0.0405731201171875, -0.03839111328125, -0.0362091064453125, -0.034027099609375, -0.0318450927734375, -0.0296630859375, -0.0274810791015625, -0.025299072265625, -0.0231170654296875, -0.02093505859375, -0.0187530517578125, -0.016571044921875, -0.0143890380859375, -0.01220703125, -0.0100250244140625, -0.007843017578125, -0.0056610107421875, -0.00347900390625, -0.0012969970703125, 0.000885009765625, 0.0030670166015625, 0.0052490234375, 0.0074310302734375, 0.009613037109375, 0.0117950439453125, 0.01397705078125, 0.0161590576171875, 0.018341064453125, 0.0205230712890625, 0.022705078125, 0.0248870849609375, 0.027069091796875, 0.0292510986328125, 0.03143310546875, 0.0336151123046875, 0.035797119140625, 0.0379791259765625, 0.0401611328125, 0.0423431396484375, 0.044525146484375, 0.0467071533203125, 0.04888916015625, 0.0510711669921875, 0.053253173828125, 0.0554351806640625, 0.0576171875, 0.0597991943359375, 0.061981201171875, 0.0641632080078125, 0.06634521484375, 0.0685272216796875, 0.070709228515625, 0.0728912353515625, 0.0750732421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 18.0, 19.0, 25.0, 55.0, 72.0, 142.0, 382.0, 2567.0, 38301.0, 986203.0, 18376.0, 1708.0, 290.0, 122.0, 84.0, 33.0, 23.0, 14.0, 12.0, 7.0, 5.0, 11.0, 4.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.234375, -1.198486328125, -1.16259765625, -1.126708984375, -1.0908203125, -1.054931640625, -1.01904296875, -0.983154296875, -0.947265625, -0.911376953125, -0.87548828125, -0.839599609375, -0.8037109375, -0.767822265625, -0.73193359375, -0.696044921875, -0.66015625, -0.624267578125, -0.58837890625, -0.552490234375, -0.5166015625, -0.480712890625, -0.44482421875, -0.408935546875, -0.373046875, -0.337158203125, -0.30126953125, -0.265380859375, -0.2294921875, -0.193603515625, -0.15771484375, -0.121826171875, -0.0859375, -0.050048828125, -0.01416015625, 0.021728515625, 0.0576171875, 0.093505859375, 0.12939453125, 0.165283203125, 0.201171875, 0.237060546875, 0.27294921875, 0.308837890625, 0.3447265625, 0.380615234375, 0.41650390625, 0.452392578125, 0.48828125, 0.524169921875, 0.56005859375, 0.595947265625, 0.6318359375, 0.667724609375, 0.70361328125, 0.739501953125, 0.775390625, 0.811279296875, 0.84716796875, 0.883056640625, 0.9189453125, 0.954833984375, 0.99072265625, 1.026611328125, 1.0625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 18.0, 20.0, 38.0, 66.0, 111.0, 254.0, 256.0, 101.0, 67.0, 30.0, 13.0, 9.0, 10.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.5029296875, -0.49344804883003235, -0.4839664101600647, -0.47448480129241943, -0.4650031626224518, -0.45552152395248413, -0.44603991508483887, -0.4365582764148712, -0.42707663774490356, -0.4175949990749359, -0.40811336040496826, -0.398631751537323, -0.38915011286735535, -0.3796684741973877, -0.37018686532974243, -0.3607052266597748, -0.35122358798980713, -0.3417419493198395, -0.3322603106498718, -0.32277870178222656, -0.3132970631122589, -0.30381542444229126, -0.294333815574646, -0.28485217690467834, -0.2753705382347107, -0.26588889956474304, -0.2564072608947754, -0.24692565202713013, -0.23744401335716248, -0.22796237468719482, -0.21848075091838837, -0.2089991271495819, -0.19951751828193665, -0.190035879611969, -0.18055425584316254, -0.17107263207435608, -0.16159099340438843, -0.15210935473442078, -0.14262773096561432, -0.13314610719680786, -0.12366446852684021, -0.11418283730745316, -0.1047012060880661, -0.09521957486867905, -0.08573794364929199, -0.07625631242990494, -0.06677468121051788, -0.05729304999113083, -0.047811418771743774, -0.03832978755235672, -0.028848156332969666, -0.01936652511358261, -0.009884893894195557, -0.0004032626748085022, 0.009078368544578552, 0.018559999763965607, 0.02804163098335266, 0.037523262202739716, 0.04700489342212677, 0.056486524641513824, 0.06596815586090088, 0.07544978708028793, 0.08493141829967499, 0.09441304951906204, 0.1038946807384491]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 11.0, 6.0, 10.0, 7.0, 15.0, 19.0, 30.0, 31.0, 33.0, 22.0, 41.0, 40.0, 50.0, 49.0, 38.0, 48.0, 58.0, 49.0, 56.0, 36.0, 39.0, 38.0, 39.0, 37.0, 36.0, 22.0, 22.0, 16.0, 20.0, 20.0, 14.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.048183321952819824, -0.04676072672009468, -0.04533813148736954, -0.043915532529354095, -0.04249293729662895, -0.04107034206390381, -0.03964774310588837, -0.03822514787316322, -0.03680255264043808, -0.035379957407712936, -0.03395736217498779, -0.03253476321697235, -0.031112167984247208, -0.029689572751522064, -0.02826697565615177, -0.02684437856078148, -0.025421783328056335, -0.023999188095331192, -0.0225765909999609, -0.021153993904590607, -0.019731398671865463, -0.01830880343914032, -0.016886206343770027, -0.015463610179722309, -0.014041014015674591, -0.012618417851626873, -0.011195821687579155, -0.009773225523531437, -0.008350629359483719, -0.006928033195436001, -0.005505437031388283, -0.004082840867340565, -0.0026602447032928467, -0.0012376485392451286, 0.00018494762480258942, 0.0016075437888503075, 0.0030301399528980255, 0.0044527361169457436, 0.005875332280993462, 0.00729792844504118, 0.008720524609088898, 0.010143120773136616, 0.011565716937184334, 0.012988313101232052, 0.01441090926527977, 0.015833504498004913, 0.017256101593375206, 0.0186786986887455, 0.020101293921470642, 0.021523889154195786, 0.022946486249566078, 0.02436908334493637, 0.025791678577661514, 0.027214273810386658, 0.02863687090575695, 0.030059468001127243, 0.031482063233852386, 0.03290465846657753, 0.03432725369930267, 0.035749852657318115, 0.03717244789004326, 0.0385950431227684, 0.040017642080783844, 0.04144023731350899, 0.04286283254623413]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 10.0, 10.0, 14.0, 17.0, 28.0, 27.0, 38.0, 39.0, 58.0, 53.0, 47.0, 61.0, 54.0, 59.0, 63.0, 56.0, 63.0, 56.0, 42.0, 41.0, 18.0, 30.0, 23.0, 11.0, 10.0, 11.0, 11.0, 9.0, 4.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.412109375, -3.31732177734375, -3.2225341796875, -3.12774658203125, -3.032958984375, -2.93817138671875, -2.8433837890625, -2.74859619140625, -2.65380859375, -2.55902099609375, -2.4642333984375, -2.36944580078125, -2.274658203125, -2.17987060546875, -2.0850830078125, -1.99029541015625, -1.8955078125, -1.80072021484375, -1.7059326171875, -1.61114501953125, -1.516357421875, -1.42156982421875, -1.3267822265625, -1.23199462890625, -1.13720703125, -1.04241943359375, -0.9476318359375, -0.85284423828125, -0.758056640625, -0.66326904296875, -0.5684814453125, -0.47369384765625, -0.37890625, -0.28411865234375, -0.1893310546875, -0.09454345703125, 0.000244140625, 0.09503173828125, 0.1898193359375, 0.28460693359375, 0.37939453125, 0.47418212890625, 0.5689697265625, 0.66375732421875, 0.758544921875, 0.85333251953125, 0.9481201171875, 1.04290771484375, 1.1376953125, 1.23248291015625, 1.3272705078125, 1.42205810546875, 1.516845703125, 1.61163330078125, 1.7064208984375, 1.80120849609375, 1.89599609375, 1.99078369140625, 2.0855712890625, 2.18035888671875, 2.275146484375, 2.36993408203125, 2.4647216796875, 2.55950927734375, 2.654296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 4.0, 6.0, 15.0, 18.0, 17.0, 30.0, 46.0, 50.0, 92.0, 113.0, 209.0, 370.0, 651.0, 1229.0, 2825.0, 7868.0, 27521.0, 142120.0, 644533.0, 174189.0, 31598.0, 8727.0, 3165.0, 1350.0, 708.0, 417.0, 248.0, 130.0, 91.0, 56.0, 53.0, 26.0, 23.0, 13.0, 13.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0], "bins": [-5.97265625, -5.8135986328125, -5.654541015625, -5.4954833984375, -5.33642578125, -5.1773681640625, -5.018310546875, -4.8592529296875, -4.7001953125, -4.5411376953125, -4.382080078125, -4.2230224609375, -4.06396484375, -3.9049072265625, -3.745849609375, -3.5867919921875, -3.427734375, -3.2686767578125, -3.109619140625, -2.9505615234375, -2.79150390625, -2.6324462890625, -2.473388671875, -2.3143310546875, -2.1552734375, -1.9962158203125, -1.837158203125, -1.6781005859375, -1.51904296875, -1.3599853515625, -1.200927734375, -1.0418701171875, -0.8828125, -0.7237548828125, -0.564697265625, -0.4056396484375, -0.24658203125, -0.0875244140625, 0.071533203125, 0.2305908203125, 0.3896484375, 0.5487060546875, 0.707763671875, 0.8668212890625, 1.02587890625, 1.1849365234375, 1.343994140625, 1.5030517578125, 1.662109375, 1.8211669921875, 1.980224609375, 2.1392822265625, 2.29833984375, 2.4573974609375, 2.616455078125, 2.7755126953125, 2.9345703125, 3.0936279296875, 3.252685546875, 3.4117431640625, 3.57080078125, 3.7298583984375, 3.888916015625, 4.0479736328125, 4.20703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 6.0, 9.0, 12.0, 18.0, 21.0, 22.0, 18.0, 26.0, 26.0, 32.0, 36.0, 39.0, 34.0, 39.0, 45.0, 80.0, 154.0, 1456.0, 324.0, 132.0, 65.0, 55.0, 56.0, 38.0, 24.0, 34.0, 30.0, 35.0, 24.0, 26.0, 14.0, 13.0, 17.0, 13.0, 15.0, 6.0, 4.0, 7.0, 7.0, 4.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.734375, -8.47662353515625, -8.2188720703125, -7.96112060546875, -7.703369140625, -7.44561767578125, -7.1878662109375, -6.93011474609375, -6.67236328125, -6.41461181640625, -6.1568603515625, -5.89910888671875, -5.641357421875, -5.38360595703125, -5.1258544921875, -4.86810302734375, -4.6103515625, -4.35260009765625, -4.0948486328125, -3.83709716796875, -3.579345703125, -3.32159423828125, -3.0638427734375, -2.80609130859375, -2.54833984375, -2.29058837890625, -2.0328369140625, -1.77508544921875, -1.517333984375, -1.25958251953125, -1.0018310546875, -0.74407958984375, -0.486328125, -0.22857666015625, 0.0291748046875, 0.28692626953125, 0.544677734375, 0.80242919921875, 1.0601806640625, 1.31793212890625, 1.57568359375, 1.83343505859375, 2.0911865234375, 2.34893798828125, 2.606689453125, 2.86444091796875, 3.1221923828125, 3.37994384765625, 3.6376953125, 3.89544677734375, 4.1531982421875, 4.41094970703125, 4.668701171875, 4.92645263671875, 5.1842041015625, 5.44195556640625, 5.69970703125, 5.95745849609375, 6.2152099609375, 6.47296142578125, 6.730712890625, 6.98846435546875, 7.2462158203125, 7.50396728515625, 7.76171875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 14.0, 8.0, 22.0, 21.0, 40.0, 32.0, 72.0, 74.0, 122.0, 172.0, 293.0, 470.0, 961.0, 1882.0, 5804.0, 29050.0, 1689234.0, 1380855.0, 27028.0, 5407.0, 1969.0, 863.0, 439.0, 268.0, 186.0, 120.0, 77.0, 53.0, 49.0, 32.0, 30.0, 7.0, 12.0, 8.0, 13.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4765625, -15.00732421875, -14.5380859375, -14.06884765625, -13.599609375, -13.13037109375, -12.6611328125, -12.19189453125, -11.72265625, -11.25341796875, -10.7841796875, -10.31494140625, -9.845703125, -9.37646484375, -8.9072265625, -8.43798828125, -7.96875, -7.49951171875, -7.0302734375, -6.56103515625, -6.091796875, -5.62255859375, -5.1533203125, -4.68408203125, -4.21484375, -3.74560546875, -3.2763671875, -2.80712890625, -2.337890625, -1.86865234375, -1.3994140625, -0.93017578125, -0.4609375, 0.00830078125, 0.4775390625, 0.94677734375, 1.416015625, 1.88525390625, 2.3544921875, 2.82373046875, 3.29296875, 3.76220703125, 4.2314453125, 4.70068359375, 5.169921875, 5.63916015625, 6.1083984375, 6.57763671875, 7.046875, 7.51611328125, 7.9853515625, 8.45458984375, 8.923828125, 9.39306640625, 9.8623046875, 10.33154296875, 10.80078125, 11.27001953125, 11.7392578125, 12.20849609375, 12.677734375, 13.14697265625, 13.6162109375, 14.08544921875, 14.5546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [36.0, 383.0, 517.0, 78.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.998574733734131, -4.2890167236328125, -0.5794587135314941, 3.130098819732666, 6.839657306671143, 10.549215316772461, 14.258771896362305, 17.96833038330078, 21.677888870239258, 25.387447357177734, 29.097003936767578, 32.80656433105469, 36.51612091064453, 40.225677490234375, 43.93523406982422, 47.64479446411133, 51.35435485839844, 55.06391143798828, 58.77347183227539, 62.483028411865234, 66.19258880615234, 69.90214538574219, 73.61170196533203, 77.32125854492188, 81.03081512451172, 84.74037170410156, 88.4499282836914, 92.15948486328125, 95.86904907226562, 99.57860565185547, 103.28816223144531, 106.99771881103516, 110.707275390625, 114.41683197021484, 118.12638854980469, 121.83595275878906, 125.5455093383789, 129.25506591796875, 132.96463012695312, 136.67417907714844, 140.3837432861328, 144.0933074951172, 147.8028564453125, 151.51242065429688, 155.2219696044922, 158.93153381347656, 162.64108276367188, 166.35064697265625, 170.06021118164062, 173.769775390625, 177.4793243408203, 181.1888885498047, 184.8984375, 188.60800170898438, 192.31756591796875, 196.02711486816406, 199.73666381835938, 203.44622802734375, 207.15577697753906, 210.86534118652344, 214.57489013671875, 218.28445434570312, 221.9940185546875, 225.7035675048828, 229.4131317138672]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 1.0, 7.0, 4.0, 8.0, 12.0, 6.0, 8.0, 25.0, 15.0, 28.0, 23.0, 29.0, 25.0, 15.0, 38.0, 31.0, 31.0, 43.0, 33.0, 41.0, 49.0, 36.0, 45.0, 37.0, 39.0, 35.0, 47.0, 37.0, 29.0, 39.0, 23.0, 27.0, 23.0, 9.0, 16.0, 15.0, 11.0, 19.0, 4.0, 7.0, 8.0, 5.0, 8.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.555240631103516, -27.669776916503906, -26.784311294555664, -25.898847579956055, -25.013383865356445, -24.127918243408203, -23.242454528808594, -22.356990814208984, -21.471527099609375, -20.586063385009766, -19.700597763061523, -18.815134048461914, -17.929670333862305, -17.044204711914062, -16.158740997314453, -15.273277282714844, -14.387812614440918, -13.502347946166992, -12.616884231567383, -11.731419563293457, -10.845955848693848, -9.960491180419922, -9.075027465820312, -8.189562797546387, -7.304098606109619, -6.418634414672852, -5.533170223236084, -4.647706031799316, -3.7622416019439697, -2.876777172088623, -1.9913129806518555, -1.105848789215088, -0.2203845977783203, 0.665079653263092, 1.5505439043045044, 2.4360082149505615, 3.321472406387329, 4.206936836242676, 5.092401027679443, 5.977865219116211, 6.8633294105529785, 7.748793601989746, 8.634258270263672, 9.519721984863281, 10.405186653137207, 11.290651321411133, 12.176115036010742, 13.061578750610352, 13.947043418884277, 14.832508087158203, 15.717971801757812, 16.603435516357422, 17.488901138305664, 18.374364852905273, 19.259828567504883, 20.145294189453125, 21.030757904052734, 21.916221618652344, 22.801687240600586, 23.687150955200195, 24.572614669799805, 25.458080291748047, 26.343544006347656, 27.229007720947266, 28.114471435546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 9.0, 13.0, 13.0, 14.0, 24.0, 21.0, 27.0, 40.0, 48.0, 43.0, 49.0, 43.0, 53.0, 51.0, 64.0, 58.0, 60.0, 63.0, 55.0, 46.0, 36.0, 26.0, 20.0, 24.0, 20.0, 11.0, 16.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.6171875, -3.51708984375, -3.4169921875, -3.31689453125, -3.216796875, -3.11669921875, -3.0166015625, -2.91650390625, -2.81640625, -2.71630859375, -2.6162109375, -2.51611328125, -2.416015625, -2.31591796875, -2.2158203125, -2.11572265625, -2.015625, -1.91552734375, -1.8154296875, -1.71533203125, -1.615234375, -1.51513671875, -1.4150390625, -1.31494140625, -1.21484375, -1.11474609375, -1.0146484375, -0.91455078125, -0.814453125, -0.71435546875, -0.6142578125, -0.51416015625, -0.4140625, -0.31396484375, -0.2138671875, -0.11376953125, -0.013671875, 0.08642578125, 0.1865234375, 0.28662109375, 0.38671875, 0.48681640625, 0.5869140625, 0.68701171875, 0.787109375, 0.88720703125, 0.9873046875, 1.08740234375, 1.1875, 1.28759765625, 1.3876953125, 1.48779296875, 1.587890625, 1.68798828125, 1.7880859375, 1.88818359375, 1.98828125, 2.08837890625, 2.1884765625, 2.28857421875, 2.388671875, 2.48876953125, 2.5888671875, 2.68896484375, 2.7890625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 4.0, 12.0, 9.0, 23.0, 18.0, 48.0, 57.0, 63.0, 109.0, 158.0, 190.0, 346.0, 545.0, 771.0, 1395.0, 2440.0, 4571.0, 10062.0, 30220.0, 194621.0, 2316234.0, 1473094.0, 117816.0, 22956.0, 8536.0, 4069.0, 2216.0, 1277.0, 795.0, 556.0, 334.0, 193.0, 167.0, 108.0, 79.0, 53.0, 30.0, 25.0, 24.0, 9.0, 11.0, 10.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-9.578125, -9.3184814453125, -9.058837890625, -8.7991943359375, -8.53955078125, -8.2799072265625, -8.020263671875, -7.7606201171875, -7.5009765625, -7.2413330078125, -6.981689453125, -6.7220458984375, -6.46240234375, -6.2027587890625, -5.943115234375, -5.6834716796875, -5.423828125, -5.1641845703125, -4.904541015625, -4.6448974609375, -4.38525390625, -4.1256103515625, -3.865966796875, -3.6063232421875, -3.3466796875, -3.0870361328125, -2.827392578125, -2.5677490234375, -2.30810546875, -2.0484619140625, -1.788818359375, -1.5291748046875, -1.26953125, -1.0098876953125, -0.750244140625, -0.4906005859375, -0.23095703125, 0.0286865234375, 0.288330078125, 0.5479736328125, 0.8076171875, 1.0672607421875, 1.326904296875, 1.5865478515625, 1.84619140625, 2.1058349609375, 2.365478515625, 2.6251220703125, 2.884765625, 3.1444091796875, 3.404052734375, 3.6636962890625, 3.92333984375, 4.1829833984375, 4.442626953125, 4.7022705078125, 4.9619140625, 5.2215576171875, 5.481201171875, 5.7408447265625, 6.00048828125, 6.2601318359375, 6.519775390625, 6.7794189453125, 7.0390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 3.0, 6.0, 6.0, 15.0, 14.0, 30.0, 38.0, 37.0, 66.0, 108.0, 130.0, 198.0, 242.0, 368.0, 441.0, 548.0, 470.0, 359.0, 262.0, 216.0, 134.0, 98.0, 64.0, 65.0, 31.0, 23.0, 16.0, 18.0, 8.0, 10.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.4453125, -7.235595703125, -7.02587890625, -6.816162109375, -6.6064453125, -6.396728515625, -6.18701171875, -5.977294921875, -5.767578125, -5.557861328125, -5.34814453125, -5.138427734375, -4.9287109375, -4.718994140625, -4.50927734375, -4.299560546875, -4.08984375, -3.880126953125, -3.67041015625, -3.460693359375, -3.2509765625, -3.041259765625, -2.83154296875, -2.621826171875, -2.412109375, -2.202392578125, -1.99267578125, -1.782958984375, -1.5732421875, -1.363525390625, -1.15380859375, -0.944091796875, -0.734375, -0.524658203125, -0.31494140625, -0.105224609375, 0.1044921875, 0.314208984375, 0.52392578125, 0.733642578125, 0.943359375, 1.153076171875, 1.36279296875, 1.572509765625, 1.7822265625, 1.991943359375, 2.20166015625, 2.411376953125, 2.62109375, 2.830810546875, 3.04052734375, 3.250244140625, 3.4599609375, 3.669677734375, 3.87939453125, 4.089111328125, 4.298828125, 4.508544921875, 4.71826171875, 4.927978515625, 5.1376953125, 5.347412109375, 5.55712890625, 5.766845703125, 5.9765625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 8.0, 22.0, 25.0, 45.0, 50.0, 67.0, 110.0, 159.0, 227.0, 342.0, 492.0, 730.0, 1113.0, 1660.0, 2431.0, 3931.0, 6405.0, 11623.0, 23778.0, 64502.0, 238493.0, 1082819.0, 1975943.0, 567033.0, 130589.0, 40709.0, 17328.0, 8917.0, 5146.0, 3239.0, 2068.0, 1361.0, 926.0, 640.0, 444.0, 291.0, 211.0, 117.0, 94.0, 42.0, 45.0, 23.0, 20.0, 13.0, 13.0, 11.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.171875, -7.93353271484375, -7.6951904296875, -7.45684814453125, -7.218505859375, -6.98016357421875, -6.7418212890625, -6.50347900390625, -6.26513671875, -6.02679443359375, -5.7884521484375, -5.55010986328125, -5.311767578125, -5.07342529296875, -4.8350830078125, -4.59674072265625, -4.3583984375, -4.12005615234375, -3.8817138671875, -3.64337158203125, -3.405029296875, -3.16668701171875, -2.9283447265625, -2.69000244140625, -2.45166015625, -2.21331787109375, -1.9749755859375, -1.73663330078125, -1.498291015625, -1.25994873046875, -1.0216064453125, -0.78326416015625, -0.544921875, -0.30657958984375, -0.0682373046875, 0.17010498046875, 0.408447265625, 0.64678955078125, 0.8851318359375, 1.12347412109375, 1.36181640625, 1.60015869140625, 1.8385009765625, 2.07684326171875, 2.315185546875, 2.55352783203125, 2.7918701171875, 3.03021240234375, 3.2685546875, 3.50689697265625, 3.7452392578125, 3.98358154296875, 4.221923828125, 4.46026611328125, 4.6986083984375, 4.93695068359375, 5.17529296875, 5.41363525390625, 5.6519775390625, 5.89031982421875, 6.128662109375, 6.36700439453125, 6.6053466796875, 6.84368896484375, 7.08203125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 11.0, 16.0, 24.0, 28.0, 40.0, 55.0, 80.0, 99.0, 118.0, 130.0, 115.0, 83.0, 64.0, 56.0, 30.0, 18.0, 9.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-59.97016906738281, -58.69586944580078, -57.421566009521484, -56.14726638793945, -54.872962951660156, -53.598663330078125, -52.32435989379883, -51.0500602722168, -49.7757568359375, -48.50145721435547, -47.22715377807617, -45.95285415649414, -44.678550720214844, -43.40425109863281, -42.129947662353516, -40.855648040771484, -39.58134460449219, -38.307044982910156, -37.03274154663086, -35.75844192504883, -34.48413848876953, -33.2098388671875, -31.935535430908203, -30.661235809326172, -29.38693618774414, -28.112634658813477, -26.838333129882812, -25.56403160095215, -24.289730072021484, -23.01542854309082, -21.741127014160156, -20.466827392578125, -19.19252586364746, -17.918224334716797, -16.643922805786133, -15.369621276855469, -14.095319747924805, -12.82101821899414, -11.546717643737793, -10.272416114807129, -8.998114585876465, -7.723813056945801, -6.449511528015137, -5.175210475921631, -3.900908946990967, -2.6266074180603027, -1.3523063659667969, -0.07800483703613281, 1.1962966918945312, 2.4705982208251953, 3.7448995113372803, 5.019200801849365, 6.293502330780029, 7.567803859710693, 8.8421049118042, 10.116406440734863, 11.390707969665527, 12.665009498596191, 13.939311027526855, 15.213611602783203, 16.487913131713867, 17.76221466064453, 19.036516189575195, 20.31081771850586, 21.585119247436523]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 7.0, 6.0, 10.0, 13.0, 14.0, 12.0, 14.0, 22.0, 25.0, 30.0, 26.0, 35.0, 31.0, 45.0, 46.0, 34.0, 44.0, 48.0, 54.0, 50.0, 38.0, 36.0, 44.0, 35.0, 44.0, 27.0, 30.0, 27.0, 22.0, 18.0, 16.0, 12.0, 14.0, 13.0, 10.0, 9.0, 5.0, 8.0, 6.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.33960723876953, -22.65927505493164, -21.978944778442383, -21.298612594604492, -20.618282318115234, -19.937950134277344, -19.257617950439453, -18.577287673950195, -17.896957397460938, -17.216625213623047, -16.53629493713379, -15.855962753295898, -15.17563247680664, -14.49530029296875, -13.814969062805176, -13.134637832641602, -12.454305648803711, -11.773974418640137, -11.093643188476562, -10.413311004638672, -9.732980728149414, -9.052648544311523, -8.37231731414795, -7.691986083984375, -7.011654853820801, -6.331323623657227, -5.650992393493652, -4.97066068649292, -4.290329456329346, -3.6099982261657715, -2.929666519165039, -2.249335289001465, -1.5690059661865234, -0.8886746168136597, -0.2083432674407959, 0.4719882011413574, 1.1523194313049316, 1.8326506614685059, 2.5129823684692383, 3.1933135986328125, 3.8736448287963867, 4.553976058959961, 5.234307289123535, 5.914638996124268, 6.594970226287842, 7.275301456451416, 7.955633163452148, 8.635964393615723, 9.316295623779297, 9.996626853942871, 10.676958084106445, 11.357290267944336, 12.037620544433594, 12.717952728271484, 13.398283958435059, 14.078615188598633, 14.758946418762207, 15.439277648925781, 16.119609832763672, 16.79994010925293, 17.48027229309082, 18.160602569580078, 18.84093475341797, 19.52126693725586, 20.201597213745117]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 2.0, 9.0, 9.0, 13.0, 15.0, 20.0, 18.0, 22.0, 27.0, 38.0, 40.0, 63.0, 50.0, 51.0, 54.0, 71.0, 62.0, 54.0, 63.0, 49.0, 46.0, 39.0, 32.0, 33.0, 26.0, 28.0, 14.0, 14.0, 10.0, 11.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.86328125, -3.755340576171875, -3.64739990234375, -3.539459228515625, -3.4315185546875, -3.323577880859375, -3.21563720703125, -3.107696533203125, -2.999755859375, -2.891815185546875, -2.78387451171875, -2.675933837890625, -2.5679931640625, -2.460052490234375, -2.35211181640625, -2.244171142578125, -2.13623046875, -2.028289794921875, -1.92034912109375, -1.812408447265625, -1.7044677734375, -1.596527099609375, -1.48858642578125, -1.380645751953125, -1.272705078125, -1.164764404296875, -1.05682373046875, -0.948883056640625, -0.8409423828125, -0.733001708984375, -0.62506103515625, -0.517120361328125, -0.4091796875, -0.301239013671875, -0.19329833984375, -0.085357666015625, 0.0225830078125, 0.130523681640625, 0.23846435546875, 0.346405029296875, 0.454345703125, 0.562286376953125, 0.67022705078125, 0.778167724609375, 0.8861083984375, 0.994049072265625, 1.10198974609375, 1.209930419921875, 1.31787109375, 1.425811767578125, 1.53375244140625, 1.641693115234375, 1.7496337890625, 1.857574462890625, 1.96551513671875, 2.073455810546875, 2.181396484375, 2.289337158203125, 2.39727783203125, 2.505218505859375, 2.6131591796875, 2.721099853515625, 2.82904052734375, 2.936981201171875, 3.044921875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 5.0, 13.0, 29.0, 37.0, 64.0, 78.0, 143.0, 167.0, 250.0, 344.0, 530.0, 741.0, 1178.0, 1854.0, 3468.0, 7782.0, 21037.0, 70117.0, 235926.0, 409910.0, 202695.0, 58810.0, 18233.0, 6804.0, 3216.0, 1805.0, 1047.0, 678.0, 497.0, 341.0, 224.0, 186.0, 113.0, 65.0, 63.0, 34.0, 28.0, 16.0, 9.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.021484375, -0.9909286499023438, -0.9603729248046875, -0.9298171997070312, -0.899261474609375, -0.8687057495117188, -0.8381500244140625, -0.8075942993164062, -0.77703857421875, -0.7464828491210938, -0.7159271240234375, -0.6853713989257812, -0.654815673828125, -0.6242599487304688, -0.5937042236328125, -0.5631484985351562, -0.5325927734375, -0.5020370483398438, -0.4714813232421875, -0.44092559814453125, -0.410369873046875, -0.37981414794921875, -0.3492584228515625, -0.31870269775390625, -0.28814697265625, -0.25759124755859375, -0.2270355224609375, -0.19647979736328125, -0.165924072265625, -0.13536834716796875, -0.1048126220703125, -0.07425689697265625, -0.043701171875, -0.01314544677734375, 0.0174102783203125, 0.04796600341796875, 0.078521728515625, 0.10907745361328125, 0.1396331787109375, 0.17018890380859375, 0.20074462890625, 0.23130035400390625, 0.2618560791015625, 0.29241180419921875, 0.322967529296875, 0.35352325439453125, 0.3840789794921875, 0.41463470458984375, 0.4451904296875, 0.47574615478515625, 0.5063018798828125, 0.5368576049804688, 0.567413330078125, 0.5979690551757812, 0.6285247802734375, 0.6590805053710938, 0.68963623046875, 0.7201919555664062, 0.7507476806640625, 0.7813034057617188, 0.811859130859375, 0.8424148559570312, 0.8729705810546875, 0.9035263061523438, 0.93408203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 2.0, 9.0, 7.0, 12.0, 15.0, 14.0, 20.0, 19.0, 37.0, 28.0, 32.0, 30.0, 32.0, 30.0, 52.0, 40.0, 41.0, 48.0, 1060.0, 52.0, 46.0, 52.0, 41.0, 39.0, 37.0, 27.0, 30.0, 25.0, 27.0, 25.0, 14.0, 15.0, 10.0, 15.0, 15.0, 8.0, 10.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.296875, -2.23370361328125, -2.1705322265625, -2.10736083984375, -2.044189453125, -1.98101806640625, -1.9178466796875, -1.85467529296875, -1.79150390625, -1.72833251953125, -1.6651611328125, -1.60198974609375, -1.538818359375, -1.47564697265625, -1.4124755859375, -1.34930419921875, -1.2861328125, -1.22296142578125, -1.1597900390625, -1.09661865234375, -1.033447265625, -0.97027587890625, -0.9071044921875, -0.84393310546875, -0.78076171875, -0.71759033203125, -0.6544189453125, -0.59124755859375, -0.528076171875, -0.46490478515625, -0.4017333984375, -0.33856201171875, -0.275390625, -0.21221923828125, -0.1490478515625, -0.08587646484375, -0.022705078125, 0.04046630859375, 0.1036376953125, 0.16680908203125, 0.22998046875, 0.29315185546875, 0.3563232421875, 0.41949462890625, 0.482666015625, 0.54583740234375, 0.6090087890625, 0.67218017578125, 0.7353515625, 0.79852294921875, 0.8616943359375, 0.92486572265625, 0.988037109375, 1.05120849609375, 1.1143798828125, 1.17755126953125, 1.24072265625, 1.30389404296875, 1.3670654296875, 1.43023681640625, 1.493408203125, 1.55657958984375, 1.6197509765625, 1.68292236328125, 1.74609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 8.0, 28.0, 37.0, 39.0, 55.0, 90.0, 158.0, 272.0, 468.0, 965.0, 2482.0, 7153.0, 28291.0, 137801.0, 1377462.0, 434985.0, 80752.0, 17568.0, 4968.0, 1767.0, 792.0, 388.0, 201.0, 131.0, 76.0, 56.0, 32.0, 25.0, 15.0, 7.0, 7.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.5458984375, -0.5302276611328125, -0.514556884765625, -0.4988861083984375, -0.48321533203125, -0.4675445556640625, -0.451873779296875, -0.4362030029296875, -0.4205322265625, -0.4048614501953125, -0.389190673828125, -0.3735198974609375, -0.35784912109375, -0.3421783447265625, -0.326507568359375, -0.3108367919921875, -0.295166015625, -0.2794952392578125, -0.263824462890625, -0.2481536865234375, -0.23248291015625, -0.2168121337890625, -0.201141357421875, -0.1854705810546875, -0.1697998046875, -0.1541290283203125, -0.138458251953125, -0.1227874755859375, -0.10711669921875, -0.0914459228515625, -0.075775146484375, -0.0601043701171875, -0.04443359375, -0.0287628173828125, -0.013092041015625, 0.0025787353515625, 0.01824951171875, 0.0339202880859375, 0.049591064453125, 0.0652618408203125, 0.0809326171875, 0.0966033935546875, 0.112274169921875, 0.1279449462890625, 0.14361572265625, 0.1592864990234375, 0.174957275390625, 0.1906280517578125, 0.206298828125, 0.2219696044921875, 0.237640380859375, 0.2533111572265625, 0.26898193359375, 0.2846527099609375, 0.300323486328125, 0.3159942626953125, 0.3316650390625, 0.3473358154296875, 0.363006591796875, 0.3786773681640625, 0.39434814453125, 0.4100189208984375, 0.425689697265625, 0.4413604736328125, 0.45703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 5.0, 9.0, 47.0, 96.0, 345.0, 290.0, 82.0, 32.0, 11.0, 5.0, 1.0, 6.0, 2.0, 3.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.17840003967285156, -0.17222976684570312, -0.1660594940185547, -0.15988922119140625, -0.1537189483642578, -0.14754867553710938, -0.14137840270996094, -0.1352081298828125, -0.12903785705566406, -0.12286758422851562, -0.11669731140136719, -0.11052703857421875, -0.10435676574707031, -0.09818649291992188, -0.09201622009277344, -0.085845947265625, -0.07967567443847656, -0.07350540161132812, -0.06733512878417969, -0.06116485595703125, -0.05499458312988281, -0.048824310302734375, -0.04265403747558594, -0.0364837646484375, -0.030313491821289062, -0.024143218994140625, -0.017972946166992188, -0.01180267333984375, -0.0056324005126953125, 0.000537872314453125, 0.0067081451416015625, 0.01287841796875, 0.019048690795898438, 0.025218963623046875, 0.03138923645019531, 0.03755950927734375, 0.04372978210449219, 0.049900054931640625, 0.05607032775878906, 0.0622406005859375, 0.06841087341308594, 0.07458114624023438, 0.08075141906738281, 0.08692169189453125, 0.09309196472167969, 0.09926223754882812, 0.10543251037597656, 0.111602783203125, 0.11777305603027344, 0.12394332885742188, 0.1301136016845703, 0.13628387451171875, 0.1424541473388672, 0.14862442016601562, 0.15479469299316406, 0.1609649658203125, 0.16713523864746094, 0.17330551147460938, 0.1794757843017578, 0.18564605712890625, 0.1918163299560547, 0.19798660278320312, 0.20415687561035156, 0.2103271484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 3.0, 5.0, 10.0, 12.0, 21.0, 21.0, 19.0, 16.0, 25.0, 34.0, 37.0, 85.0, 153.0, 1022.0, 11808.0, 1016500.0, 16956.0, 1251.0, 225.0, 86.0, 47.0, 40.0, 37.0, 23.0, 14.0, 20.0, 7.0, 11.0, 6.0, 6.0, 4.0, 4.0, 8.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.986328125, -2.8973388671875, -2.808349609375, -2.7193603515625, -2.63037109375, -2.5413818359375, -2.452392578125, -2.3634033203125, -2.2744140625, -2.1854248046875, -2.096435546875, -2.0074462890625, -1.91845703125, -1.8294677734375, -1.740478515625, -1.6514892578125, -1.5625, -1.4735107421875, -1.384521484375, -1.2955322265625, -1.20654296875, -1.1175537109375, -1.028564453125, -0.9395751953125, -0.8505859375, -0.7615966796875, -0.672607421875, -0.5836181640625, -0.49462890625, -0.4056396484375, -0.316650390625, -0.2276611328125, -0.138671875, -0.0496826171875, 0.039306640625, 0.1282958984375, 0.21728515625, 0.3062744140625, 0.395263671875, 0.4842529296875, 0.5732421875, 0.6622314453125, 0.751220703125, 0.8402099609375, 0.92919921875, 1.0181884765625, 1.107177734375, 1.1961669921875, 1.28515625, 1.3741455078125, 1.463134765625, 1.5521240234375, 1.64111328125, 1.7301025390625, 1.819091796875, 1.9080810546875, 1.9970703125, 2.0860595703125, 2.175048828125, 2.2640380859375, 2.35302734375, 2.4420166015625, 2.531005859375, 2.6199951171875, 2.708984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 18.0, 39.0, 196.0, 561.0, 153.0, 35.0, 10.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2398250102996826, -2.199423313140869, -2.1590216159820557, -2.118619918823242, -2.0782179832458496, -2.037816286087036, -1.9974145889282227, -1.9570128917694092, -1.9166110754013062, -1.8762093782424927, -1.8358075618743896, -1.7954058647155762, -1.7550041675567627, -1.7146023511886597, -1.6742006540298462, -1.6337988376617432, -1.5933971405029297, -1.5529954433441162, -1.5125936269760132, -1.4721919298171997, -1.4317902326583862, -1.3913884162902832, -1.3509867191314697, -1.3105850219726562, -1.2701833248138428, -1.2297816276550293, -1.1893798112869263, -1.1489781141281128, -1.1085764169692993, -1.0681746006011963, -1.0277729034423828, -0.9873711466789246, -0.9469693899154663, -0.9065676331520081, -0.8661659359931946, -0.8257641792297363, -0.7853624224662781, -0.7449606657028198, -0.7045589685440063, -0.6641572117805481, -0.6237555146217346, -0.5833537578582764, -0.5429520606994629, -0.5025503039360046, -0.4621485471725464, -0.4217468202114105, -0.38134509325027466, -0.3409433364868164, -0.30054160952568054, -0.2601398825645447, -0.21973812580108643, -0.17933639883995056, -0.1389346569776535, -0.09853291511535645, -0.05813118815422058, -0.01772943139076233, 0.022672295570373535, 0.0630740374326706, 0.10347577184438705, 0.14387750625610352, 0.18427924811840057, 0.22468098998069763, 0.2650827169418335, 0.30548447370529175, 0.3458862006664276]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 6.0, 6.0, 5.0, 11.0, 9.0, 9.0, 12.0, 19.0, 14.0, 20.0, 20.0, 25.0, 26.0, 27.0, 36.0, 30.0, 40.0, 26.0, 37.0, 51.0, 46.0, 46.0, 39.0, 30.0, 36.0, 37.0, 45.0, 41.0, 29.0, 36.0, 24.0, 21.0, 24.0, 15.0, 17.0, 16.0, 12.0, 14.0, 14.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.22420895099639893, -0.2168494164943695, -0.2094898819923401, -0.20213034749031067, -0.19477081298828125, -0.18741127848625183, -0.1800517439842224, -0.172692209482193, -0.16533267498016357, -0.15797314047813416, -0.15061360597610474, -0.14325407147407532, -0.1358945369720459, -0.12853500247001648, -0.12117547541856766, -0.11381594091653824, -0.10645641386508942, -0.09909687936306, -0.09173734486103058, -0.08437781035900116, -0.07701827585697174, -0.06965874135494232, -0.0622992143034935, -0.05493967980146408, -0.04758014529943466, -0.04022061079740524, -0.032861076295375824, -0.025501545518636703, -0.018142011016607285, -0.010782476514577866, -0.003422945737838745, 0.003936588764190674, 0.011296123266220093, 0.01865565776824951, 0.02601519040763378, 0.03337472304701805, 0.04073425754904747, 0.04809379205107689, 0.05545332282781601, 0.06281285732984543, 0.07017239183187485, 0.07753192633390427, 0.08489146083593369, 0.09225098788738251, 0.09961052238941193, 0.10697005689144135, 0.11432959139347076, 0.12168912589550018, 0.1290486603975296, 0.13640819489955902, 0.14376772940158844, 0.15112726390361786, 0.15848679840564728, 0.1658463329076767, 0.17320585250854492, 0.18056538701057434, 0.18792492151260376, 0.19528445601463318, 0.2026439905166626, 0.21000352501869202, 0.21736305952072144, 0.22472259402275085, 0.23208212852478027, 0.2394416630268097, 0.2468011975288391]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 1.0, 7.0, 7.0, 19.0, 13.0, 14.0, 20.0, 29.0, 41.0, 44.0, 39.0, 43.0, 67.0, 45.0, 65.0, 55.0, 54.0, 67.0, 57.0, 54.0, 46.0, 28.0, 38.0, 23.0, 23.0, 16.0, 17.0, 15.0, 18.0, 6.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66015625, -3.554443359375, -3.44873046875, -3.343017578125, -3.2373046875, -3.131591796875, -3.02587890625, -2.920166015625, -2.814453125, -2.708740234375, -2.60302734375, -2.497314453125, -2.3916015625, -2.285888671875, -2.18017578125, -2.074462890625, -1.96875, -1.863037109375, -1.75732421875, -1.651611328125, -1.5458984375, -1.440185546875, -1.33447265625, -1.228759765625, -1.123046875, -1.017333984375, -0.91162109375, -0.805908203125, -0.7001953125, -0.594482421875, -0.48876953125, -0.383056640625, -0.27734375, -0.171630859375, -0.06591796875, 0.039794921875, 0.1455078125, 0.251220703125, 0.35693359375, 0.462646484375, 0.568359375, 0.674072265625, 0.77978515625, 0.885498046875, 0.9912109375, 1.096923828125, 1.20263671875, 1.308349609375, 1.4140625, 1.519775390625, 1.62548828125, 1.731201171875, 1.8369140625, 1.942626953125, 2.04833984375, 2.154052734375, 2.259765625, 2.365478515625, 2.47119140625, 2.576904296875, 2.6826171875, 2.788330078125, 2.89404296875, 2.999755859375, 3.10546875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 7.0, 19.0, 26.0, 29.0, 47.0, 81.0, 120.0, 151.0, 256.0, 464.0, 765.0, 1289.0, 2419.0, 4535.0, 8842.0, 21160.0, 60081.0, 189710.0, 434630.0, 212497.0, 67475.0, 23430.0, 9760.0, 4619.0, 2593.0, 1429.0, 838.0, 473.0, 276.0, 174.0, 106.0, 70.0, 45.0, 38.0, 23.0, 15.0, 17.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.744140625, -3.635772705078125, -3.52740478515625, -3.419036865234375, -3.3106689453125, -3.202301025390625, -3.09393310546875, -2.985565185546875, -2.877197265625, -2.768829345703125, -2.66046142578125, -2.552093505859375, -2.4437255859375, -2.335357666015625, -2.22698974609375, -2.118621826171875, -2.01025390625, -1.901885986328125, -1.79351806640625, -1.685150146484375, -1.5767822265625, -1.468414306640625, -1.36004638671875, -1.251678466796875, -1.143310546875, -1.034942626953125, -0.92657470703125, -0.818206787109375, -0.7098388671875, -0.601470947265625, -0.49310302734375, -0.384735107421875, -0.2763671875, -0.167999267578125, -0.05963134765625, 0.048736572265625, 0.1571044921875, 0.265472412109375, 0.37384033203125, 0.482208251953125, 0.590576171875, 0.698944091796875, 0.80731201171875, 0.915679931640625, 1.0240478515625, 1.132415771484375, 1.24078369140625, 1.349151611328125, 1.45751953125, 1.565887451171875, 1.67425537109375, 1.782623291015625, 1.8909912109375, 1.999359130859375, 2.10772705078125, 2.216094970703125, 2.324462890625, 2.432830810546875, 2.54119873046875, 2.649566650390625, 2.7579345703125, 2.866302490234375, 2.97467041015625, 3.083038330078125, 3.19140625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 9.0, 10.0, 16.0, 14.0, 25.0, 29.0, 28.0, 27.0, 22.0, 44.0, 41.0, 51.0, 60.0, 73.0, 138.0, 273.0, 1398.0, 249.0, 105.0, 50.0, 55.0, 42.0, 26.0, 42.0, 28.0, 35.0, 23.0, 15.0, 13.0, 18.0, 9.0, 14.0, 4.0, 8.0, 6.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.015625, -8.7369384765625, -8.458251953125, -8.1795654296875, -7.90087890625, -7.6221923828125, -7.343505859375, -7.0648193359375, -6.7861328125, -6.5074462890625, -6.228759765625, -5.9500732421875, -5.67138671875, -5.3927001953125, -5.114013671875, -4.8353271484375, -4.556640625, -4.2779541015625, -3.999267578125, -3.7205810546875, -3.44189453125, -3.1632080078125, -2.884521484375, -2.6058349609375, -2.3271484375, -2.0484619140625, -1.769775390625, -1.4910888671875, -1.21240234375, -0.9337158203125, -0.655029296875, -0.3763427734375, -0.09765625, 0.1810302734375, 0.459716796875, 0.7384033203125, 1.01708984375, 1.2957763671875, 1.574462890625, 1.8531494140625, 2.1318359375, 2.4105224609375, 2.689208984375, 2.9678955078125, 3.24658203125, 3.5252685546875, 3.803955078125, 4.0826416015625, 4.361328125, 4.6400146484375, 4.918701171875, 5.1973876953125, 5.47607421875, 5.7547607421875, 6.033447265625, 6.3121337890625, 6.5908203125, 6.8695068359375, 7.148193359375, 7.4268798828125, 7.70556640625, 7.9842529296875, 8.262939453125, 8.5416259765625, 8.8203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 13.0, 15.0, 26.0, 28.0, 48.0, 76.0, 112.0, 209.0, 364.0, 852.0, 3185.0, 42545.0, 3002229.0, 89586.0, 4349.0, 1043.0, 373.0, 253.0, 141.0, 88.0, 52.0, 34.0, 26.0, 14.0, 7.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.03125, -23.33642578125, -22.6416015625, -21.94677734375, -21.251953125, -20.55712890625, -19.8623046875, -19.16748046875, -18.47265625, -17.77783203125, -17.0830078125, -16.38818359375, -15.693359375, -14.99853515625, -14.3037109375, -13.60888671875, -12.9140625, -12.21923828125, -11.5244140625, -10.82958984375, -10.134765625, -9.43994140625, -8.7451171875, -8.05029296875, -7.35546875, -6.66064453125, -5.9658203125, -5.27099609375, -4.576171875, -3.88134765625, -3.1865234375, -2.49169921875, -1.796875, -1.10205078125, -0.4072265625, 0.28759765625, 0.982421875, 1.67724609375, 2.3720703125, 3.06689453125, 3.76171875, 4.45654296875, 5.1513671875, 5.84619140625, 6.541015625, 7.23583984375, 7.9306640625, 8.62548828125, 9.3203125, 10.01513671875, 10.7099609375, 11.40478515625, 12.099609375, 12.79443359375, 13.4892578125, 14.18408203125, 14.87890625, 15.57373046875, 16.2685546875, 16.96337890625, 17.658203125, 18.35302734375, 19.0478515625, 19.74267578125, 20.4375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 31.0, 506.0, 453.0, 28.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.21781349182129, -20.983278274536133, -16.748743057250977, -12.51420783996582, -8.279672622680664, -4.045137405395508, 0.18939781188964844, 4.423933029174805, 8.658468246459961, 12.893003463745117, 17.127538681030273, 21.36207389831543, 25.596609115600586, 29.831144332885742, 34.06568145751953, 38.30021667480469, 42.534751892089844, 46.769287109375, 51.003822326660156, 55.23835754394531, 59.47289276123047, 63.707427978515625, 67.94196319580078, 72.17649841308594, 76.4110336303711, 80.64556884765625, 84.8801040649414, 89.11463928222656, 93.34917449951172, 97.58370971679688, 101.81824493408203, 106.05278015136719, 110.28730773925781, 114.52184295654297, 118.75637817382812, 122.99091339111328, 127.22544860839844, 131.45999145507812, 135.69451904296875, 139.92904663085938, 144.16358947753906, 148.39813232421875, 152.63265991210938, 156.8671875, 161.1017303466797, 165.33627319335938, 169.57080078125, 173.80532836914062, 178.0398712158203, 182.2744140625, 186.50894165039062, 190.74346923828125, 194.97801208496094, 199.21255493164062, 203.44708251953125, 207.68161010742188, 211.91615295410156, 216.15069580078125, 220.38522338867188, 224.6197509765625, 228.8542938232422, 233.08883666992188, 237.3233642578125, 241.55789184570312, 245.7924346923828]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 10.0, 10.0, 13.0, 17.0, 21.0, 20.0, 15.0, 32.0, 26.0, 28.0, 33.0, 36.0, 31.0, 45.0, 47.0, 45.0, 40.0, 40.0, 48.0, 48.0, 47.0, 31.0, 35.0, 29.0, 41.0, 18.0, 36.0, 25.0, 16.0, 25.0, 14.0, 23.0, 15.0, 14.0, 4.0, 5.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-32.34456253051758, -31.40703010559082, -30.469497680664062, -29.531965255737305, -28.594432830810547, -27.656898498535156, -26.7193660736084, -25.78183364868164, -24.844301223754883, -23.906768798828125, -22.969236373901367, -22.03170394897461, -21.09416961669922, -20.156639099121094, -19.219104766845703, -18.281572341918945, -17.344039916992188, -16.40650749206543, -15.468975067138672, -14.531441688537598, -13.59390926361084, -12.656376838684082, -11.718843460083008, -10.78131103515625, -9.843778610229492, -8.906246185302734, -7.968713283538818, -7.031180381774902, -6.0936479568481445, -5.156115531921387, -4.218582630157471, -3.2810497283935547, -2.343517303466797, -1.40598464012146, -0.46845197677612305, 0.46908068656921387, 1.4066133499145508, 2.3441457748413086, 3.2816786766052246, 4.219211578369141, 5.156744003295898, 6.094276428222656, 7.031809329986572, 7.969342231750488, 8.906874656677246, 9.844407081604004, 10.781940460205078, 11.719472885131836, 12.657005310058594, 13.594537734985352, 14.53207015991211, 15.469603538513184, 16.407135009765625, 17.344669342041016, 18.282201766967773, 19.21973419189453, 20.15726661682129, 21.094799041748047, 22.032331466674805, 22.969863891601562, 23.907398223876953, 24.844928741455078, 25.78246307373047, 26.719995498657227, 27.657527923583984]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 11.0, 10.0, 11.0, 12.0, 25.0, 26.0, 22.0, 33.0, 46.0, 47.0, 45.0, 55.0, 56.0, 72.0, 63.0, 69.0, 50.0, 61.0, 53.0, 35.0, 48.0, 26.0, 25.0, 25.0, 14.0, 18.0, 10.0, 11.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.984375, -3.868682861328125, -3.75299072265625, -3.637298583984375, -3.5216064453125, -3.405914306640625, -3.29022216796875, -3.174530029296875, -3.058837890625, -2.943145751953125, -2.82745361328125, -2.711761474609375, -2.5960693359375, -2.480377197265625, -2.36468505859375, -2.248992919921875, -2.13330078125, -2.017608642578125, -1.90191650390625, -1.786224365234375, -1.6705322265625, -1.554840087890625, -1.43914794921875, -1.323455810546875, -1.207763671875, -1.092071533203125, -0.97637939453125, -0.860687255859375, -0.7449951171875, -0.629302978515625, -0.51361083984375, -0.397918701171875, -0.2822265625, -0.166534423828125, -0.05084228515625, 0.064849853515625, 0.1805419921875, 0.296234130859375, 0.41192626953125, 0.527618408203125, 0.643310546875, 0.759002685546875, 0.87469482421875, 0.990386962890625, 1.1060791015625, 1.221771240234375, 1.33746337890625, 1.453155517578125, 1.56884765625, 1.684539794921875, 1.80023193359375, 1.915924072265625, 2.0316162109375, 2.147308349609375, 2.26300048828125, 2.378692626953125, 2.494384765625, 2.610076904296875, 2.72576904296875, 2.841461181640625, 2.9571533203125, 3.072845458984375, 3.18853759765625, 3.304229736328125, 3.419921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 5.0, 4.0, 8.0, 6.0, 7.0, 15.0, 19.0, 29.0, 34.0, 56.0, 95.0, 124.0, 207.0, 291.0, 506.0, 879.0, 1740.0, 3377.0, 7766.0, 20034.0, 99279.0, 1511131.0, 2350801.0, 156180.0, 24559.0, 8647.0, 3924.0, 1928.0, 1065.0, 603.0, 357.0, 208.0, 143.0, 79.0, 61.0, 38.0, 23.0, 19.0, 9.0, 12.0, 9.0, 3.0, 0.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.09375, -9.7977294921875, -9.501708984375, -9.2056884765625, -8.90966796875, -8.6136474609375, -8.317626953125, -8.0216064453125, -7.7255859375, -7.4295654296875, -7.133544921875, -6.8375244140625, -6.54150390625, -6.2454833984375, -5.949462890625, -5.6534423828125, -5.357421875, -5.0614013671875, -4.765380859375, -4.4693603515625, -4.17333984375, -3.8773193359375, -3.581298828125, -3.2852783203125, -2.9892578125, -2.6932373046875, -2.397216796875, -2.1011962890625, -1.80517578125, -1.5091552734375, -1.213134765625, -0.9171142578125, -0.62109375, -0.3250732421875, -0.029052734375, 0.2669677734375, 0.56298828125, 0.8590087890625, 1.155029296875, 1.4510498046875, 1.7470703125, 2.0430908203125, 2.339111328125, 2.6351318359375, 2.93115234375, 3.2271728515625, 3.523193359375, 3.8192138671875, 4.115234375, 4.4112548828125, 4.707275390625, 5.0032958984375, 5.29931640625, 5.5953369140625, 5.891357421875, 6.1873779296875, 6.4833984375, 6.7794189453125, 7.075439453125, 7.3714599609375, 7.66748046875, 7.9635009765625, 8.259521484375, 8.5555419921875, 8.8515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 7.0, 20.0, 20.0, 7.0, 33.0, 32.0, 68.0, 71.0, 96.0, 133.0, 181.0, 241.0, 355.0, 447.0, 480.0, 423.0, 359.0, 277.0, 203.0, 155.0, 116.0, 89.0, 55.0, 46.0, 30.0, 25.0, 18.0, 14.0, 13.0, 10.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.515625, -5.3218994140625, -5.128173828125, -4.9344482421875, -4.74072265625, -4.5469970703125, -4.353271484375, -4.1595458984375, -3.9658203125, -3.7720947265625, -3.578369140625, -3.3846435546875, -3.19091796875, -2.9971923828125, -2.803466796875, -2.6097412109375, -2.416015625, -2.2222900390625, -2.028564453125, -1.8348388671875, -1.64111328125, -1.4473876953125, -1.253662109375, -1.0599365234375, -0.8662109375, -0.6724853515625, -0.478759765625, -0.2850341796875, -0.09130859375, 0.1024169921875, 0.296142578125, 0.4898681640625, 0.68359375, 0.8773193359375, 1.071044921875, 1.2647705078125, 1.45849609375, 1.6522216796875, 1.845947265625, 2.0396728515625, 2.2333984375, 2.4271240234375, 2.620849609375, 2.8145751953125, 3.00830078125, 3.2020263671875, 3.395751953125, 3.5894775390625, 3.783203125, 3.9769287109375, 4.170654296875, 4.3643798828125, 4.55810546875, 4.7518310546875, 4.945556640625, 5.1392822265625, 5.3330078125, 5.5267333984375, 5.720458984375, 5.9141845703125, 6.10791015625, 6.3016357421875, 6.495361328125, 6.6890869140625, 6.8828125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 16.0, 16.0, 26.0, 41.0, 45.0, 55.0, 104.0, 195.0, 255.0, 356.0, 613.0, 998.0, 1561.0, 2631.0, 4480.0, 8335.0, 16237.0, 37872.0, 118651.0, 534512.0, 1990100.0, 1129849.0, 234779.0, 62338.0, 24005.0, 11277.0, 6041.0, 3376.0, 2086.0, 1215.0, 761.0, 469.0, 353.0, 217.0, 128.0, 95.0, 70.0, 23.0, 27.0, 21.0, 14.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.76019287109375, -6.5164794921875, -6.27276611328125, -6.029052734375, -5.78533935546875, -5.5416259765625, -5.29791259765625, -5.05419921875, -4.81048583984375, -4.5667724609375, -4.32305908203125, -4.079345703125, -3.83563232421875, -3.5919189453125, -3.34820556640625, -3.1044921875, -2.86077880859375, -2.6170654296875, -2.37335205078125, -2.129638671875, -1.88592529296875, -1.6422119140625, -1.39849853515625, -1.15478515625, -0.91107177734375, -0.6673583984375, -0.42364501953125, -0.179931640625, 0.06378173828125, 0.3074951171875, 0.55120849609375, 0.794921875, 1.03863525390625, 1.2823486328125, 1.52606201171875, 1.769775390625, 2.01348876953125, 2.2572021484375, 2.50091552734375, 2.74462890625, 2.98834228515625, 3.2320556640625, 3.47576904296875, 3.719482421875, 3.96319580078125, 4.2069091796875, 4.45062255859375, 4.6943359375, 4.93804931640625, 5.1817626953125, 5.42547607421875, 5.669189453125, 5.91290283203125, 6.1566162109375, 6.40032958984375, 6.64404296875, 6.88775634765625, 7.1314697265625, 7.37518310546875, 7.618896484375, 7.86260986328125, 8.1063232421875, 8.35003662109375, 8.59375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 15.0, 26.0, 115.0, 269.0, 325.0, 181.0, 54.0, 13.0, 9.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.35435485839844, -205.33767700195312, -201.32098388671875, -197.30429077148438, -193.28761291503906, -189.27093505859375, -185.25424194335938, -181.237548828125, -177.2208709716797, -173.20419311523438, -169.1875, -165.17080688476562, -161.1541290283203, -157.137451171875, -153.12075805664062, -149.10406494140625, -145.08738708496094, -141.07070922851562, -137.05401611328125, -133.03732299804688, -129.02064514160156, -125.00395965576172, -120.98727416992188, -116.97058868408203, -112.95390319824219, -108.93721771240234, -104.9205322265625, -100.90384674072266, -96.88716125488281, -92.87047576904297, -88.85379028320312, -84.83710479736328, -80.82042694091797, -76.80374145507812, -72.78705596923828, -68.77037048339844, -64.7536849975586, -60.73699951171875, -56.720314025878906, -52.70362854003906, -48.68694305419922, -44.670257568359375, -40.65357208251953, -36.63688659667969, -32.620201110839844, -28.603515625, -24.586830139160156, -20.570144653320312, -16.55345916748047, -12.536773681640625, -8.520088195800781, -4.5034027099609375, -0.48671722412109375, 3.52996826171875, 7.546653747558594, 11.563339233398438, 15.580024719238281, 19.596710205078125, 23.61339569091797, 27.630081176757812, 31.646766662597656, 35.6634521484375, 39.680137634277344, 43.69682312011719, 47.71350860595703]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 1.0, 5.0, 0.0, 7.0, 8.0, 11.0, 8.0, 13.0, 14.0, 9.0, 16.0, 17.0, 19.0, 20.0, 16.0, 15.0, 25.0, 27.0, 27.0, 38.0, 30.0, 35.0, 41.0, 53.0, 42.0, 32.0, 36.0, 32.0, 34.0, 42.0, 25.0, 31.0, 28.0, 35.0, 22.0, 24.0, 29.0, 25.0, 14.0, 6.0, 14.0, 11.0, 10.0, 11.0, 7.0, 3.0, 9.0, 2.0, 6.0, 6.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.770544052124023, -21.082311630249023, -20.394081115722656, -19.705848693847656, -19.017616271972656, -18.32938575744629, -17.64115333557129, -16.952922821044922, -16.264690399169922, -15.576458930969238, -14.888227462768555, -14.199995040893555, -13.511763572692871, -12.823532104492188, -12.135299682617188, -11.447068214416504, -10.75883674621582, -10.070605278015137, -9.382373809814453, -8.694141387939453, -8.00590991973877, -7.317678451538086, -6.629446506500244, -5.941214561462402, -5.252983093261719, -4.564751625061035, -3.8765196800231934, -3.1882879734039307, -2.500056266784668, -1.8118245601654053, -1.1235928535461426, -0.4353609085083008, 0.2528724670410156, 0.9411041736602783, 1.629335880279541, 2.3175675868988037, 3.0057992935180664, 3.694031000137329, 4.382262706756592, 5.070494651794434, 5.758726119995117, 6.446957588195801, 7.135189533233643, 7.823421478271484, 8.511652946472168, 9.199884414672852, 9.888116836547852, 10.576348304748535, 11.264579772949219, 11.952811241149902, 12.641042709350586, 13.329275131225586, 14.01750659942627, 14.705738067626953, 15.393970489501953, 16.082202911376953, 16.77043342590332, 17.45866584777832, 18.146896362304688, 18.835128784179688, 19.523361206054688, 20.211591720581055, 20.899824142456055, 21.588054656982422, 22.276287078857422]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 6.0, 9.0, 11.0, 13.0, 14.0, 29.0, 25.0, 34.0, 37.0, 40.0, 45.0, 50.0, 53.0, 56.0, 67.0, 51.0, 65.0, 70.0, 52.0, 40.0, 46.0, 35.0, 37.0, 28.0, 16.0, 14.0, 15.0, 10.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.19244384765625, -4.0723876953125, -3.95233154296875, -3.832275390625, -3.71221923828125, -3.5921630859375, -3.47210693359375, -3.35205078125, -3.23199462890625, -3.1119384765625, -2.99188232421875, -2.871826171875, -2.75177001953125, -2.6317138671875, -2.51165771484375, -2.3916015625, -2.27154541015625, -2.1514892578125, -2.03143310546875, -1.911376953125, -1.79132080078125, -1.6712646484375, -1.55120849609375, -1.43115234375, -1.31109619140625, -1.1910400390625, -1.07098388671875, -0.950927734375, -0.83087158203125, -0.7108154296875, -0.59075927734375, -0.470703125, -0.35064697265625, -0.2305908203125, -0.11053466796875, 0.009521484375, 0.12957763671875, 0.2496337890625, 0.36968994140625, 0.48974609375, 0.60980224609375, 0.7298583984375, 0.84991455078125, 0.969970703125, 1.09002685546875, 1.2100830078125, 1.33013916015625, 1.4501953125, 1.57025146484375, 1.6903076171875, 1.81036376953125, 1.930419921875, 2.05047607421875, 2.1705322265625, 2.29058837890625, 2.41064453125, 2.53070068359375, 2.6507568359375, 2.77081298828125, 2.890869140625, 3.01092529296875, 3.1309814453125, 3.25103759765625, 3.37109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 7.0, 17.0, 20.0, 19.0, 26.0, 25.0, 46.0, 56.0, 72.0, 109.0, 155.0, 166.0, 251.0, 313.0, 473.0, 644.0, 946.0, 1383.0, 2330.0, 3717.0, 7377.0, 15936.0, 37293.0, 94073.0, 215663.0, 313231.0, 201701.0, 86297.0, 34380.0, 14612.0, 6923.0, 3567.0, 2087.0, 1357.0, 919.0, 609.0, 437.0, 371.0, 207.0, 198.0, 144.0, 97.0, 67.0, 52.0, 55.0, 27.0, 24.0, 19.0, 17.0, 8.0, 10.0, 4.0, 5.0, 3.0, 6.0, 2.0], "bins": [-0.837890625, -0.8128433227539062, -0.7877960205078125, -0.7627487182617188, -0.737701416015625, -0.7126541137695312, -0.6876068115234375, -0.6625595092773438, -0.63751220703125, -0.6124649047851562, -0.5874176025390625, -0.5623703002929688, -0.537322998046875, -0.5122756958007812, -0.4872283935546875, -0.46218109130859375, -0.4371337890625, -0.41208648681640625, -0.3870391845703125, -0.36199188232421875, -0.336944580078125, -0.31189727783203125, -0.2868499755859375, -0.26180267333984375, -0.23675537109375, -0.21170806884765625, -0.1866607666015625, -0.16161346435546875, -0.136566162109375, -0.11151885986328125, -0.0864715576171875, -0.06142425537109375, -0.036376953125, -0.01132965087890625, 0.0137176513671875, 0.03876495361328125, 0.063812255859375, 0.08885955810546875, 0.1139068603515625, 0.13895416259765625, 0.16400146484375, 0.18904876708984375, 0.2140960693359375, 0.23914337158203125, 0.264190673828125, 0.28923797607421875, 0.3142852783203125, 0.33933258056640625, 0.3643798828125, 0.38942718505859375, 0.4144744873046875, 0.43952178955078125, 0.464569091796875, 0.48961639404296875, 0.5146636962890625, 0.5397109985351562, 0.56475830078125, 0.5898056030273438, 0.6148529052734375, 0.6399002075195312, 0.664947509765625, 0.6899948120117188, 0.7150421142578125, 0.7400894165039062, 0.76513671875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 3.0, 4.0, 6.0, 4.0, 10.0, 10.0, 20.0, 15.0, 13.0, 18.0, 17.0, 25.0, 32.0, 32.0, 47.0, 36.0, 34.0, 41.0, 35.0, 40.0, 33.0, 1069.0, 32.0, 44.0, 39.0, 36.0, 34.0, 32.0, 36.0, 39.0, 27.0, 19.0, 21.0, 19.0, 20.0, 15.0, 9.0, 17.0, 12.0, 7.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.033203125, -1.96954345703125, -1.9058837890625, -1.84222412109375, -1.778564453125, -1.71490478515625, -1.6512451171875, -1.58758544921875, -1.52392578125, -1.46026611328125, -1.3966064453125, -1.33294677734375, -1.269287109375, -1.20562744140625, -1.1419677734375, -1.07830810546875, -1.0146484375, -0.95098876953125, -0.8873291015625, -0.82366943359375, -0.760009765625, -0.69635009765625, -0.6326904296875, -0.56903076171875, -0.50537109375, -0.44171142578125, -0.3780517578125, -0.31439208984375, -0.250732421875, -0.18707275390625, -0.1234130859375, -0.05975341796875, 0.00390625, 0.06756591796875, 0.1312255859375, 0.19488525390625, 0.258544921875, 0.32220458984375, 0.3858642578125, 0.44952392578125, 0.51318359375, 0.57684326171875, 0.6405029296875, 0.70416259765625, 0.767822265625, 0.83148193359375, 0.8951416015625, 0.95880126953125, 1.0224609375, 1.08612060546875, 1.1497802734375, 1.21343994140625, 1.277099609375, 1.34075927734375, 1.4044189453125, 1.46807861328125, 1.53173828125, 1.59539794921875, 1.6590576171875, 1.72271728515625, 1.786376953125, 1.85003662109375, 1.9136962890625, 1.97735595703125, 2.041015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 14.0, 30.0, 32.0, 74.0, 112.0, 181.0, 339.0, 586.0, 1296.0, 3126.0, 10802.0, 54692.0, 357522.0, 1506485.0, 130458.0, 22403.0, 5225.0, 1885.0, 846.0, 424.0, 241.0, 124.0, 70.0, 43.0, 32.0, 17.0, 18.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.68798828125, -0.6684646606445312, -0.6489410400390625, -0.6294174194335938, -0.609893798828125, -0.5903701782226562, -0.5708465576171875, -0.5513229370117188, -0.53179931640625, -0.5122756958007812, -0.4927520751953125, -0.47322845458984375, -0.453704833984375, -0.43418121337890625, -0.4146575927734375, -0.39513397216796875, -0.3756103515625, -0.35608673095703125, -0.3365631103515625, -0.31703948974609375, -0.297515869140625, -0.27799224853515625, -0.2584686279296875, -0.23894500732421875, -0.21942138671875, -0.19989776611328125, -0.1803741455078125, -0.16085052490234375, -0.141326904296875, -0.12180328369140625, -0.1022796630859375, -0.08275604248046875, -0.063232421875, -0.04370880126953125, -0.0241851806640625, -0.00466156005859375, 0.014862060546875, 0.03438568115234375, 0.0539093017578125, 0.07343292236328125, 0.09295654296875, 0.11248016357421875, 0.1320037841796875, 0.15152740478515625, 0.171051025390625, 0.19057464599609375, 0.2100982666015625, 0.22962188720703125, 0.2491455078125, 0.26866912841796875, 0.2881927490234375, 0.30771636962890625, 0.327239990234375, 0.34676361083984375, 0.3662872314453125, 0.38581085205078125, 0.40533447265625, 0.42485809326171875, 0.4443817138671875, 0.46390533447265625, 0.483428955078125, 0.5029525756835938, 0.5224761962890625, 0.5419998168945312, 0.5615234375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0, 16.0, 14.0, 19.0, 26.0, 40.0, 64.0, 98.0, 169.0, 189.0, 119.0, 79.0, 52.0, 33.0, 19.0, 11.0, 12.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.091064453125, -0.08794116973876953, -0.08481788635253906, -0.0816946029663086, -0.07857131958007812, -0.07544803619384766, -0.07232475280761719, -0.06920146942138672, -0.06607818603515625, -0.06295490264892578, -0.05983161926269531, -0.056708335876464844, -0.053585052490234375, -0.050461769104003906, -0.04733848571777344, -0.04421520233154297, -0.0410919189453125, -0.03796863555908203, -0.03484535217285156, -0.031722068786621094, -0.028598785400390625, -0.025475502014160156, -0.022352218627929688, -0.01922893524169922, -0.01610565185546875, -0.012982368469238281, -0.009859085083007812, -0.006735801696777344, -0.003612518310546875, -0.0004892349243164062, 0.0026340484619140625, 0.005757331848144531, 0.008880615234375, 0.012003898620605469, 0.015127182006835938, 0.018250465393066406, 0.021373748779296875, 0.024497032165527344, 0.027620315551757812, 0.03074359893798828, 0.03386688232421875, 0.03699016571044922, 0.04011344909667969, 0.043236732482910156, 0.046360015869140625, 0.049483299255371094, 0.05260658264160156, 0.05572986602783203, 0.0588531494140625, 0.06197643280029297, 0.06509971618652344, 0.0682229995727539, 0.07134628295898438, 0.07446956634521484, 0.07759284973144531, 0.08071613311767578, 0.08383941650390625, 0.08696269989013672, 0.09008598327636719, 0.09320926666259766, 0.09633255004882812, 0.0994558334350586, 0.10257911682128906, 0.10570240020751953, 0.10882568359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 15.0, 20.0, 27.0, 58.0, 61.0, 216.0, 771.0, 5834.0, 943603.0, 94159.0, 3040.0, 435.0, 118.0, 63.0, 46.0, 24.0, 14.0, 13.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.33984375, -2.272705078125, -2.20556640625, -2.138427734375, -2.0712890625, -2.004150390625, -1.93701171875, -1.869873046875, -1.802734375, -1.735595703125, -1.66845703125, -1.601318359375, -1.5341796875, -1.467041015625, -1.39990234375, -1.332763671875, -1.265625, -1.198486328125, -1.13134765625, -1.064208984375, -0.9970703125, -0.929931640625, -0.86279296875, -0.795654296875, -0.728515625, -0.661376953125, -0.59423828125, -0.527099609375, -0.4599609375, -0.392822265625, -0.32568359375, -0.258544921875, -0.19140625, -0.124267578125, -0.05712890625, 0.010009765625, 0.0771484375, 0.144287109375, 0.21142578125, 0.278564453125, 0.345703125, 0.412841796875, 0.47998046875, 0.547119140625, 0.6142578125, 0.681396484375, 0.74853515625, 0.815673828125, 0.8828125, 0.949951171875, 1.01708984375, 1.084228515625, 1.1513671875, 1.218505859375, 1.28564453125, 1.352783203125, 1.419921875, 1.487060546875, 1.55419921875, 1.621337890625, 1.6884765625, 1.755615234375, 1.82275390625, 1.889892578125, 1.95703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 16.0, 34.0, 135.0, 390.0, 315.0, 74.0, 26.0, 11.0, 6.0, 2.0, 1.0], "bins": [-1.5195623636245728, -1.4928452968597412, -1.4661283493041992, -1.4394112825393677, -1.4126942157745361, -1.3859772682189941, -1.3592602014541626, -1.332543134689331, -1.305826187133789, -1.2791091203689575, -1.2523921728134155, -1.225675106048584, -1.1989580392837524, -1.1722410917282104, -1.145524024963379, -1.1188069581985474, -1.0920898914337158, -1.0653728246688843, -1.0386558771133423, -1.0119388103485107, -0.985221803188324, -0.9585047364234924, -0.9317877292633057, -0.9050706624984741, -0.8783537149429321, -0.8516367077827454, -0.8249196410179138, -0.798202633857727, -0.7714856266975403, -0.7447685599327087, -0.718051552772522, -0.6913344860076904, -0.6646174192428589, -0.6379004120826721, -0.6111833453178406, -0.5844663381576538, -0.557749330997467, -0.5310322642326355, -0.5043152570724487, -0.4775982201099396, -0.4508812427520752, -0.42416420578956604, -0.3974471986293793, -0.3707301616668701, -0.34401312470436096, -0.3172960877418518, -0.29057908058166504, -0.2638620436191559, -0.23714500665664673, -0.21042798459529877, -0.1837109476327896, -0.15699392557144165, -0.1302768886089325, -0.10355986654758453, -0.07684284448623657, -0.05012580752372742, -0.023408785462379456, 0.0033082421869039536, 0.030025269836187363, 0.05674229562282562, 0.08345932513475418, 0.11017635464668274, 0.1368933767080307, 0.16361041367053986, 0.19032743573188782]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 11.0, 7.0, 15.0, 18.0, 14.0, 18.0, 24.0, 36.0, 31.0, 39.0, 48.0, 36.0, 30.0, 45.0, 37.0, 38.0, 43.0, 37.0, 41.0, 45.0, 45.0, 41.0, 38.0, 36.0, 30.0, 25.0, 20.0, 23.0, 23.0, 20.0, 10.0, 15.0, 15.0, 7.0, 5.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09699952602386475, -0.09404895454645157, -0.09109838306903839, -0.08814781159162521, -0.08519724011421204, -0.08224666863679886, -0.07929609715938568, -0.0763455256819725, -0.07339495420455933, -0.07044438272714615, -0.06749381124973297, -0.0645432397723198, -0.061592668294906616, -0.05864209681749344, -0.05569152534008026, -0.052740953862667084, -0.049790382385253906, -0.04683981090784073, -0.04388923943042755, -0.040938667953014374, -0.037988096475601196, -0.03503752499818802, -0.03208695352077484, -0.029136382043361664, -0.026185810565948486, -0.02323523908853531, -0.02028466761112213, -0.017334096133708954, -0.014383524656295776, -0.011432953178882599, -0.008482381701469421, -0.005531810224056244, -0.0025812387466430664, 0.0003693327307701111, 0.0033199042081832886, 0.006270475685596466, 0.009221047163009644, 0.012171618640422821, 0.015122190117835999, 0.018072761595249176, 0.021023333072662354, 0.02397390455007553, 0.02692447602748871, 0.029875047504901886, 0.032825618982315063, 0.03577619045972824, 0.03872676193714142, 0.041677333414554596, 0.04462790489196777, 0.04757847636938095, 0.05052904784679413, 0.053479619324207306, 0.05643019080162048, 0.05938076227903366, 0.06233133375644684, 0.06528190523386002, 0.0682324767112732, 0.07118304818868637, 0.07413361966609955, 0.07708419114351273, 0.0800347626209259, 0.08298533409833908, 0.08593590557575226, 0.08888647705316544, 0.09183704853057861]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 11.0, 11.0, 11.0, 17.0, 22.0, 26.0, 24.0, 41.0, 40.0, 56.0, 59.0, 52.0, 78.0, 54.0, 64.0, 68.0, 57.0, 59.0, 49.0, 43.0, 33.0, 30.0, 22.0, 25.0, 10.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3472900390625, -4.221923828125, -4.0965576171875, -3.97119140625, -3.8458251953125, -3.720458984375, -3.5950927734375, -3.4697265625, -3.3443603515625, -3.218994140625, -3.0936279296875, -2.96826171875, -2.8428955078125, -2.717529296875, -2.5921630859375, -2.466796875, -2.3414306640625, -2.216064453125, -2.0906982421875, -1.96533203125, -1.8399658203125, -1.714599609375, -1.5892333984375, -1.4638671875, -1.3385009765625, -1.213134765625, -1.0877685546875, -0.96240234375, -0.8370361328125, -0.711669921875, -0.5863037109375, -0.4609375, -0.3355712890625, -0.210205078125, -0.0848388671875, 0.04052734375, 0.1658935546875, 0.291259765625, 0.4166259765625, 0.5419921875, 0.6673583984375, 0.792724609375, 0.9180908203125, 1.04345703125, 1.1688232421875, 1.294189453125, 1.4195556640625, 1.544921875, 1.6702880859375, 1.795654296875, 1.9210205078125, 2.04638671875, 2.1717529296875, 2.297119140625, 2.4224853515625, 2.5478515625, 2.6732177734375, 2.798583984375, 2.9239501953125, 3.04931640625, 3.1746826171875, 3.300048828125, 3.4254150390625, 3.55078125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 11.0, 15.0, 17.0, 41.0, 51.0, 84.0, 144.0, 198.0, 328.0, 516.0, 833.0, 1315.0, 2179.0, 3854.0, 6290.0, 11110.0, 20698.0, 42744.0, 96729.0, 215522.0, 303772.0, 183911.0, 80237.0, 35902.0, 18212.0, 9689.0, 5563.0, 3340.0, 2028.0, 1203.0, 753.0, 470.0, 283.0, 187.0, 115.0, 81.0, 44.0, 23.0, 25.0, 11.0, 10.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.591278076171875, -2.50872802734375, -2.426177978515625, -2.3436279296875, -2.261077880859375, -2.17852783203125, -2.095977783203125, -2.013427734375, -1.930877685546875, -1.84832763671875, -1.765777587890625, -1.6832275390625, -1.600677490234375, -1.51812744140625, -1.435577392578125, -1.35302734375, -1.270477294921875, -1.18792724609375, -1.105377197265625, -1.0228271484375, -0.940277099609375, -0.85772705078125, -0.775177001953125, -0.692626953125, -0.610076904296875, -0.52752685546875, -0.444976806640625, -0.3624267578125, -0.279876708984375, -0.19732666015625, -0.114776611328125, -0.0322265625, 0.050323486328125, 0.13287353515625, 0.215423583984375, 0.2979736328125, 0.380523681640625, 0.46307373046875, 0.545623779296875, 0.628173828125, 0.710723876953125, 0.79327392578125, 0.875823974609375, 0.9583740234375, 1.040924072265625, 1.12347412109375, 1.206024169921875, 1.28857421875, 1.371124267578125, 1.45367431640625, 1.536224365234375, 1.6187744140625, 1.701324462890625, 1.78387451171875, 1.866424560546875, 1.948974609375, 2.031524658203125, 2.11407470703125, 2.196624755859375, 2.2791748046875, 2.361724853515625, 2.44427490234375, 2.526824951171875, 2.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 2.0, 8.0, 0.0, 10.0, 15.0, 20.0, 13.0, 14.0, 15.0, 24.0, 33.0, 28.0, 42.0, 41.0, 35.0, 50.0, 52.0, 91.0, 205.0, 1386.0, 333.0, 164.0, 74.0, 67.0, 34.0, 36.0, 31.0, 32.0, 29.0, 22.0, 28.0, 22.0, 26.0, 12.0, 17.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.862060546875, -8.54443359375, -8.226806640625, -7.9091796875, -7.591552734375, -7.27392578125, -6.956298828125, -6.638671875, -6.321044921875, -6.00341796875, -5.685791015625, -5.3681640625, -5.050537109375, -4.73291015625, -4.415283203125, -4.09765625, -3.780029296875, -3.46240234375, -3.144775390625, -2.8271484375, -2.509521484375, -2.19189453125, -1.874267578125, -1.556640625, -1.239013671875, -0.92138671875, -0.603759765625, -0.2861328125, 0.031494140625, 0.34912109375, 0.666748046875, 0.984375, 1.302001953125, 1.61962890625, 1.937255859375, 2.2548828125, 2.572509765625, 2.89013671875, 3.207763671875, 3.525390625, 3.843017578125, 4.16064453125, 4.478271484375, 4.7958984375, 5.113525390625, 5.43115234375, 5.748779296875, 6.06640625, 6.384033203125, 6.70166015625, 7.019287109375, 7.3369140625, 7.654541015625, 7.97216796875, 8.289794921875, 8.607421875, 8.925048828125, 9.24267578125, 9.560302734375, 9.8779296875, 10.195556640625, 10.51318359375, 10.830810546875, 11.1484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 10.0, 9.0, 20.0, 22.0, 21.0, 32.0, 35.0, 46.0, 51.0, 85.0, 92.0, 172.0, 287.0, 484.0, 1480.0, 9472.0, 517665.0, 2583174.0, 28255.0, 2519.0, 718.0, 343.0, 200.0, 113.0, 100.0, 61.0, 49.0, 35.0, 24.0, 26.0, 19.0, 20.0, 12.0, 8.0, 10.0, 5.0, 2.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-19.859375, -19.294921875, -18.73046875, -18.166015625, -17.6015625, -17.037109375, -16.47265625, -15.908203125, -15.34375, -14.779296875, -14.21484375, -13.650390625, -13.0859375, -12.521484375, -11.95703125, -11.392578125, -10.828125, -10.263671875, -9.69921875, -9.134765625, -8.5703125, -8.005859375, -7.44140625, -6.876953125, -6.3125, -5.748046875, -5.18359375, -4.619140625, -4.0546875, -3.490234375, -2.92578125, -2.361328125, -1.796875, -1.232421875, -0.66796875, -0.103515625, 0.4609375, 1.025390625, 1.58984375, 2.154296875, 2.71875, 3.283203125, 3.84765625, 4.412109375, 4.9765625, 5.541015625, 6.10546875, 6.669921875, 7.234375, 7.798828125, 8.36328125, 8.927734375, 9.4921875, 10.056640625, 10.62109375, 11.185546875, 11.75, 12.314453125, 12.87890625, 13.443359375, 14.0078125, 14.572265625, 15.13671875, 15.701171875, 16.265625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 11.0, 24.0, 50.0, 97.0, 165.0, 195.0, 189.0, 117.0, 85.0, 43.0, 23.0, 7.0, 6.0, 1.0], "bins": [-49.52204895019531, -48.634037017822266, -47.746028900146484, -46.85801696777344, -45.970008850097656, -45.08199691772461, -44.19398498535156, -43.30597686767578, -42.417964935302734, -41.52995300292969, -40.641944885253906, -39.75393295288086, -38.86592102050781, -37.97791290283203, -37.089900970458984, -36.2018928527832, -35.313880920410156, -34.42586898803711, -33.53786087036133, -32.64984893798828, -31.761838912963867, -30.873828887939453, -29.985816955566406, -29.097806930541992, -28.209796905517578, -27.321786880493164, -26.43377685546875, -25.545764923095703, -24.65775489807129, -23.769744873046875, -22.881732940673828, -21.993722915649414, -21.105710983276367, -20.217700958251953, -19.329689025878906, -18.441679000854492, -17.553668975830078, -16.665658950805664, -15.777647972106934, -14.889636993408203, -14.001626968383789, -13.113616943359375, -12.225605964660645, -11.337594985961914, -10.4495849609375, -9.561574935913086, -8.673563957214355, -7.785553455352783, -6.897543430328369, -6.009532928466797, -5.121522426605225, -4.233511924743652, -3.34550142288208, -2.457490921020508, -1.5694804191589355, -0.6814699172973633, 0.20654058456420898, 1.0945510864257812, 1.9825615882873535, 2.870572090148926, 3.758582592010498, 4.64659309387207, 5.534603595733643, 6.422614097595215, 7.310624599456787]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 9.0, 5.0, 6.0, 10.0, 17.0, 10.0, 15.0, 18.0, 18.0, 25.0, 23.0, 20.0, 21.0, 37.0, 26.0, 37.0, 30.0, 44.0, 41.0, 45.0, 46.0, 32.0, 29.0, 30.0, 39.0, 36.0, 31.0, 34.0, 29.0, 29.0, 27.0, 28.0, 21.0, 28.0, 15.0, 26.0, 18.0, 9.0, 12.0, 6.0, 5.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.49749755859375, -24.715063095092773, -23.932626724243164, -23.150192260742188, -22.36775779724121, -21.5853214263916, -20.802886962890625, -20.020450592041016, -19.23801612854004, -18.455581665039062, -17.673145294189453, -16.890710830688477, -16.1082763671875, -15.32583999633789, -14.543405532836914, -13.760970115661621, -12.978535652160645, -12.196100234985352, -11.413665771484375, -10.631230354309082, -9.848794937133789, -9.066360473632812, -8.28392505645752, -7.501489639282227, -6.719054698944092, -5.936619758605957, -5.154184341430664, -4.371749401092529, -3.5893142223358154, -2.8068790435791016, -2.024444103240967, -1.2420086860656738, -0.45957374572753906, 0.32286137342453003, 1.1052964925765991, 1.8877315521240234, 2.6701667308807373, 3.452601909637451, 4.235036849975586, 5.017472267150879, 5.799907207489014, 6.582342147827148, 7.364777565002441, 8.147212982177734, 8.929647445678711, 9.712082862854004, 10.494518280029297, 11.276952743530273, 12.059388160705566, 12.84182357788086, 13.624258041381836, 14.406693458557129, 15.189128875732422, 15.971563339233398, 16.753997802734375, 17.536434173583984, 18.31886863708496, 19.101303100585938, 19.883739471435547, 20.666173934936523, 21.4486083984375, 22.23104476928711, 23.013479232788086, 23.795913696289062, 24.578350067138672]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 7.0, 8.0, 17.0, 19.0, 20.0, 29.0, 17.0, 34.0, 38.0, 40.0, 42.0, 40.0, 57.0, 55.0, 61.0, 40.0, 59.0, 79.0, 41.0, 38.0, 45.0, 33.0, 30.0, 28.0, 24.0, 17.0, 15.0, 18.0, 10.0, 5.0, 10.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.40234375, -4.287109375, -4.171875, -4.056640625, -3.94140625, -3.826171875, -3.7109375, -3.595703125, -3.48046875, -3.365234375, -3.25, -3.134765625, -3.01953125, -2.904296875, -2.7890625, -2.673828125, -2.55859375, -2.443359375, -2.328125, -2.212890625, -2.09765625, -1.982421875, -1.8671875, -1.751953125, -1.63671875, -1.521484375, -1.40625, -1.291015625, -1.17578125, -1.060546875, -0.9453125, -0.830078125, -0.71484375, -0.599609375, -0.484375, -0.369140625, -0.25390625, -0.138671875, -0.0234375, 0.091796875, 0.20703125, 0.322265625, 0.4375, 0.552734375, 0.66796875, 0.783203125, 0.8984375, 1.013671875, 1.12890625, 1.244140625, 1.359375, 1.474609375, 1.58984375, 1.705078125, 1.8203125, 1.935546875, 2.05078125, 2.166015625, 2.28125, 2.396484375, 2.51171875, 2.626953125, 2.7421875, 2.857421875, 2.97265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 7.0, 4.0, 6.0, 18.0, 18.0, 29.0, 28.0, 57.0, 69.0, 85.0, 131.0, 217.0, 321.0, 461.0, 701.0, 1154.0, 1927.0, 3478.0, 7104.0, 18129.0, 81380.0, 863337.0, 2726596.0, 416645.0, 47889.0, 12681.0, 5241.0, 2628.0, 1522.0, 842.0, 525.0, 356.0, 236.0, 130.0, 89.0, 65.0, 49.0, 40.0, 27.0, 17.0, 6.0, 9.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.609375, -9.34503173828125, -9.0806884765625, -8.81634521484375, -8.552001953125, -8.28765869140625, -8.0233154296875, -7.75897216796875, -7.49462890625, -7.23028564453125, -6.9659423828125, -6.70159912109375, -6.437255859375, -6.17291259765625, -5.9085693359375, -5.64422607421875, -5.3798828125, -5.11553955078125, -4.8511962890625, -4.58685302734375, -4.322509765625, -4.05816650390625, -3.7938232421875, -3.52947998046875, -3.26513671875, -3.00079345703125, -2.7364501953125, -2.47210693359375, -2.207763671875, -1.94342041015625, -1.6790771484375, -1.41473388671875, -1.150390625, -0.88604736328125, -0.6217041015625, -0.35736083984375, -0.093017578125, 0.17132568359375, 0.4356689453125, 0.70001220703125, 0.96435546875, 1.22869873046875, 1.4930419921875, 1.75738525390625, 2.021728515625, 2.28607177734375, 2.5504150390625, 2.81475830078125, 3.0791015625, 3.34344482421875, 3.6077880859375, 3.87213134765625, 4.136474609375, 4.40081787109375, 4.6651611328125, 4.92950439453125, 5.19384765625, 5.45819091796875, 5.7225341796875, 5.98687744140625, 6.251220703125, 6.51556396484375, 6.7799072265625, 7.04425048828125, 7.30859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 1.0, 9.0, 11.0, 15.0, 22.0, 42.0, 71.0, 109.0, 157.0, 302.0, 519.0, 712.0, 786.0, 532.0, 326.0, 196.0, 101.0, 61.0, 40.0, 27.0, 12.0, 10.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.703125, -12.3408203125, -11.978515625, -11.6162109375, -11.25390625, -10.8916015625, -10.529296875, -10.1669921875, -9.8046875, -9.4423828125, -9.080078125, -8.7177734375, -8.35546875, -7.9931640625, -7.630859375, -7.2685546875, -6.90625, -6.5439453125, -6.181640625, -5.8193359375, -5.45703125, -5.0947265625, -4.732421875, -4.3701171875, -4.0078125, -3.6455078125, -3.283203125, -2.9208984375, -2.55859375, -2.1962890625, -1.833984375, -1.4716796875, -1.109375, -0.7470703125, -0.384765625, -0.0224609375, 0.33984375, 0.7021484375, 1.064453125, 1.4267578125, 1.7890625, 2.1513671875, 2.513671875, 2.8759765625, 3.23828125, 3.6005859375, 3.962890625, 4.3251953125, 4.6875, 5.0498046875, 5.412109375, 5.7744140625, 6.13671875, 6.4990234375, 6.861328125, 7.2236328125, 7.5859375, 7.9482421875, 8.310546875, 8.6728515625, 9.03515625, 9.3974609375, 9.759765625, 10.1220703125, 10.484375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 21.0, 33.0, 79.0, 192.0, 561.0, 1930.0, 10409.0, 155770.0, 3794960.0, 215159.0, 12024.0, 2131.0, 593.0, 203.0, 95.0, 38.0, 21.0, 17.0, 14.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.2744140625, -23.423828125, -22.5732421875, -21.72265625, -20.8720703125, -20.021484375, -19.1708984375, -18.3203125, -17.4697265625, -16.619140625, -15.7685546875, -14.91796875, -14.0673828125, -13.216796875, -12.3662109375, -11.515625, -10.6650390625, -9.814453125, -8.9638671875, -8.11328125, -7.2626953125, -6.412109375, -5.5615234375, -4.7109375, -3.8603515625, -3.009765625, -2.1591796875, -1.30859375, -0.4580078125, 0.392578125, 1.2431640625, 2.09375, 2.9443359375, 3.794921875, 4.6455078125, 5.49609375, 6.3466796875, 7.197265625, 8.0478515625, 8.8984375, 9.7490234375, 10.599609375, 11.4501953125, 12.30078125, 13.1513671875, 14.001953125, 14.8525390625, 15.703125, 16.5537109375, 17.404296875, 18.2548828125, 19.10546875, 19.9560546875, 20.806640625, 21.6572265625, 22.5078125, 23.3583984375, 24.208984375, 25.0595703125, 25.91015625, 26.7607421875, 27.611328125, 28.4619140625, 29.3125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 12.0, 11.0, 14.0, 25.0, 24.0, 26.0, 43.0, 40.0, 67.0, 65.0, 76.0, 72.0, 85.0, 68.0, 76.0, 45.0, 58.0, 35.0, 36.0, 30.0, 22.0, 18.0, 17.0, 10.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.343563079833984, -21.508934020996094, -20.674304962158203, -19.839675903320312, -19.005046844482422, -18.17041778564453, -17.33578872680664, -16.50115966796875, -15.666529655456543, -14.831900596618652, -13.997271537780762, -13.162641525268555, -12.328012466430664, -11.493383407592773, -10.658754348754883, -9.824125289916992, -8.989496231079102, -8.154867172241211, -7.32023811340332, -6.4856085777282715, -5.650979518890381, -4.81635046005249, -3.9817209243774414, -3.147091865539551, -2.31246280670166, -1.47783362865448, -0.6432044506072998, 0.19142484664916992, 1.0260539054870605, 1.8606829643249512, 2.6953125, 3.5299415588378906, 4.364568710327148, 5.199197769165039, 6.03382682800293, 6.8684563636779785, 7.703085422515869, 8.537714004516602, 9.372344017028809, 10.2069730758667, 11.04160213470459, 11.87623119354248, 12.710860252380371, 13.545490264892578, 14.380119323730469, 15.21474838256836, 16.04937744140625, 16.88400650024414, 17.71863555908203, 18.553264617919922, 19.387893676757812, 20.222522735595703, 21.057151794433594, 21.891780853271484, 22.726409912109375, 23.561038970947266, 24.395668029785156, 25.230297088623047, 26.064926147460938, 26.899555206298828, 27.73418426513672, 28.56881332397461, 29.4034423828125, 30.23807144165039, 31.072702407836914]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 11.0, 8.0, 22.0, 23.0, 24.0, 23.0, 22.0, 21.0, 41.0, 42.0, 43.0, 41.0, 50.0, 46.0, 47.0, 48.0, 31.0, 32.0, 34.0, 40.0, 56.0, 31.0, 34.0, 39.0, 25.0, 27.0, 26.0, 14.0, 14.0, 18.0, 13.0, 11.0, 7.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.392478942871094, -23.57134246826172, -22.750207901000977, -21.929073333740234, -21.10793685913086, -20.286800384521484, -19.465665817260742, -18.64453125, -17.823394775390625, -17.00225830078125, -16.181123733520508, -15.35998821258545, -14.53885269165039, -13.717717170715332, -12.896581649780273, -12.075446128845215, -11.254310607910156, -10.433175086975098, -9.612039566040039, -8.79090404510498, -7.969768524169922, -7.148633003234863, -6.327497482299805, -5.506361961364746, -4.6852264404296875, -3.864090919494629, -3.0429553985595703, -2.2218198776245117, -1.4006843566894531, -0.5795488357543945, 0.24158668518066406, 1.0627222061157227, 1.8838558197021484, 2.704991340637207, 3.5261268615722656, 4.347262382507324, 5.168397903442383, 5.989533424377441, 6.8106689453125, 7.631804466247559, 8.452939987182617, 9.274075508117676, 10.095211029052734, 10.916346549987793, 11.737482070922852, 12.55861759185791, 13.379753112792969, 14.200888633728027, 15.022024154663086, 15.843159675598145, 16.664295196533203, 17.485431671142578, 18.30656623840332, 19.127700805664062, 19.948837280273438, 20.769973754882812, 21.591108322143555, 22.412242889404297, 23.233379364013672, 24.054515838623047, 24.87565040588379, 25.69678497314453, 26.517921447753906, 27.33905792236328, 28.160192489624023]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 14.0, 23.0, 24.0, 21.0, 33.0, 26.0, 45.0, 54.0, 49.0, 79.0, 44.0, 63.0, 61.0, 50.0, 58.0, 65.0, 50.0, 34.0, 36.0, 36.0, 26.0, 26.0, 17.0, 10.0, 11.0, 3.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.148162841796875, -4.02288818359375, -3.897613525390625, -3.7723388671875, -3.647064208984375, -3.52178955078125, -3.396514892578125, -3.271240234375, -3.145965576171875, -3.02069091796875, -2.895416259765625, -2.7701416015625, -2.644866943359375, -2.51959228515625, -2.394317626953125, -2.26904296875, -2.143768310546875, -2.01849365234375, -1.893218994140625, -1.7679443359375, -1.642669677734375, -1.51739501953125, -1.392120361328125, -1.266845703125, -1.141571044921875, -1.01629638671875, -0.891021728515625, -0.7657470703125, -0.640472412109375, -0.51519775390625, -0.389923095703125, -0.2646484375, -0.139373779296875, -0.01409912109375, 0.111175537109375, 0.2364501953125, 0.361724853515625, 0.48699951171875, 0.612274169921875, 0.737548828125, 0.862823486328125, 0.98809814453125, 1.113372802734375, 1.2386474609375, 1.363922119140625, 1.48919677734375, 1.614471435546875, 1.73974609375, 1.865020751953125, 1.99029541015625, 2.115570068359375, 2.2408447265625, 2.366119384765625, 2.49139404296875, 2.616668701171875, 2.741943359375, 2.867218017578125, 2.99249267578125, 3.117767333984375, 3.2430419921875, 3.368316650390625, 3.49359130859375, 3.618865966796875, 3.744140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 6.0, 9.0, 7.0, 12.0, 20.0, 31.0, 55.0, 73.0, 121.0, 153.0, 254.0, 444.0, 745.0, 1371.0, 2880.0, 6413.0, 15406.0, 38812.0, 96563.0, 203185.0, 287238.0, 215485.0, 105032.0, 43383.0, 17078.0, 7085.0, 3138.0, 1503.0, 764.0, 461.0, 289.0, 183.0, 109.0, 64.0, 42.0, 40.0, 23.0, 23.0, 8.0, 8.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7533187866210938, -0.7278289794921875, -0.7023391723632812, -0.676849365234375, -0.6513595581054688, -0.6258697509765625, -0.6003799438476562, -0.57489013671875, -0.5494003295898438, -0.5239105224609375, -0.49842071533203125, -0.472930908203125, -0.44744110107421875, -0.4219512939453125, -0.39646148681640625, -0.3709716796875, -0.34548187255859375, -0.3199920654296875, -0.29450225830078125, -0.269012451171875, -0.24352264404296875, -0.2180328369140625, -0.19254302978515625, -0.16705322265625, -0.14156341552734375, -0.1160736083984375, -0.09058380126953125, -0.065093994140625, -0.03960418701171875, -0.0141143798828125, 0.01137542724609375, 0.036865234375, 0.06235504150390625, 0.0878448486328125, 0.11333465576171875, 0.138824462890625, 0.16431427001953125, 0.1898040771484375, 0.21529388427734375, 0.24078369140625, 0.26627349853515625, 0.2917633056640625, 0.31725311279296875, 0.342742919921875, 0.36823272705078125, 0.3937225341796875, 0.41921234130859375, 0.4447021484375, 0.47019195556640625, 0.4956817626953125, 0.5211715698242188, 0.546661376953125, 0.5721511840820312, 0.5976409912109375, 0.6231307983398438, 0.64862060546875, 0.6741104125976562, 0.6996002197265625, 0.7250900268554688, 0.750579833984375, 0.7760696411132812, 0.8015594482421875, 0.8270492553710938, 0.8525390625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 19.0, 9.0, 13.0, 20.0, 25.0, 15.0, 20.0, 24.0, 25.0, 38.0, 40.0, 37.0, 44.0, 36.0, 45.0, 40.0, 40.0, 1056.0, 29.0, 41.0, 29.0, 30.0, 44.0, 27.0, 23.0, 32.0, 27.0, 36.0, 22.0, 17.0, 19.0, 12.0, 17.0, 11.0, 12.0, 10.0, 3.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.287109375, -2.2191162109375, -2.151123046875, -2.0831298828125, -2.01513671875, -1.9471435546875, -1.879150390625, -1.8111572265625, -1.7431640625, -1.6751708984375, -1.607177734375, -1.5391845703125, -1.47119140625, -1.4031982421875, -1.335205078125, -1.2672119140625, -1.19921875, -1.1312255859375, -1.063232421875, -0.9952392578125, -0.92724609375, -0.8592529296875, -0.791259765625, -0.7232666015625, -0.6552734375, -0.5872802734375, -0.519287109375, -0.4512939453125, -0.38330078125, -0.3153076171875, -0.247314453125, -0.1793212890625, -0.111328125, -0.0433349609375, 0.024658203125, 0.0926513671875, 0.16064453125, 0.2286376953125, 0.296630859375, 0.3646240234375, 0.4326171875, 0.5006103515625, 0.568603515625, 0.6365966796875, 0.70458984375, 0.7725830078125, 0.840576171875, 0.9085693359375, 0.9765625, 1.0445556640625, 1.112548828125, 1.1805419921875, 1.24853515625, 1.3165283203125, 1.384521484375, 1.4525146484375, 1.5205078125, 1.5885009765625, 1.656494140625, 1.7244873046875, 1.79248046875, 1.8604736328125, 1.928466796875, 1.9964599609375, 2.064453125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 16.0, 23.0, 21.0, 45.0, 66.0, 119.0, 207.0, 347.0, 574.0, 1142.0, 2180.0, 4638.0, 10142.0, 23285.0, 56352.0, 138269.0, 437986.0, 1078214.0, 202159.0, 81271.0, 33462.0, 14124.0, 6316.0, 3016.0, 1444.0, 715.0, 421.0, 248.0, 131.0, 63.0, 48.0, 24.0, 12.0, 11.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2676200866699219, -0.25740814208984375, -0.24719619750976562, -0.2369842529296875, -0.22677230834960938, -0.21656036376953125, -0.20634841918945312, -0.196136474609375, -0.18592453002929688, -0.17571258544921875, -0.16550064086914062, -0.1552886962890625, -0.14507675170898438, -0.13486480712890625, -0.12465286254882812, -0.11444091796875, -0.10422897338867188, -0.09401702880859375, -0.08380508422851562, -0.0735931396484375, -0.06338119506835938, -0.05316925048828125, -0.042957305908203125, -0.032745361328125, -0.022533416748046875, -0.01232147216796875, -0.002109527587890625, 0.0081024169921875, 0.018314361572265625, 0.02852630615234375, 0.038738250732421875, 0.0489501953125, 0.059162139892578125, 0.06937408447265625, 0.07958602905273438, 0.0897979736328125, 0.10000991821289062, 0.11022186279296875, 0.12043380737304688, 0.130645751953125, 0.14085769653320312, 0.15106964111328125, 0.16128158569335938, 0.1714935302734375, 0.18170547485351562, 0.19191741943359375, 0.20212936401367188, 0.21234130859375, 0.22255325317382812, 0.23276519775390625, 0.24297714233398438, 0.2531890869140625, 0.2634010314941406, 0.27361297607421875, 0.2838249206542969, 0.294036865234375, 0.3042488098144531, 0.31446075439453125, 0.3246726989746094, 0.3348846435546875, 0.3450965881347656, 0.35530853271484375, 0.3655204772949219, 0.375732421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 3.0, 4.0, 4.0, 6.0, 3.0, 11.0, 9.0, 17.0, 9.0, 13.0, 19.0, 26.0, 22.0, 28.0, 34.0, 42.0, 63.0, 59.0, 109.0, 87.0, 71.0, 63.0, 30.0, 41.0, 24.0, 22.0, 21.0, 16.0, 16.0, 15.0, 11.0, 7.0, 7.0, 15.0, 6.0, 8.0, 8.0, 6.0, 1.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.114990234375, -0.11139392852783203, -0.10779762268066406, -0.1042013168334961, -0.10060501098632812, -0.09700870513916016, -0.09341239929199219, -0.08981609344482422, -0.08621978759765625, -0.08262348175048828, -0.07902717590332031, -0.07543087005615234, -0.07183456420898438, -0.0682382583618164, -0.06464195251464844, -0.06104564666748047, -0.0574493408203125, -0.05385303497314453, -0.05025672912597656, -0.046660423278808594, -0.043064117431640625, -0.039467811584472656, -0.03587150573730469, -0.03227519989013672, -0.02867889404296875, -0.02508258819580078, -0.021486282348632812, -0.017889976501464844, -0.014293670654296875, -0.010697364807128906, -0.0071010589599609375, -0.0035047531127929688, 9.1552734375e-05, 0.0036878585815429688, 0.0072841644287109375, 0.010880470275878906, 0.014476776123046875, 0.018073081970214844, 0.021669387817382812, 0.02526569366455078, 0.02886199951171875, 0.03245830535888672, 0.03605461120605469, 0.039650917053222656, 0.043247222900390625, 0.046843528747558594, 0.05043983459472656, 0.05403614044189453, 0.0576324462890625, 0.06122875213623047, 0.06482505798339844, 0.0684213638305664, 0.07201766967773438, 0.07561397552490234, 0.07921028137207031, 0.08280658721923828, 0.08640289306640625, 0.08999919891357422, 0.09359550476074219, 0.09719181060791016, 0.10078811645507812, 0.1043844223022461, 0.10798072814941406, 0.11157703399658203, 0.11517333984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 13.0, 13.0, 18.0, 17.0, 17.0, 34.0, 43.0, 35.0, 60.0, 108.0, 131.0, 199.0, 318.0, 678.0, 5805.0, 319187.0, 712131.0, 7857.0, 785.0, 282.0, 187.0, 120.0, 106.0, 94.0, 59.0, 44.0, 36.0, 34.0, 24.0, 15.0, 8.0, 7.0, 6.0, 3.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.302734375, -2.233062744140625, -2.16339111328125, -2.093719482421875, -2.0240478515625, -1.954376220703125, -1.88470458984375, -1.815032958984375, -1.745361328125, -1.675689697265625, -1.60601806640625, -1.536346435546875, -1.4666748046875, -1.397003173828125, -1.32733154296875, -1.257659912109375, -1.18798828125, -1.118316650390625, -1.04864501953125, -0.978973388671875, -0.9093017578125, -0.839630126953125, -0.76995849609375, -0.700286865234375, -0.630615234375, -0.560943603515625, -0.49127197265625, -0.421600341796875, -0.3519287109375, -0.282257080078125, -0.21258544921875, -0.142913818359375, -0.0732421875, -0.003570556640625, 0.06610107421875, 0.135772705078125, 0.2054443359375, 0.275115966796875, 0.34478759765625, 0.414459228515625, 0.484130859375, 0.553802490234375, 0.62347412109375, 0.693145751953125, 0.7628173828125, 0.832489013671875, 0.90216064453125, 0.971832275390625, 1.04150390625, 1.111175537109375, 1.18084716796875, 1.250518798828125, 1.3201904296875, 1.389862060546875, 1.45953369140625, 1.529205322265625, 1.598876953125, 1.668548583984375, 1.73822021484375, 1.807891845703125, 1.8775634765625, 1.947235107421875, 2.01690673828125, 2.086578369140625, 2.15625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 12.0, 31.0, 69.0, 143.0, 323.0, 204.0, 116.0, 44.0, 21.0, 13.0, 6.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2542712688446045, -1.225589632987976, -1.1969079971313477, -1.1682263612747192, -1.1395447254180908, -1.1108630895614624, -1.082181453704834, -1.053499698638916, -1.0248181819915771, -0.9961365461349487, -0.9674549102783203, -0.9387732744216919, -0.9100916385650635, -0.8814100027084351, -0.8527283072471619, -0.8240466713905334, -0.7953649759292603, -0.7666833400726318, -0.7380017042160034, -0.709320068359375, -0.6806384325027466, -0.6519567966461182, -0.623275101184845, -0.5945934653282166, -0.5659118294715881, -0.5372301936149597, -0.5085485577583313, -0.4798668920993805, -0.4511852562427521, -0.42250362038612366, -0.39382195472717285, -0.36514031887054443, -0.3364587426185608, -0.3077771067619324, -0.27909547090530396, -0.25041380524635315, -0.22173216938972473, -0.1930505335330963, -0.1643688827753067, -0.1356872320175171, -0.10700559616088867, -0.07832395285367966, -0.04964230954647064, -0.020960666239261627, 0.007720977067947388, 0.036402612924575806, 0.06508426368236542, 0.09376591444015503, 0.12244755029678345, 0.15112918615341187, 0.17981083691120148, 0.2084924876689911, 0.2371741235256195, 0.2658557593822479, 0.29453742504119873, 0.32321906089782715, 0.35190069675445557, 0.380582332611084, 0.4092639684677124, 0.4379456341266632, 0.4666272699832916, 0.49530890583992004, 0.5239905714988708, 0.5526722073554993, 0.5813538432121277]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 6.0, 12.0, 6.0, 12.0, 12.0, 9.0, 15.0, 21.0, 23.0, 24.0, 25.0, 25.0, 33.0, 42.0, 28.0, 40.0, 42.0, 38.0, 35.0, 42.0, 33.0, 50.0, 49.0, 33.0, 30.0, 38.0, 34.0, 34.0, 25.0, 26.0, 23.0, 21.0, 21.0, 18.0, 9.0, 7.0, 8.0, 8.0, 5.0, 5.0, 7.0, 7.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.24104547500610352, -0.23351912200450897, -0.22599276900291443, -0.21846643090248108, -0.21094007790088654, -0.203413724899292, -0.19588738679885864, -0.1883610337972641, -0.18083468079566956, -0.173308327794075, -0.16578197479248047, -0.15825563669204712, -0.15072928369045258, -0.14320293068885803, -0.13567659258842468, -0.12815023958683014, -0.1206238865852356, -0.11309753358364105, -0.1055711880326271, -0.09804484248161316, -0.09051848948001862, -0.08299213647842407, -0.07546579092741013, -0.06793944537639618, -0.060413092374801636, -0.05288674309849739, -0.045360393822193146, -0.0378340445458889, -0.030307695269584656, -0.02278134599328041, -0.015254996716976166, -0.007728647440671921, -0.00020229816436767578, 0.007324051111936569, 0.014850400388240814, 0.02237674966454506, 0.029903098940849304, 0.03742944821715355, 0.044955797493457794, 0.05248214676976204, 0.060008496046066284, 0.06753484904766083, 0.07506119459867477, 0.08258754014968872, 0.09011389315128326, 0.09764024615287781, 0.10516659170389175, 0.1126929372549057, 0.12021929025650024, 0.1277456432580948, 0.13527199625968933, 0.14279833436012268, 0.15032468736171722, 0.15785104036331177, 0.16537737846374512, 0.17290373146533966, 0.1804300844669342, 0.18795643746852875, 0.1954827904701233, 0.20300912857055664, 0.21053548157215118, 0.21806183457374573, 0.22558817267417908, 0.23311452567577362, 0.24064087867736816]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 19.0, 18.0, 17.0, 28.0, 29.0, 41.0, 46.0, 46.0, 48.0, 63.0, 54.0, 57.0, 70.0, 46.0, 49.0, 49.0, 61.0, 39.0, 40.0, 29.0, 23.0, 20.0, 13.0, 20.0, 13.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.824005126953125, -3.70465087890625, -3.585296630859375, -3.4659423828125, -3.346588134765625, -3.22723388671875, -3.107879638671875, -2.988525390625, -2.869171142578125, -2.74981689453125, -2.630462646484375, -2.5111083984375, -2.391754150390625, -2.27239990234375, -2.153045654296875, -2.03369140625, -1.914337158203125, -1.79498291015625, -1.675628662109375, -1.5562744140625, -1.436920166015625, -1.31756591796875, -1.198211669921875, -1.078857421875, -0.959503173828125, -0.84014892578125, -0.720794677734375, -0.6014404296875, -0.482086181640625, -0.36273193359375, -0.243377685546875, -0.1240234375, -0.004669189453125, 0.11468505859375, 0.234039306640625, 0.3533935546875, 0.472747802734375, 0.59210205078125, 0.711456298828125, 0.830810546875, 0.950164794921875, 1.06951904296875, 1.188873291015625, 1.3082275390625, 1.427581787109375, 1.54693603515625, 1.666290283203125, 1.78564453125, 1.904998779296875, 2.02435302734375, 2.143707275390625, 2.2630615234375, 2.382415771484375, 2.50177001953125, 2.621124267578125, 2.740478515625, 2.859832763671875, 2.97918701171875, 3.098541259765625, 3.2178955078125, 3.337249755859375, 3.45660400390625, 3.575958251953125, 3.6953125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 4.0, 8.0, 14.0, 20.0, 38.0, 39.0, 83.0, 133.0, 173.0, 282.0, 421.0, 757.0, 1365.0, 2885.0, 6478.0, 16948.0, 49526.0, 196496.0, 537314.0, 164935.0, 43609.0, 15209.0, 5933.0, 2641.0, 1353.0, 750.0, 424.0, 255.0, 147.0, 113.0, 71.0, 42.0, 25.0, 18.0, 11.0, 5.0, 4.0, 7.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.935546875, -4.7734375, -4.611328125, -4.44921875, -4.287109375, -4.125, -3.962890625, -3.80078125, -3.638671875, -3.4765625, -3.314453125, -3.15234375, -2.990234375, -2.828125, -2.666015625, -2.50390625, -2.341796875, -2.1796875, -2.017578125, -1.85546875, -1.693359375, -1.53125, -1.369140625, -1.20703125, -1.044921875, -0.8828125, -0.720703125, -0.55859375, -0.396484375, -0.234375, -0.072265625, 0.08984375, 0.251953125, 0.4140625, 0.576171875, 0.73828125, 0.900390625, 1.0625, 1.224609375, 1.38671875, 1.548828125, 1.7109375, 1.873046875, 2.03515625, 2.197265625, 2.359375, 2.521484375, 2.68359375, 2.845703125, 3.0078125, 3.169921875, 3.33203125, 3.494140625, 3.65625, 3.818359375, 3.98046875, 4.142578125, 4.3046875, 4.466796875, 4.62890625, 4.791015625, 4.953125, 5.115234375, 5.27734375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 6.0, 8.0, 5.0, 9.0, 6.0, 6.0, 9.0, 15.0, 9.0, 25.0, 23.0, 22.0, 19.0, 27.0, 42.0, 37.0, 58.0, 36.0, 55.0, 75.0, 153.0, 352.0, 1409.0, 165.0, 86.0, 54.0, 36.0, 43.0, 32.0, 30.0, 32.0, 34.0, 23.0, 15.0, 15.0, 13.0, 16.0, 10.0, 7.0, 9.0, 4.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.0228271484375, -8.701904296875, -8.3809814453125, -8.06005859375, -7.7391357421875, -7.418212890625, -7.0972900390625, -6.7763671875, -6.4554443359375, -6.134521484375, -5.8135986328125, -5.49267578125, -5.1717529296875, -4.850830078125, -4.5299072265625, -4.208984375, -3.8880615234375, -3.567138671875, -3.2462158203125, -2.92529296875, -2.6043701171875, -2.283447265625, -1.9625244140625, -1.6416015625, -1.3206787109375, -0.999755859375, -0.6788330078125, -0.35791015625, -0.0369873046875, 0.283935546875, 0.6048583984375, 0.92578125, 1.2467041015625, 1.567626953125, 1.8885498046875, 2.20947265625, 2.5303955078125, 2.851318359375, 3.1722412109375, 3.4931640625, 3.8140869140625, 4.135009765625, 4.4559326171875, 4.77685546875, 5.0977783203125, 5.418701171875, 5.7396240234375, 6.060546875, 6.3814697265625, 6.702392578125, 7.0233154296875, 7.34423828125, 7.6651611328125, 7.986083984375, 8.3070068359375, 8.6279296875, 8.9488525390625, 9.269775390625, 9.5906982421875, 9.91162109375, 10.2325439453125, 10.553466796875, 10.8743896484375, 11.1953125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 10.0, 11.0, 16.0, 15.0, 21.0, 26.0, 33.0, 47.0, 66.0, 78.0, 110.0, 158.0, 216.0, 408.0, 1172.0, 5980.0, 143369.0, 2921172.0, 66408.0, 4326.0, 859.0, 375.0, 222.0, 140.0, 106.0, 86.0, 56.0, 51.0, 26.0, 21.0, 25.0, 14.0, 21.0, 12.0, 10.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.296875, -19.650634765625, -19.00439453125, -18.358154296875, -17.7119140625, -17.065673828125, -16.41943359375, -15.773193359375, -15.126953125, -14.480712890625, -13.83447265625, -13.188232421875, -12.5419921875, -11.895751953125, -11.24951171875, -10.603271484375, -9.95703125, -9.310791015625, -8.66455078125, -8.018310546875, -7.3720703125, -6.725830078125, -6.07958984375, -5.433349609375, -4.787109375, -4.140869140625, -3.49462890625, -2.848388671875, -2.2021484375, -1.555908203125, -0.90966796875, -0.263427734375, 0.3828125, 1.029052734375, 1.67529296875, 2.321533203125, 2.9677734375, 3.614013671875, 4.26025390625, 4.906494140625, 5.552734375, 6.198974609375, 6.84521484375, 7.491455078125, 8.1376953125, 8.783935546875, 9.43017578125, 10.076416015625, 10.72265625, 11.368896484375, 12.01513671875, 12.661376953125, 13.3076171875, 13.953857421875, 14.60009765625, 15.246337890625, 15.892578125, 16.538818359375, 17.18505859375, 17.831298828125, 18.4775390625, 19.123779296875, 19.77001953125, 20.416259765625, 21.0625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 35.0, 906.0, 77.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.082046508789062, -20.21932029724121, -12.35659408569336, -4.493867874145508, 3.3688583374023438, 11.231582641601562, 19.094310760498047, 26.95703887939453, 34.81976318359375, 42.68248748779297, 50.54521560668945, 58.40794372558594, 66.27066802978516, 74.13339233398438, 81.99612426757812, 89.85884857177734, 97.72157287597656, 105.58429718017578, 113.447021484375, 121.30975341796875, 129.1724853515625, 137.0352020263672, 144.89793395996094, 152.76065063476562, 160.62338256835938, 168.48611450195312, 176.3488311767578, 184.21156311035156, 192.07427978515625, 199.93701171875, 207.79974365234375, 215.6624755859375, 223.52520751953125, 231.387939453125, 239.2506561279297, 247.11338806152344, 254.97610473632812, 262.8388366699219, 270.7015686035156, 278.5643005371094, 286.427001953125, 294.28973388671875, 302.1524658203125, 310.0151672363281, 317.8778991699219, 325.7406311035156, 333.6033630371094, 341.4660949707031, 349.3288269042969, 357.1915588378906, 365.0542907714844, 372.9169921875, 380.77972412109375, 388.6424560546875, 396.50518798828125, 404.367919921875, 412.23065185546875, 420.0933837890625, 427.95611572265625, 435.8188171386719, 443.6815490722656, 451.5442810058594, 459.4070129394531, 467.2697448730469, 475.1324462890625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 0.0, 5.0, 10.0, 11.0, 4.0, 9.0, 18.0, 16.0, 17.0, 13.0, 22.0, 22.0, 31.0, 40.0, 36.0, 40.0, 35.0, 34.0, 33.0, 41.0, 40.0, 45.0, 48.0, 26.0, 35.0, 29.0, 31.0, 41.0, 37.0, 26.0, 21.0, 25.0, 27.0, 24.0, 20.0, 16.0, 13.0, 8.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0], "bins": [-31.852333068847656, -30.959306716918945, -30.066280364990234, -29.173254013061523, -28.280227661132812, -27.3872013092041, -26.49417495727539, -25.601146697998047, -24.70812225341797, -23.815095901489258, -22.922069549560547, -22.029043197631836, -21.136016845703125, -20.242990493774414, -19.349964141845703, -18.45693588256836, -17.56390953063965, -16.670883178710938, -15.777856826782227, -14.884830474853516, -13.991804122924805, -13.098777770996094, -12.205750465393066, -11.312724113464355, -10.419697761535645, -9.526671409606934, -8.633645057678223, -7.7406182289123535, -6.847591876983643, -5.954565525054932, -5.0615386962890625, -4.168512344360352, -3.275484085083008, -2.382457733154297, -1.4894311428070068, -0.5964045524597168, 0.29662179946899414, 1.189648151397705, 2.082674980163574, 2.975701332092285, 3.868727684020996, 4.761754035949707, 5.654780387878418, 6.547807216644287, 7.440833568572998, 8.333860397338867, 9.226886749267578, 10.119913101196289, 11.012939453125, 11.905965805053711, 12.798992156982422, 13.692018508911133, 14.585044860839844, 15.478071212768555, 16.371097564697266, 17.26412582397461, 18.157150268554688, 19.0501766204834, 19.94320297241211, 20.83622932434082, 21.72925567626953, 22.622282028198242, 23.515308380126953, 24.408336639404297, 25.301362991333008]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 10.0, 13.0, 14.0, 21.0, 21.0, 31.0, 28.0, 28.0, 38.0, 44.0, 55.0, 48.0, 46.0, 59.0, 51.0, 61.0, 48.0, 49.0, 49.0, 44.0, 35.0, 40.0, 33.0, 28.0, 18.0, 13.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.1722412109375, -4.047607421875, -3.9229736328125, -3.79833984375, -3.6737060546875, -3.549072265625, -3.4244384765625, -3.2998046875, -3.1751708984375, -3.050537109375, -2.9259033203125, -2.80126953125, -2.6766357421875, -2.552001953125, -2.4273681640625, -2.302734375, -2.1781005859375, -2.053466796875, -1.9288330078125, -1.80419921875, -1.6795654296875, -1.554931640625, -1.4302978515625, -1.3056640625, -1.1810302734375, -1.056396484375, -0.9317626953125, -0.80712890625, -0.6824951171875, -0.557861328125, -0.4332275390625, -0.30859375, -0.1839599609375, -0.059326171875, 0.0653076171875, 0.18994140625, 0.3145751953125, 0.439208984375, 0.5638427734375, 0.6884765625, 0.8131103515625, 0.937744140625, 1.0623779296875, 1.18701171875, 1.3116455078125, 1.436279296875, 1.5609130859375, 1.685546875, 1.8101806640625, 1.934814453125, 2.0594482421875, 2.18408203125, 2.3087158203125, 2.433349609375, 2.5579833984375, 2.6826171875, 2.8072509765625, 2.931884765625, 3.0565185546875, 3.18115234375, 3.3057861328125, 3.430419921875, 3.5550537109375, 3.6796875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 1.0, 3.0, 4.0, 3.0, 8.0, 28.0, 24.0, 42.0, 32.0, 67.0, 98.0, 182.0, 280.0, 401.0, 762.0, 1629.0, 3414.0, 10033.0, 47516.0, 748811.0, 3026825.0, 312073.0, 28986.0, 7429.0, 2820.0, 1257.0, 599.0, 371.0, 209.0, 145.0, 75.0, 47.0, 42.0, 25.0, 13.0, 10.0, 10.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4921875, -11.15771484375, -10.8232421875, -10.48876953125, -10.154296875, -9.81982421875, -9.4853515625, -9.15087890625, -8.81640625, -8.48193359375, -8.1474609375, -7.81298828125, -7.478515625, -7.14404296875, -6.8095703125, -6.47509765625, -6.140625, -5.80615234375, -5.4716796875, -5.13720703125, -4.802734375, -4.46826171875, -4.1337890625, -3.79931640625, -3.46484375, -3.13037109375, -2.7958984375, -2.46142578125, -2.126953125, -1.79248046875, -1.4580078125, -1.12353515625, -0.7890625, -0.45458984375, -0.1201171875, 0.21435546875, 0.548828125, 0.88330078125, 1.2177734375, 1.55224609375, 1.88671875, 2.22119140625, 2.5556640625, 2.89013671875, 3.224609375, 3.55908203125, 3.8935546875, 4.22802734375, 4.5625, 4.89697265625, 5.2314453125, 5.56591796875, 5.900390625, 6.23486328125, 6.5693359375, 6.90380859375, 7.23828125, 7.57275390625, 7.9072265625, 8.24169921875, 8.576171875, 8.91064453125, 9.2451171875, 9.57958984375, 9.9140625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 8.0, 4.0, 12.0, 18.0, 20.0, 32.0, 47.0, 69.0, 76.0, 119.0, 162.0, 216.0, 292.0, 441.0, 503.0, 513.0, 407.0, 328.0, 246.0, 151.0, 101.0, 67.0, 54.0, 50.0, 36.0, 24.0, 5.0, 11.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.5615234375, -6.318359375, -6.0751953125, -5.83203125, -5.5888671875, -5.345703125, -5.1025390625, -4.859375, -4.6162109375, -4.373046875, -4.1298828125, -3.88671875, -3.6435546875, -3.400390625, -3.1572265625, -2.9140625, -2.6708984375, -2.427734375, -2.1845703125, -1.94140625, -1.6982421875, -1.455078125, -1.2119140625, -0.96875, -0.7255859375, -0.482421875, -0.2392578125, 0.00390625, 0.2470703125, 0.490234375, 0.7333984375, 0.9765625, 1.2197265625, 1.462890625, 1.7060546875, 1.94921875, 2.1923828125, 2.435546875, 2.6787109375, 2.921875, 3.1650390625, 3.408203125, 3.6513671875, 3.89453125, 4.1376953125, 4.380859375, 4.6240234375, 4.8671875, 5.1103515625, 5.353515625, 5.5966796875, 5.83984375, 6.0830078125, 6.326171875, 6.5693359375, 6.8125, 7.0556640625, 7.298828125, 7.5419921875, 7.78515625, 8.0283203125, 8.271484375, 8.5146484375, 8.7578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 6.0, 20.0, 19.0, 28.0, 41.0, 78.0, 117.0, 218.0, 415.0, 744.0, 1400.0, 2950.0, 7063.0, 20160.0, 98299.0, 1009100.0, 2655991.0, 332225.0, 44029.0, 12109.0, 4686.0, 2142.0, 1096.0, 546.0, 309.0, 181.0, 107.0, 68.0, 30.0, 21.0, 26.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-14.8203125, -14.4227294921875, -14.025146484375, -13.6275634765625, -13.22998046875, -12.8323974609375, -12.434814453125, -12.0372314453125, -11.6396484375, -11.2420654296875, -10.844482421875, -10.4468994140625, -10.04931640625, -9.6517333984375, -9.254150390625, -8.8565673828125, -8.458984375, -8.0614013671875, -7.663818359375, -7.2662353515625, -6.86865234375, -6.4710693359375, -6.073486328125, -5.6759033203125, -5.2783203125, -4.8807373046875, -4.483154296875, -4.0855712890625, -3.68798828125, -3.2904052734375, -2.892822265625, -2.4952392578125, -2.09765625, -1.7000732421875, -1.302490234375, -0.9049072265625, -0.50732421875, -0.1097412109375, 0.287841796875, 0.6854248046875, 1.0830078125, 1.4805908203125, 1.878173828125, 2.2757568359375, 2.67333984375, 3.0709228515625, 3.468505859375, 3.8660888671875, 4.263671875, 4.6612548828125, 5.058837890625, 5.4564208984375, 5.85400390625, 6.2515869140625, 6.649169921875, 7.0467529296875, 7.4443359375, 7.8419189453125, 8.239501953125, 8.6370849609375, 9.03466796875, 9.4322509765625, 9.829833984375, 10.2274169921875, 10.625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 15.0, 35.0, 69.0, 157.0, 187.0, 202.0, 178.0, 84.0, 43.0, 21.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.77940368652344, -91.38491821289062, -88.99043273925781, -86.595947265625, -84.20146179199219, -81.80697631835938, -79.41249084472656, -77.01800537109375, -74.62351989746094, -72.22903442382812, -69.83454895019531, -67.4400634765625, -65.04557800292969, -62.651092529296875, -60.25660705566406, -57.86212158203125, -55.46763229370117, -53.07314682006836, -50.67866134643555, -48.284175872802734, -45.88969039916992, -43.49520492553711, -41.10071563720703, -38.70623016357422, -36.311744689941406, -33.917259216308594, -31.52277374267578, -29.12828826904297, -26.733802795410156, -24.339317321777344, -21.9448299407959, -19.550344467163086, -17.155860900878906, -14.761375427246094, -12.366889953613281, -9.972403526306152, -7.57791805267334, -5.183432579040527, -2.7889461517333984, -0.39446067810058594, 2.0000247955322266, 4.394510269165039, 6.78899621963501, 9.18348217010498, 11.577967643737793, 13.972453117370605, 16.366939544677734, 18.761425018310547, 21.15591049194336, 23.550395965576172, 25.944881439208984, 28.339366912841797, 30.73385238647461, 33.12833786010742, 35.5228271484375, 37.91731262207031, 40.311798095703125, 42.70628356933594, 45.10076904296875, 47.49525451660156, 49.889739990234375, 52.28422546386719, 54.6787109375, 57.07319641113281, 59.467681884765625]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 11.0, 17.0, 24.0, 23.0, 31.0, 24.0, 28.0, 35.0, 48.0, 39.0, 50.0, 43.0, 50.0, 57.0, 45.0, 41.0, 54.0, 46.0, 43.0, 29.0, 36.0, 26.0, 24.0, 24.0, 21.0, 16.0, 20.0, 9.0, 8.0, 8.0, 6.0, 7.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.270343780517578, -24.410444259643555, -23.55054473876953, -22.690645217895508, -21.830745697021484, -20.970844268798828, -20.110946655273438, -19.25104522705078, -18.391145706176758, -17.531246185302734, -16.67134666442871, -15.811447143554688, -14.951546669006348, -14.091647148132324, -13.2317476272583, -12.371847152709961, -11.511948585510254, -10.65204906463623, -9.792149543762207, -8.932249069213867, -8.072349548339844, -7.21245002746582, -6.352550506591797, -5.492650508880615, -4.632750988006592, -3.7728512287139893, -2.9129514694213867, -2.0530519485473633, -1.1931521892547607, -0.3332524299621582, 0.5266470909118652, 1.3865470886230469, 2.2464466094970703, 3.106346368789673, 3.9662461280822754, 4.826145648956299, 5.6860456466674805, 6.545945167541504, 7.405844688415527, 8.265745162963867, 9.12564468383789, 9.985544204711914, 10.845443725585938, 11.705343246459961, 12.5652437210083, 13.425143241882324, 14.285042762756348, 15.144943237304688, 16.004840850830078, 16.8647403717041, 17.724639892578125, 18.58453941345215, 19.444438934326172, 20.304340362548828, 21.16423797607422, 22.024139404296875, 22.8840389251709, 23.743938446044922, 24.603837966918945, 25.46373748779297, 26.323637008666992, 27.183536529541016, 28.043437957763672, 28.903337478637695, 29.76323699951172]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 10.0, 13.0, 5.0, 8.0, 15.0, 16.0, 19.0, 33.0, 40.0, 40.0, 47.0, 54.0, 49.0, 56.0, 45.0, 45.0, 48.0, 42.0, 56.0, 52.0, 41.0, 50.0, 31.0, 28.0, 23.0, 27.0, 20.0, 12.0, 20.0, 16.0, 11.0, 6.0, 7.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.705474853515625, -3.58673095703125, -3.467987060546875, -3.3492431640625, -3.230499267578125, -3.11175537109375, -2.993011474609375, -2.874267578125, -2.755523681640625, -2.63677978515625, -2.518035888671875, -2.3992919921875, -2.280548095703125, -2.16180419921875, -2.043060302734375, -1.92431640625, -1.805572509765625, -1.68682861328125, -1.568084716796875, -1.4493408203125, -1.330596923828125, -1.21185302734375, -1.093109130859375, -0.974365234375, -0.855621337890625, -0.73687744140625, -0.618133544921875, -0.4993896484375, -0.380645751953125, -0.26190185546875, -0.143157958984375, -0.0244140625, 0.094329833984375, 0.21307373046875, 0.331817626953125, 0.4505615234375, 0.569305419921875, 0.68804931640625, 0.806793212890625, 0.925537109375, 1.044281005859375, 1.16302490234375, 1.281768798828125, 1.4005126953125, 1.519256591796875, 1.63800048828125, 1.756744384765625, 1.87548828125, 1.994232177734375, 2.11297607421875, 2.231719970703125, 2.3504638671875, 2.469207763671875, 2.58795166015625, 2.706695556640625, 2.825439453125, 2.944183349609375, 3.06292724609375, 3.181671142578125, 3.3004150390625, 3.419158935546875, 3.53790283203125, 3.656646728515625, 3.775390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 13.0, 21.0, 37.0, 51.0, 45.0, 72.0, 119.0, 172.0, 247.0, 348.0, 567.0, 766.0, 1236.0, 2104.0, 4180.0, 11433.0, 42297.0, 170019.0, 415390.0, 285971.0, 80068.0, 19748.0, 6271.0, 2818.0, 1512.0, 944.0, 663.0, 445.0, 306.0, 222.0, 147.0, 83.0, 52.0, 54.0, 36.0, 25.0, 19.0, 8.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2353515625, -1.1951446533203125, -1.154937744140625, -1.1147308349609375, -1.07452392578125, -1.0343170166015625, -0.994110107421875, -0.9539031982421875, -0.9136962890625, -0.8734893798828125, -0.833282470703125, -0.7930755615234375, -0.75286865234375, -0.7126617431640625, -0.672454833984375, -0.6322479248046875, -0.592041015625, -0.5518341064453125, -0.511627197265625, -0.4714202880859375, -0.43121337890625, -0.3910064697265625, -0.350799560546875, -0.3105926513671875, -0.2703857421875, -0.2301788330078125, -0.189971923828125, -0.1497650146484375, -0.10955810546875, -0.0693511962890625, -0.029144287109375, 0.0110626220703125, 0.05126953125, 0.0914764404296875, 0.131683349609375, 0.1718902587890625, 0.21209716796875, 0.2523040771484375, 0.292510986328125, 0.3327178955078125, 0.3729248046875, 0.4131317138671875, 0.453338623046875, 0.4935455322265625, 0.53375244140625, 0.5739593505859375, 0.614166259765625, 0.6543731689453125, 0.694580078125, 0.7347869873046875, 0.774993896484375, 0.8152008056640625, 0.85540771484375, 0.8956146240234375, 0.935821533203125, 0.9760284423828125, 1.0162353515625, 1.0564422607421875, 1.096649169921875, 1.1368560791015625, 1.17706298828125, 1.2172698974609375, 1.257476806640625, 1.2976837158203125, 1.337890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 14.0, 13.0, 18.0, 13.0, 13.0, 24.0, 19.0, 24.0, 36.0, 21.0, 39.0, 20.0, 30.0, 33.0, 33.0, 32.0, 39.0, 41.0, 1068.0, 36.0, 38.0, 35.0, 36.0, 34.0, 27.0, 35.0, 29.0, 27.0, 21.0, 19.0, 23.0, 10.0, 21.0, 8.0, 11.0, 15.0, 8.0, 12.0, 9.0, 7.0, 2.0, 2.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4140625, -2.33709716796875, -2.2601318359375, -2.18316650390625, -2.106201171875, -2.02923583984375, -1.9522705078125, -1.87530517578125, -1.79833984375, -1.72137451171875, -1.6444091796875, -1.56744384765625, -1.490478515625, -1.41351318359375, -1.3365478515625, -1.25958251953125, -1.1826171875, -1.10565185546875, -1.0286865234375, -0.95172119140625, -0.874755859375, -0.79779052734375, -0.7208251953125, -0.64385986328125, -0.56689453125, -0.48992919921875, -0.4129638671875, -0.33599853515625, -0.259033203125, -0.18206787109375, -0.1051025390625, -0.02813720703125, 0.048828125, 0.12579345703125, 0.2027587890625, 0.27972412109375, 0.356689453125, 0.43365478515625, 0.5106201171875, 0.58758544921875, 0.66455078125, 0.74151611328125, 0.8184814453125, 0.89544677734375, 0.972412109375, 1.04937744140625, 1.1263427734375, 1.20330810546875, 1.2802734375, 1.35723876953125, 1.4342041015625, 1.51116943359375, 1.588134765625, 1.66510009765625, 1.7420654296875, 1.81903076171875, 1.89599609375, 1.97296142578125, 2.0499267578125, 2.12689208984375, 2.203857421875, 2.28082275390625, 2.3577880859375, 2.43475341796875, 2.51171875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 0.0, 3.0, 6.0, 15.0, 13.0, 36.0, 29.0, 65.0, 100.0, 142.0, 270.0, 457.0, 878.0, 2023.0, 4995.0, 16808.0, 78892.0, 548568.0, 1301834.0, 109347.0, 21722.0, 6219.0, 2406.0, 1049.0, 514.0, 266.0, 173.0, 98.0, 52.0, 36.0, 36.0, 20.0, 16.0, 10.0, 9.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67822265625, -0.6577301025390625, -0.637237548828125, -0.6167449951171875, -0.59625244140625, -0.5757598876953125, -0.555267333984375, -0.5347747802734375, -0.5142822265625, -0.4937896728515625, -0.473297119140625, -0.4528045654296875, -0.43231201171875, -0.4118194580078125, -0.391326904296875, -0.3708343505859375, -0.350341796875, -0.3298492431640625, -0.309356689453125, -0.2888641357421875, -0.26837158203125, -0.2478790283203125, -0.227386474609375, -0.2068939208984375, -0.1864013671875, -0.1659088134765625, -0.145416259765625, -0.1249237060546875, -0.10443115234375, -0.0839385986328125, -0.063446044921875, -0.0429534912109375, -0.0224609375, -0.0019683837890625, 0.018524169921875, 0.0390167236328125, 0.05950927734375, 0.0800018310546875, 0.100494384765625, 0.1209869384765625, 0.1414794921875, 0.1619720458984375, 0.182464599609375, 0.2029571533203125, 0.22344970703125, 0.2439422607421875, 0.264434814453125, 0.2849273681640625, 0.305419921875, 0.3259124755859375, 0.346405029296875, 0.3668975830078125, 0.38739013671875, 0.4078826904296875, 0.428375244140625, 0.4488677978515625, 0.4693603515625, 0.4898529052734375, 0.510345458984375, 0.5308380126953125, 0.55133056640625, 0.5718231201171875, 0.592315673828125, 0.6128082275390625, 0.63330078125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 9.0, 14.0, 29.0, 33.0, 49.0, 56.0, 88.0, 148.0, 173.0, 110.0, 69.0, 54.0, 30.0, 40.0, 21.0, 11.0, 6.0, 12.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.1748809814453125, -0.169464111328125, -0.1640472412109375, -0.15863037109375, -0.1532135009765625, -0.147796630859375, -0.1423797607421875, -0.136962890625, -0.1315460205078125, -0.126129150390625, -0.1207122802734375, -0.11529541015625, -0.1098785400390625, -0.104461669921875, -0.0990447998046875, -0.0936279296875, -0.0882110595703125, -0.082794189453125, -0.0773773193359375, -0.07196044921875, -0.0665435791015625, -0.061126708984375, -0.0557098388671875, -0.05029296875, -0.0448760986328125, -0.039459228515625, -0.0340423583984375, -0.02862548828125, -0.0232086181640625, -0.017791748046875, -0.0123748779296875, -0.0069580078125, -0.0015411376953125, 0.003875732421875, 0.0092926025390625, 0.01470947265625, 0.0201263427734375, 0.025543212890625, 0.0309600830078125, 0.036376953125, 0.0417938232421875, 0.047210693359375, 0.0526275634765625, 0.05804443359375, 0.0634613037109375, 0.068878173828125, 0.0742950439453125, 0.0797119140625, 0.0851287841796875, 0.090545654296875, 0.0959625244140625, 0.10137939453125, 0.1067962646484375, 0.112213134765625, 0.1176300048828125, 0.123046875, 0.1284637451171875, 0.133880615234375, 0.1392974853515625, 0.14471435546875, 0.1501312255859375, 0.155548095703125, 0.1609649658203125, 0.1663818359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 6.0, 16.0, 16.0, 34.0, 45.0, 60.0, 97.0, 184.0, 474.0, 5764.0, 1013081.0, 27320.0, 845.0, 230.0, 137.0, 81.0, 47.0, 35.0, 26.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40234375, -3.291412353515625, -3.18048095703125, -3.069549560546875, -2.9586181640625, -2.847686767578125, -2.73675537109375, -2.625823974609375, -2.514892578125, -2.403961181640625, -2.29302978515625, -2.182098388671875, -2.0711669921875, -1.960235595703125, -1.84930419921875, -1.738372802734375, -1.62744140625, -1.516510009765625, -1.40557861328125, -1.294647216796875, -1.1837158203125, -1.072784423828125, -0.96185302734375, -0.850921630859375, -0.739990234375, -0.629058837890625, -0.51812744140625, -0.407196044921875, -0.2962646484375, -0.185333251953125, -0.07440185546875, 0.036529541015625, 0.1474609375, 0.258392333984375, 0.36932373046875, 0.480255126953125, 0.5911865234375, 0.702117919921875, 0.81304931640625, 0.923980712890625, 1.034912109375, 1.145843505859375, 1.25677490234375, 1.367706298828125, 1.4786376953125, 1.589569091796875, 1.70050048828125, 1.811431884765625, 1.92236328125, 2.033294677734375, 2.14422607421875, 2.255157470703125, 2.3660888671875, 2.477020263671875, 2.58795166015625, 2.698883056640625, 2.809814453125, 2.920745849609375, 3.03167724609375, 3.142608642578125, 3.2535400390625, 3.364471435546875, 3.47540283203125, 3.586334228515625, 3.697265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 17.0, 71.0, 253.0, 425.0, 146.0, 45.0, 23.0, 14.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808662414550781, -1.641090989112854, -1.6013158559799194, -1.5615406036376953, -1.5217654705047607, -1.4819902181625366, -1.4422149658203125, -1.402439832687378, -1.3626645803451538, -1.3228893280029297, -1.2831141948699951, -1.243338942527771, -1.2035638093948364, -1.1637885570526123, -1.1240134239196777, -1.0842381715774536, -1.0444629192352295, -1.0046876668930054, -0.9649125337600708, -0.9251372814178467, -0.8853620886802673, -0.845586895942688, -0.8058117032051086, -0.7660365104675293, -0.7262613773345947, -0.6864861845970154, -0.646710991859436, -0.6069357395172119, -0.5671605467796326, -0.5273853540420532, -0.4876101613044739, -0.44783493876457214, -0.4080597162246704, -0.36828452348709106, -0.32850930094718933, -0.28873410820961, -0.24895890057086945, -0.2091836929321289, -0.16940850019454956, -0.12963327765464783, -0.08985808491706848, -0.05008288100361824, -0.010307677090168, 0.029467523097991943, 0.06924273073673248, 0.10901793837547302, 0.14879313111305237, 0.1885683536529541, 0.22834354639053345, 0.2681187391281128, 0.3078939616680145, 0.34766915440559387, 0.3874443769454956, 0.42721956968307495, 0.4669947624206543, 0.5067700147628784, 0.546545147895813, 0.5863203406333923, 0.6260955333709717, 0.6658707857131958, 0.7056459784507751, 0.7454211711883545, 0.7851963639259338, 0.8249715566635132, 0.8647468090057373]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 8.0, 9.0, 7.0, 21.0, 17.0, 14.0, 28.0, 22.0, 31.0, 31.0, 24.0, 35.0, 40.0, 33.0, 50.0, 37.0, 27.0, 42.0, 38.0, 38.0, 34.0, 41.0, 27.0, 35.0, 34.0, 31.0, 28.0, 38.0, 23.0, 29.0, 26.0, 11.0, 8.0, 11.0, 8.0, 10.0, 12.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.30903446674346924, -0.2998024821281433, -0.29057052731513977, -0.28133854269981384, -0.2721065878868103, -0.2628746032714844, -0.25364261865615845, -0.2444106638431549, -0.23517867922782898, -0.22594670951366425, -0.2167147397994995, -0.20748275518417358, -0.19825078547000885, -0.18901881575584412, -0.17978684604167938, -0.17055487632751465, -0.16132290661334991, -0.15209093689918518, -0.14285896718502045, -0.1336269974708557, -0.12439501285552979, -0.11516304314136505, -0.10593107342720032, -0.09669909626245499, -0.08746712654829025, -0.07823515683412552, -0.06900317966938019, -0.059771209955215454, -0.05053923651576042, -0.04130726307630539, -0.032075293362140656, -0.022843316197395325, -0.01361134648323059, -0.004379373975098133, 0.004852598533034325, 0.014084570109844208, 0.02331654354929924, 0.03254851698875427, 0.041780486702919006, 0.05101246386766434, 0.06024443358182907, 0.0694764032959938, 0.07870838046073914, 0.08794035017490387, 0.0971723198890686, 0.10640429705381393, 0.11563626676797867, 0.124868243932724, 0.13410021364688873, 0.14333218336105347, 0.1525641530752182, 0.16179612278938293, 0.17102810740470886, 0.1802600771188736, 0.18949204683303833, 0.19872403144836426, 0.2079559862613678, 0.21718795597553253, 0.22641992568969727, 0.2356519103050232, 0.24488388001918793, 0.25411584973335266, 0.2633478045463562, 0.27257978916168213, 0.28181177377700806]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 14.0, 7.0, 12.0, 20.0, 21.0, 34.0, 37.0, 40.0, 41.0, 46.0, 29.0, 42.0, 51.0, 52.0, 51.0, 59.0, 55.0, 39.0, 35.0, 34.0, 48.0, 33.0, 27.0, 25.0, 24.0, 21.0, 18.0, 12.0, 12.0, 11.0, 5.0, 5.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.421875, -3.30584716796875, -3.1898193359375, -3.07379150390625, -2.957763671875, -2.84173583984375, -2.7257080078125, -2.60968017578125, -2.49365234375, -2.37762451171875, -2.2615966796875, -2.14556884765625, -2.029541015625, -1.91351318359375, -1.7974853515625, -1.68145751953125, -1.5654296875, -1.44940185546875, -1.3333740234375, -1.21734619140625, -1.101318359375, -0.98529052734375, -0.8692626953125, -0.75323486328125, -0.63720703125, -0.52117919921875, -0.4051513671875, -0.28912353515625, -0.173095703125, -0.05706787109375, 0.0589599609375, 0.17498779296875, 0.291015625, 0.40704345703125, 0.5230712890625, 0.63909912109375, 0.755126953125, 0.87115478515625, 0.9871826171875, 1.10321044921875, 1.21923828125, 1.33526611328125, 1.4512939453125, 1.56732177734375, 1.683349609375, 1.79937744140625, 1.9154052734375, 2.03143310546875, 2.1474609375, 2.26348876953125, 2.3795166015625, 2.49554443359375, 2.611572265625, 2.72760009765625, 2.8436279296875, 2.95965576171875, 3.07568359375, 3.19171142578125, 3.3077392578125, 3.42376708984375, 3.539794921875, 3.65582275390625, 3.7718505859375, 3.88787841796875, 4.00390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 11.0, 21.0, 24.0, 23.0, 36.0, 50.0, 89.0, 144.0, 182.0, 291.0, 403.0, 700.0, 1059.0, 1888.0, 3395.0, 6894.0, 14255.0, 32318.0, 73480.0, 171491.0, 334688.0, 226567.0, 99367.0, 42805.0, 19047.0, 8919.0, 4372.0, 2364.0, 1381.0, 808.0, 509.0, 342.0, 197.0, 122.0, 94.0, 63.0, 50.0, 31.0, 20.0, 12.0, 11.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.651275634765625, -3.51934814453125, -3.387420654296875, -3.2554931640625, -3.123565673828125, -2.99163818359375, -2.859710693359375, -2.727783203125, -2.595855712890625, -2.46392822265625, -2.332000732421875, -2.2000732421875, -2.068145751953125, -1.93621826171875, -1.804290771484375, -1.67236328125, -1.540435791015625, -1.40850830078125, -1.276580810546875, -1.1446533203125, -1.012725830078125, -0.88079833984375, -0.748870849609375, -0.616943359375, -0.485015869140625, -0.35308837890625, -0.221160888671875, -0.0892333984375, 0.042694091796875, 0.17462158203125, 0.306549072265625, 0.4384765625, 0.570404052734375, 0.70233154296875, 0.834259033203125, 0.9661865234375, 1.098114013671875, 1.23004150390625, 1.361968994140625, 1.493896484375, 1.625823974609375, 1.75775146484375, 1.889678955078125, 2.0216064453125, 2.153533935546875, 2.28546142578125, 2.417388916015625, 2.54931640625, 2.681243896484375, 2.81317138671875, 2.945098876953125, 3.0770263671875, 3.208953857421875, 3.34088134765625, 3.472808837890625, 3.604736328125, 3.736663818359375, 3.86859130859375, 4.000518798828125, 4.1324462890625, 4.264373779296875, 4.39630126953125, 4.528228759765625, 4.66015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 10.0, 13.0, 15.0, 21.0, 24.0, 33.0, 24.0, 29.0, 38.0, 31.0, 41.0, 58.0, 95.0, 149.0, 204.0, 1336.0, 238.0, 145.0, 86.0, 57.0, 51.0, 48.0, 44.0, 29.0, 27.0, 17.0, 26.0, 19.0, 16.0, 12.0, 11.0, 9.0, 11.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-11.09375, -10.7418212890625, -10.389892578125, -10.0379638671875, -9.68603515625, -9.3341064453125, -8.982177734375, -8.6302490234375, -8.2783203125, -7.9263916015625, -7.574462890625, -7.2225341796875, -6.87060546875, -6.5186767578125, -6.166748046875, -5.8148193359375, -5.462890625, -5.1109619140625, -4.759033203125, -4.4071044921875, -4.05517578125, -3.7032470703125, -3.351318359375, -2.9993896484375, -2.6474609375, -2.2955322265625, -1.943603515625, -1.5916748046875, -1.23974609375, -0.8878173828125, -0.535888671875, -0.1839599609375, 0.16796875, 0.5198974609375, 0.871826171875, 1.2237548828125, 1.57568359375, 1.9276123046875, 2.279541015625, 2.6314697265625, 2.9833984375, 3.3353271484375, 3.687255859375, 4.0391845703125, 4.39111328125, 4.7430419921875, 5.094970703125, 5.4468994140625, 5.798828125, 6.1507568359375, 6.502685546875, 6.8546142578125, 7.20654296875, 7.5584716796875, 7.910400390625, 8.2623291015625, 8.6142578125, 8.9661865234375, 9.318115234375, 9.6700439453125, 10.02197265625, 10.3739013671875, 10.725830078125, 11.0777587890625, 11.4296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 14.0, 9.0, 8.0, 13.0, 12.0, 21.0, 21.0, 28.0, 33.0, 42.0, 55.0, 80.0, 91.0, 125.0, 190.0, 271.0, 451.0, 1243.0, 7761.0, 201814.0, 2834826.0, 91228.0, 5040.0, 1008.0, 387.0, 240.0, 154.0, 110.0, 94.0, 73.0, 65.0, 40.0, 28.0, 23.0, 22.0, 17.0, 9.0, 11.0, 8.0, 4.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.052490234375, -19.37060546875, -18.688720703125, -18.0068359375, -17.324951171875, -16.64306640625, -15.961181640625, -15.279296875, -14.597412109375, -13.91552734375, -13.233642578125, -12.5517578125, -11.869873046875, -11.18798828125, -10.506103515625, -9.82421875, -9.142333984375, -8.46044921875, -7.778564453125, -7.0966796875, -6.414794921875, -5.73291015625, -5.051025390625, -4.369140625, -3.687255859375, -3.00537109375, -2.323486328125, -1.6416015625, -0.959716796875, -0.27783203125, 0.404052734375, 1.0859375, 1.767822265625, 2.44970703125, 3.131591796875, 3.8134765625, 4.495361328125, 5.17724609375, 5.859130859375, 6.541015625, 7.222900390625, 7.90478515625, 8.586669921875, 9.2685546875, 9.950439453125, 10.63232421875, 11.314208984375, 11.99609375, 12.677978515625, 13.35986328125, 14.041748046875, 14.7236328125, 15.405517578125, 16.08740234375, 16.769287109375, 17.451171875, 18.133056640625, 18.81494140625, 19.496826171875, 20.1787109375, 20.860595703125, 21.54248046875, 22.224365234375, 22.90625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 11.0, 30.0, 57.0, 87.0, 110.0, 161.0, 175.0, 148.0, 104.0, 63.0, 36.0, 17.0, 8.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.17344665527344, -44.10606002807617, -43.03866958618164, -41.971282958984375, -40.903892517089844, -39.83650588989258, -38.76911926269531, -37.70172882080078, -36.634342193603516, -35.56695556640625, -34.49956512451172, -33.43217849731445, -32.36479187011719, -31.297401428222656, -30.23001480102539, -29.162626266479492, -28.095237731933594, -27.027849197387695, -25.960460662841797, -24.89307403564453, -23.825685501098633, -22.758296966552734, -21.69091033935547, -20.62352180480957, -19.556133270263672, -18.488744735717773, -17.421356201171875, -16.35396957397461, -15.286581039428711, -14.219192504882812, -13.15180492401123, -12.084417343139648, -11.017026901245117, -9.949638366699219, -8.882250785827637, -7.8148627281188965, -6.747474670410156, -5.680086612701416, -4.612698554992676, -3.5453104972839355, -2.4779224395751953, -1.410534381866455, -0.34314632415771484, 0.7242417335510254, 1.7916297912597656, 2.859017848968506, 3.926405906677246, 4.993793964385986, 6.061182022094727, 7.128570079803467, 8.195958137512207, 9.263345718383789, 10.330734252929688, 11.398122787475586, 12.465510368347168, 13.53289794921875, 14.600286483764648, 15.667675018310547, 16.735061645507812, 17.80245018005371, 18.86983871459961, 19.937227249145508, 21.004615783691406, 22.072002410888672, 23.13939094543457]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 14.0, 12.0, 15.0, 18.0, 13.0, 16.0, 16.0, 18.0, 22.0, 26.0, 32.0, 29.0, 23.0, 26.0, 35.0, 32.0, 28.0, 37.0, 42.0, 38.0, 39.0, 23.0, 32.0, 33.0, 31.0, 23.0, 36.0, 26.0, 19.0, 25.0, 19.0, 24.0, 18.0, 21.0, 17.0, 21.0, 18.0, 6.0, 14.0, 6.0, 6.0, 6.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-23.690298080444336, -22.9163818359375, -22.14246368408203, -21.368547439575195, -20.59463119506836, -19.82071304321289, -19.046796798706055, -18.27288055419922, -17.49896240234375, -16.725046157836914, -15.951128005981445, -15.17721176147461, -14.403294563293457, -13.629377365112305, -12.855461120605469, -12.081543922424316, -11.307626724243164, -10.533709526062012, -9.75979232788086, -8.985876083374023, -8.211958885192871, -7.438041687011719, -6.664124965667725, -5.8902082443237305, -5.116291046142578, -4.342373847961426, -3.5684571266174316, -2.7945401668548584, -2.020623207092285, -1.246706247329712, -0.47278928756713867, 0.30112743377685547, 1.0750465393066406, 1.8489634990692139, 2.622880458831787, 3.3967974185943604, 4.170714378356934, 4.944631576538086, 5.71854829788208, 6.492465019226074, 7.266382217407227, 8.040299415588379, 8.814216613769531, 9.588132858276367, 10.36205005645752, 11.135967254638672, 11.909883499145508, 12.68380069732666, 13.457717895507812, 14.231635093688965, 15.005552291870117, 15.779468536376953, 16.553386688232422, 17.327302932739258, 18.101219177246094, 18.875137329101562, 19.6490535736084, 20.422969818115234, 21.196887969970703, 21.97080421447754, 22.744720458984375, 23.518638610839844, 24.29255485534668, 25.066471099853516, 25.840389251708984]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 8.0, 8.0, 11.0, 13.0, 15.0, 19.0, 16.0, 18.0, 28.0, 32.0, 34.0, 45.0, 45.0, 39.0, 39.0, 37.0, 44.0, 49.0, 37.0, 38.0, 52.0, 42.0, 44.0, 44.0, 23.0, 30.0, 20.0, 19.0, 20.0, 16.0, 19.0, 21.0, 15.0, 11.0, 9.0, 5.0, 6.0, 8.0, 2.0, 1.0, 1.0, 3.0, 3.0], "bins": [-4.19140625, -4.082305908203125, -3.97320556640625, -3.864105224609375, -3.7550048828125, -3.645904541015625, -3.53680419921875, -3.427703857421875, -3.318603515625, -3.209503173828125, -3.10040283203125, -2.991302490234375, -2.8822021484375, -2.773101806640625, -2.66400146484375, -2.554901123046875, -2.44580078125, -2.336700439453125, -2.22760009765625, -2.118499755859375, -2.0093994140625, -1.900299072265625, -1.79119873046875, -1.682098388671875, -1.572998046875, -1.463897705078125, -1.35479736328125, -1.245697021484375, -1.1365966796875, -1.027496337890625, -0.91839599609375, -0.809295654296875, -0.7001953125, -0.591094970703125, -0.48199462890625, -0.372894287109375, -0.2637939453125, -0.154693603515625, -0.04559326171875, 0.063507080078125, 0.172607421875, 0.281707763671875, 0.39080810546875, 0.499908447265625, 0.6090087890625, 0.718109130859375, 0.82720947265625, 0.936309814453125, 1.04541015625, 1.154510498046875, 1.26361083984375, 1.372711181640625, 1.4818115234375, 1.590911865234375, 1.70001220703125, 1.809112548828125, 1.918212890625, 2.027313232421875, 2.13641357421875, 2.245513916015625, 2.3546142578125, 2.463714599609375, 2.57281494140625, 2.681915283203125, 2.791015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 13.0, 20.0, 20.0, 18.0, 34.0, 45.0, 79.0, 106.0, 171.0, 271.0, 454.0, 794.0, 1400.0, 2947.0, 7059.0, 25876.0, 278548.0, 2649317.0, 1128473.0, 77703.0, 12585.0, 4236.0, 1845.0, 909.0, 494.0, 288.0, 164.0, 117.0, 81.0, 41.0, 33.0, 23.0, 20.0, 22.0, 12.0, 10.0, 12.0, 12.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0], "bins": [-12.1484375, -11.82666015625, -11.5048828125, -11.18310546875, -10.861328125, -10.53955078125, -10.2177734375, -9.89599609375, -9.57421875, -9.25244140625, -8.9306640625, -8.60888671875, -8.287109375, -7.96533203125, -7.6435546875, -7.32177734375, -7.0, -6.67822265625, -6.3564453125, -6.03466796875, -5.712890625, -5.39111328125, -5.0693359375, -4.74755859375, -4.42578125, -4.10400390625, -3.7822265625, -3.46044921875, -3.138671875, -2.81689453125, -2.4951171875, -2.17333984375, -1.8515625, -1.52978515625, -1.2080078125, -0.88623046875, -0.564453125, -0.24267578125, 0.0791015625, 0.40087890625, 0.72265625, 1.04443359375, 1.3662109375, 1.68798828125, 2.009765625, 2.33154296875, 2.6533203125, 2.97509765625, 3.296875, 3.61865234375, 3.9404296875, 4.26220703125, 4.583984375, 4.90576171875, 5.2275390625, 5.54931640625, 5.87109375, 6.19287109375, 6.5146484375, 6.83642578125, 7.158203125, 7.47998046875, 7.8017578125, 8.12353515625, 8.4453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 11.0, 20.0, 21.0, 27.0, 47.0, 66.0, 84.0, 134.0, 176.0, 290.0, 366.0, 509.0, 524.0, 505.0, 381.0, 263.0, 204.0, 152.0, 80.0, 69.0, 27.0, 31.0, 19.0, 22.0, 17.0, 6.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.41778564453125, -6.1441650390625, -5.87054443359375, -5.596923828125, -5.32330322265625, -5.0496826171875, -4.77606201171875, -4.50244140625, -4.22882080078125, -3.9552001953125, -3.68157958984375, -3.407958984375, -3.13433837890625, -2.8607177734375, -2.58709716796875, -2.3134765625, -2.03985595703125, -1.7662353515625, -1.49261474609375, -1.218994140625, -0.94537353515625, -0.6717529296875, -0.39813232421875, -0.12451171875, 0.14910888671875, 0.4227294921875, 0.69635009765625, 0.969970703125, 1.24359130859375, 1.5172119140625, 1.79083251953125, 2.064453125, 2.33807373046875, 2.6116943359375, 2.88531494140625, 3.158935546875, 3.43255615234375, 3.7061767578125, 3.97979736328125, 4.25341796875, 4.52703857421875, 4.8006591796875, 5.07427978515625, 5.347900390625, 5.62152099609375, 5.8951416015625, 6.16876220703125, 6.4423828125, 6.71600341796875, 6.9896240234375, 7.26324462890625, 7.536865234375, 7.81048583984375, 8.0841064453125, 8.35772705078125, 8.63134765625, 8.90496826171875, 9.1785888671875, 9.45220947265625, 9.725830078125, 9.99945068359375, 10.2730712890625, 10.54669189453125, 10.8203125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 9.0, 10.0, 15.0, 26.0, 30.0, 41.0, 53.0, 65.0, 153.0, 268.0, 527.0, 1273.0, 3658.0, 14953.0, 124943.0, 2331400.0, 1617420.0, 82764.0, 11588.0, 2981.0, 1025.0, 457.0, 244.0, 131.0, 92.0, 56.0, 30.0, 30.0, 16.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-19.96875, -19.4556884765625, -18.942626953125, -18.4295654296875, -17.91650390625, -17.4034423828125, -16.890380859375, -16.3773193359375, -15.8642578125, -15.3511962890625, -14.838134765625, -14.3250732421875, -13.81201171875, -13.2989501953125, -12.785888671875, -12.2728271484375, -11.759765625, -11.2467041015625, -10.733642578125, -10.2205810546875, -9.70751953125, -9.1944580078125, -8.681396484375, -8.1683349609375, -7.6552734375, -7.1422119140625, -6.629150390625, -6.1160888671875, -5.60302734375, -5.0899658203125, -4.576904296875, -4.0638427734375, -3.55078125, -3.0377197265625, -2.524658203125, -2.0115966796875, -1.49853515625, -0.9854736328125, -0.472412109375, 0.0406494140625, 0.5537109375, 1.0667724609375, 1.579833984375, 2.0928955078125, 2.60595703125, 3.1190185546875, 3.632080078125, 4.1451416015625, 4.658203125, 5.1712646484375, 5.684326171875, 6.1973876953125, 6.71044921875, 7.2235107421875, 7.736572265625, 8.2496337890625, 8.7626953125, 9.2757568359375, 9.788818359375, 10.3018798828125, 10.81494140625, 11.3280029296875, 11.841064453125, 12.3541259765625, 12.8671875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 23.0, 43.0, 103.0, 164.0, 235.0, 203.0, 129.0, 75.0, 22.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.8657283782959, -27.48964500427246, -25.113563537597656, -22.73748016357422, -20.36139678955078, -17.985315322875977, -15.609231948852539, -13.233150482177734, -10.857067108154297, -8.480984687805176, -6.1049017906188965, -3.728818893432617, -1.352736473083496, 1.023345947265625, 3.3994293212890625, 5.775510787963867, 8.151594161987305, 10.527676582336426, 12.903759002685547, 15.279842376708984, 17.655925750732422, 20.032007217407227, 22.408090591430664, 24.78417205810547, 27.160255432128906, 29.536338806152344, 31.91242027282715, 34.28850555419922, 36.66458511352539, 39.04066848754883, 41.416751861572266, 43.79283142089844, 46.168914794921875, 48.54499816894531, 50.92108154296875, 53.29716491699219, 55.67324447631836, 58.0493278503418, 60.425411224365234, 62.801490783691406, 65.17757415771484, 67.55365753173828, 69.92974090576172, 72.30582427978516, 74.6819076538086, 77.0579833984375, 79.43406677246094, 81.81015014648438, 84.18623352050781, 86.56231689453125, 88.93840026855469, 91.31448364257812, 93.69056701660156, 96.066650390625, 98.44273376464844, 100.81880950927734, 103.19490051269531, 105.57098388671875, 107.94706726074219, 110.32315063476562, 112.69923400878906, 115.0753173828125, 117.45140075683594, 119.82747650146484, 122.20355987548828]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 3.0, 6.0, 7.0, 8.0, 13.0, 17.0, 22.0, 21.0, 15.0, 24.0, 22.0, 31.0, 40.0, 33.0, 36.0, 51.0, 40.0, 27.0, 54.0, 40.0, 57.0, 47.0, 49.0, 40.0, 47.0, 36.0, 19.0, 21.0, 28.0, 28.0, 17.0, 13.0, 17.0, 14.0, 11.0, 9.0, 5.0, 2.0, 11.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.605205535888672, -19.82792854309082, -19.0506534576416, -18.27337646484375, -17.49610137939453, -16.71882438659668, -15.941549301147461, -15.16427230834961, -14.38699722290039, -13.609721183776855, -12.83244514465332, -12.055169105529785, -11.27789306640625, -10.500617027282715, -9.72334098815918, -8.946063995361328, -8.168787956237793, -7.391511917114258, -6.614235877990723, -5.8369598388671875, -5.059683799743652, -4.282407760620117, -3.505131244659424, -2.7278552055358887, -1.9505791664123535, -1.1733031272888184, -0.39602696895599365, 0.38124918937683105, 1.1585252285003662, 1.9358012676239014, 2.7130775451660156, 3.490353584289551, 4.267629623413086, 5.044905662536621, 5.822181701660156, 6.599457740783691, 7.376733779907227, 8.154009819030762, 8.931285858154297, 9.708562850952148, 10.485837936401367, 11.263113975524902, 12.040390014648438, 12.817666053771973, 13.594942092895508, 14.372218132019043, 15.149494171142578, 15.92677116394043, 16.70404815673828, 17.481325149536133, 18.25860023498535, 19.035877227783203, 19.813152313232422, 20.590429306030273, 21.367704391479492, 22.144981384277344, 22.922256469726562, 23.699533462524414, 24.476808547973633, 25.254085540771484, 26.031360626220703, 26.808637619018555, 27.585912704467773, 28.363189697265625, 29.140464782714844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 14.0, 8.0, 16.0, 13.0, 24.0, 23.0, 25.0, 33.0, 42.0, 51.0, 48.0, 37.0, 47.0, 61.0, 55.0, 60.0, 51.0, 49.0, 42.0, 39.0, 30.0, 39.0, 27.0, 27.0, 24.0, 16.0, 11.0, 20.0, 13.0, 12.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2421875, -4.116424560546875, -3.99066162109375, -3.864898681640625, -3.7391357421875, -3.613372802734375, -3.48760986328125, -3.361846923828125, -3.236083984375, -3.110321044921875, -2.98455810546875, -2.858795166015625, -2.7330322265625, -2.607269287109375, -2.48150634765625, -2.355743408203125, -2.22998046875, -2.104217529296875, -1.97845458984375, -1.852691650390625, -1.7269287109375, -1.601165771484375, -1.47540283203125, -1.349639892578125, -1.223876953125, -1.098114013671875, -0.97235107421875, -0.846588134765625, -0.7208251953125, -0.595062255859375, -0.46929931640625, -0.343536376953125, -0.2177734375, -0.092010498046875, 0.03375244140625, 0.159515380859375, 0.2852783203125, 0.411041259765625, 0.53680419921875, 0.662567138671875, 0.788330078125, 0.914093017578125, 1.03985595703125, 1.165618896484375, 1.2913818359375, 1.417144775390625, 1.54290771484375, 1.668670654296875, 1.79443359375, 1.920196533203125, 2.04595947265625, 2.171722412109375, 2.2974853515625, 2.423248291015625, 2.54901123046875, 2.674774169921875, 2.800537109375, 2.926300048828125, 3.05206298828125, 3.177825927734375, 3.3035888671875, 3.429351806640625, 3.55511474609375, 3.680877685546875, 3.806640625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 15.0, 10.0, 20.0, 16.0, 27.0, 41.0, 60.0, 98.0, 122.0, 159.0, 232.0, 327.0, 453.0, 648.0, 1032.0, 1626.0, 3041.0, 6595.0, 16911.0, 50659.0, 158342.0, 358238.0, 288324.0, 104681.0, 33617.0, 11847.0, 4915.0, 2409.0, 1361.0, 813.0, 530.0, 364.0, 274.0, 210.0, 147.0, 122.0, 82.0, 56.0, 37.0, 28.0, 26.0, 15.0, 12.0, 8.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.14544677734375, -1.1082763671875, -1.07110595703125, -1.033935546875, -0.99676513671875, -0.9595947265625, -0.92242431640625, -0.88525390625, -0.84808349609375, -0.8109130859375, -0.77374267578125, -0.736572265625, -0.69940185546875, -0.6622314453125, -0.62506103515625, -0.587890625, -0.55072021484375, -0.5135498046875, -0.47637939453125, -0.439208984375, -0.40203857421875, -0.3648681640625, -0.32769775390625, -0.29052734375, -0.25335693359375, -0.2161865234375, -0.17901611328125, -0.141845703125, -0.10467529296875, -0.0675048828125, -0.03033447265625, 0.0068359375, 0.04400634765625, 0.0811767578125, 0.11834716796875, 0.155517578125, 0.19268798828125, 0.2298583984375, 0.26702880859375, 0.30419921875, 0.34136962890625, 0.3785400390625, 0.41571044921875, 0.452880859375, 0.49005126953125, 0.5272216796875, 0.56439208984375, 0.6015625, 0.63873291015625, 0.6759033203125, 0.71307373046875, 0.750244140625, 0.78741455078125, 0.8245849609375, 0.86175537109375, 0.89892578125, 0.93609619140625, 0.9732666015625, 1.01043701171875, 1.047607421875, 1.08477783203125, 1.1219482421875, 1.15911865234375, 1.1962890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 11.0, 8.0, 12.0, 14.0, 11.0, 16.0, 15.0, 19.0, 28.0, 36.0, 33.0, 31.0, 30.0, 42.0, 40.0, 41.0, 38.0, 41.0, 1069.0, 42.0, 47.0, 35.0, 49.0, 34.0, 35.0, 29.0, 30.0, 27.0, 25.0, 34.0, 18.0, 15.0, 16.0, 7.0, 10.0, 11.0, 6.0, 9.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.234375, -3.140625, -3.046875, -2.953125, -2.859375, -2.765625, -2.671875, -2.578125, -2.484375, -2.390625, -2.296875, -2.203125, -2.109375, -2.015625, -1.921875, -1.828125, -1.734375, -1.640625, -1.546875, -1.453125, -1.359375, -1.265625, -1.171875, -1.078125, -0.984375, -0.890625, -0.796875, -0.703125, -0.609375, -0.515625, -0.421875, -0.328125, -0.234375, -0.140625, -0.046875, 0.046875, 0.140625, 0.234375, 0.328125, 0.421875, 0.515625, 0.609375, 0.703125, 0.796875, 0.890625, 0.984375, 1.078125, 1.171875, 1.265625, 1.359375, 1.453125, 1.546875, 1.640625, 1.734375, 1.828125, 1.921875, 2.015625, 2.109375, 2.203125, 2.296875, 2.390625, 2.484375, 2.578125, 2.671875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 5.0, 6.0, 11.0, 4.0, 12.0, 33.0, 31.0, 65.0, 137.0, 278.0, 517.0, 1060.0, 2518.0, 6925.0, 25034.0, 171775.0, 1676847.0, 174592.0, 25406.0, 6995.0, 2586.0, 1135.0, 517.0, 301.0, 150.0, 68.0, 52.0, 28.0, 18.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.79248046875, -0.7614059448242188, -0.7303314208984375, -0.6992568969726562, -0.668182373046875, -0.6371078491210938, -0.6060333251953125, -0.5749588012695312, -0.54388427734375, -0.5128097534179688, -0.4817352294921875, -0.45066070556640625, -0.419586181640625, -0.38851165771484375, -0.3574371337890625, -0.32636260986328125, -0.2952880859375, -0.26421356201171875, -0.2331390380859375, -0.20206451416015625, -0.170989990234375, -0.13991546630859375, -0.1088409423828125, -0.07776641845703125, -0.04669189453125, -0.01561737060546875, 0.0154571533203125, 0.04653167724609375, 0.077606201171875, 0.10868072509765625, 0.1397552490234375, 0.17082977294921875, 0.201904296875, 0.23297882080078125, 0.2640533447265625, 0.29512786865234375, 0.326202392578125, 0.35727691650390625, 0.3883514404296875, 0.41942596435546875, 0.45050048828125, 0.48157501220703125, 0.5126495361328125, 0.5437240600585938, 0.574798583984375, 0.6058731079101562, 0.6369476318359375, 0.6680221557617188, 0.6990966796875, 0.7301712036132812, 0.7612457275390625, 0.7923202514648438, 0.823394775390625, 0.8544692993164062, 0.8855438232421875, 0.9166183471679688, 0.94769287109375, 0.9787673950195312, 1.0098419189453125, 1.0409164428710938, 1.071990966796875, 1.1030654907226562, 1.1341400146484375, 1.1652145385742188, 1.1962890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 1.0, 6.0, 5.0, 4.0, 9.0, 12.0, 25.0, 29.0, 42.0, 53.0, 60.0, 97.0, 137.0, 124.0, 92.0, 70.0, 57.0, 47.0, 22.0, 19.0, 17.0, 7.0, 7.0, 3.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.12427902221679688, -0.12038421630859375, -0.11648941040039062, -0.1125946044921875, -0.10869979858398438, -0.10480499267578125, -0.10091018676757812, -0.097015380859375, -0.09312057495117188, -0.08922576904296875, -0.08533096313476562, -0.0814361572265625, -0.07754135131835938, -0.07364654541015625, -0.06975173950195312, -0.06585693359375, -0.061962127685546875, -0.05806732177734375, -0.054172515869140625, -0.0502777099609375, -0.046382904052734375, -0.04248809814453125, -0.038593292236328125, -0.034698486328125, -0.030803680419921875, -0.02690887451171875, -0.023014068603515625, -0.0191192626953125, -0.015224456787109375, -0.01132965087890625, -0.007434844970703125, -0.0035400390625, 0.000354766845703125, 0.00424957275390625, 0.008144378662109375, 0.0120391845703125, 0.015933990478515625, 0.01982879638671875, 0.023723602294921875, 0.027618408203125, 0.031513214111328125, 0.03540802001953125, 0.039302825927734375, 0.0431976318359375, 0.047092437744140625, 0.05098724365234375, 0.054882049560546875, 0.05877685546875, 0.06267166137695312, 0.06656646728515625, 0.07046127319335938, 0.0743560791015625, 0.07825088500976562, 0.08214569091796875, 0.08604049682617188, 0.089935302734375, 0.09383010864257812, 0.09772491455078125, 0.10161972045898438, 0.1055145263671875, 0.10940933227539062, 0.11330413818359375, 0.11719894409179688, 0.12109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 12.0, 3.0, 6.0, 15.0, 18.0, 28.0, 36.0, 58.0, 94.0, 135.0, 266.0, 1611.0, 148416.0, 894000.0, 3020.0, 359.0, 165.0, 94.0, 58.0, 45.0, 21.0, 18.0, 12.0, 6.0, 9.0, 6.0, 3.0, 3.0, 7.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.3984375, -2.321319580078125, -2.24420166015625, -2.167083740234375, -2.0899658203125, -2.012847900390625, -1.93572998046875, -1.858612060546875, -1.781494140625, -1.704376220703125, -1.62725830078125, -1.550140380859375, -1.4730224609375, -1.395904541015625, -1.31878662109375, -1.241668701171875, -1.16455078125, -1.087432861328125, -1.01031494140625, -0.933197021484375, -0.8560791015625, -0.778961181640625, -0.70184326171875, -0.624725341796875, -0.547607421875, -0.470489501953125, -0.39337158203125, -0.316253662109375, -0.2391357421875, -0.162017822265625, -0.08489990234375, -0.007781982421875, 0.0693359375, 0.146453857421875, 0.22357177734375, 0.300689697265625, 0.3778076171875, 0.454925537109375, 0.53204345703125, 0.609161376953125, 0.686279296875, 0.763397216796875, 0.84051513671875, 0.917633056640625, 0.9947509765625, 1.071868896484375, 1.14898681640625, 1.226104736328125, 1.30322265625, 1.380340576171875, 1.45745849609375, 1.534576416015625, 1.6116943359375, 1.688812255859375, 1.76593017578125, 1.843048095703125, 1.920166015625, 1.997283935546875, 2.07440185546875, 2.151519775390625, 2.2286376953125, 2.305755615234375, 2.38287353515625, 2.459991455078125, 2.537109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 24.0, 114.0, 392.0, 324.0, 111.0, 28.0, 11.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4904543161392212, -1.4628010988235474, -1.435148000717163, -1.4074947834014893, -1.3798415660858154, -1.3521884679794312, -1.3245352506637573, -1.2968820333480835, -1.2692289352416992, -1.2415757179260254, -1.2139226198196411, -1.1862694025039673, -1.1586161851882935, -1.1309630870819092, -1.1033098697662354, -1.0756566524505615, -1.0480034351348877, -1.0203502178192139, -0.9926970601081848, -0.9650439023971558, -0.9373907446861267, -0.9097375869750977, -0.8820843696594238, -0.8544312119483948, -0.8267780542373657, -0.7991248965263367, -0.7714716792106628, -0.7438185214996338, -0.7161653637886047, -0.6885122060775757, -0.6608589887619019, -0.6332058310508728, -0.6055526733398438, -0.5778995156288147, -0.5502462983131409, -0.5225931406021118, -0.49493998289108276, -0.4672867953777313, -0.4396336078643799, -0.41198045015335083, -0.3843272924423218, -0.35667410492897034, -0.3290209472179413, -0.30136775970458984, -0.2737146019935608, -0.24606141448020935, -0.2184082269668579, -0.19075505435466766, -0.16310188174247742, -0.13544870913028717, -0.10779552906751633, -0.08014234900474548, -0.05248917639255524, -0.02483600378036499, 0.00281718373298645, 0.030470356345176697, 0.05812352895736694, 0.08577670156955719, 0.11342988163232803, 0.14108306169509888, 0.16873623430728912, 0.19638940691947937, 0.2240425944328308, 0.25169575214385986, 0.2793489396572113]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 6.0, 12.0, 6.0, 13.0, 25.0, 16.0, 29.0, 27.0, 29.0, 23.0, 32.0, 42.0, 39.0, 28.0, 39.0, 32.0, 38.0, 35.0, 38.0, 46.0, 42.0, 34.0, 46.0, 32.0, 29.0, 33.0, 43.0, 30.0, 16.0, 19.0, 17.0, 20.0, 9.0, 10.0, 9.0, 10.0, 7.0, 5.0, 9.0, 1.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1520177721977234, -0.1472860872745514, -0.1425543874502182, -0.1378227025270462, -0.1330910176038742, -0.12835931777954102, -0.12362763285636902, -0.11889594793319702, -0.11416425555944443, -0.10943256318569183, -0.10470087826251984, -0.09996918588876724, -0.09523749351501465, -0.09050580859184265, -0.08577411621809006, -0.08104242384433746, -0.07631073892116547, -0.07157904654741287, -0.06684736162424088, -0.06211566925048828, -0.057383980602025986, -0.05265229195356369, -0.047920599579811096, -0.0431889109313488, -0.038457222282886505, -0.03372553363442421, -0.028993843123316765, -0.02426215261220932, -0.019530463963747025, -0.014798775315284729, -0.010067084804177284, -0.0053353942930698395, -0.0006037056446075439, 0.004127983935177326, 0.008859673514962196, 0.013591363094747066, 0.018323052674531937, 0.023054741322994232, 0.027786431834101677, 0.03251812234520912, 0.03724981099367142, 0.04198149964213371, 0.04671318829059601, 0.0514448806643486, 0.0561765693128109, 0.06090825796127319, 0.06563995033502579, 0.07037164270877838, 0.07510332763195038, 0.07983502000570297, 0.08456670492887497, 0.08929839730262756, 0.09403008222579956, 0.09876177459955215, 0.10349346697330475, 0.10822515189647675, 0.11295684427022934, 0.11768853664398193, 0.12242022156715393, 0.12715190649032593, 0.13188360631465912, 0.13661529123783112, 0.1413469761610031, 0.1460786759853363, 0.1508103609085083]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 15.0, 14.0, 12.0, 31.0, 30.0, 28.0, 28.0, 37.0, 32.0, 60.0, 38.0, 28.0, 46.0, 50.0, 47.0, 54.0, 47.0, 53.0, 35.0, 35.0, 23.0, 31.0, 17.0, 25.0, 35.0, 23.0, 15.0, 17.0, 11.0, 7.0, 6.0, 10.0, 5.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.2109375, -3.101593017578125, -2.99224853515625, -2.882904052734375, -2.7735595703125, -2.664215087890625, -2.55487060546875, -2.445526123046875, -2.336181640625, -2.226837158203125, -2.11749267578125, -2.008148193359375, -1.8988037109375, -1.789459228515625, -1.68011474609375, -1.570770263671875, -1.46142578125, -1.352081298828125, -1.24273681640625, -1.133392333984375, -1.0240478515625, -0.914703369140625, -0.80535888671875, -0.696014404296875, -0.586669921875, -0.477325439453125, -0.36798095703125, -0.258636474609375, -0.1492919921875, -0.039947509765625, 0.06939697265625, 0.178741455078125, 0.2880859375, 0.397430419921875, 0.50677490234375, 0.616119384765625, 0.7254638671875, 0.834808349609375, 0.94415283203125, 1.053497314453125, 1.162841796875, 1.272186279296875, 1.38153076171875, 1.490875244140625, 1.6002197265625, 1.709564208984375, 1.81890869140625, 1.928253173828125, 2.03759765625, 2.146942138671875, 2.25628662109375, 2.365631103515625, 2.4749755859375, 2.584320068359375, 2.69366455078125, 2.803009033203125, 2.912353515625, 3.021697998046875, 3.13104248046875, 3.240386962890625, 3.3497314453125, 3.459075927734375, 3.56842041015625, 3.677764892578125, 3.787109375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 13.0, 15.0, 15.0, 17.0, 34.0, 58.0, 86.0, 127.0, 175.0, 273.0, 457.0, 777.0, 1267.0, 2327.0, 4148.0, 7508.0, 14440.0, 27460.0, 55501.0, 112638.0, 235390.0, 289600.0, 148280.0, 72618.0, 35576.0, 18318.0, 9496.0, 5084.0, 2873.0, 1505.0, 932.0, 567.0, 327.0, 210.0, 159.0, 91.0, 58.0, 35.0, 24.0, 22.0, 15.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.34765625, -3.24365234375, -3.1396484375, -3.03564453125, -2.931640625, -2.82763671875, -2.7236328125, -2.61962890625, -2.515625, -2.41162109375, -2.3076171875, -2.20361328125, -2.099609375, -1.99560546875, -1.8916015625, -1.78759765625, -1.68359375, -1.57958984375, -1.4755859375, -1.37158203125, -1.267578125, -1.16357421875, -1.0595703125, -0.95556640625, -0.8515625, -0.74755859375, -0.6435546875, -0.53955078125, -0.435546875, -0.33154296875, -0.2275390625, -0.12353515625, -0.01953125, 0.08447265625, 0.1884765625, 0.29248046875, 0.396484375, 0.50048828125, 0.6044921875, 0.70849609375, 0.8125, 0.91650390625, 1.0205078125, 1.12451171875, 1.228515625, 1.33251953125, 1.4365234375, 1.54052734375, 1.64453125, 1.74853515625, 1.8525390625, 1.95654296875, 2.060546875, 2.16455078125, 2.2685546875, 2.37255859375, 2.4765625, 2.58056640625, 2.6845703125, 2.78857421875, 2.892578125, 2.99658203125, 3.1005859375, 3.20458984375, 3.30859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 15.0, 12.0, 12.0, 29.0, 31.0, 30.0, 19.0, 32.0, 35.0, 45.0, 58.0, 71.0, 139.0, 213.0, 1481.0, 257.0, 115.0, 74.0, 70.0, 41.0, 46.0, 39.0, 28.0, 35.0, 24.0, 15.0, 15.0, 12.0, 8.0, 6.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1119384765625, -10.692626953125, -10.2733154296875, -9.85400390625, -9.4346923828125, -9.015380859375, -8.5960693359375, -8.1767578125, -7.7574462890625, -7.338134765625, -6.9188232421875, -6.49951171875, -6.0802001953125, -5.660888671875, -5.2415771484375, -4.822265625, -4.4029541015625, -3.983642578125, -3.5643310546875, -3.14501953125, -2.7257080078125, -2.306396484375, -1.8870849609375, -1.4677734375, -1.0484619140625, -0.629150390625, -0.2098388671875, 0.20947265625, 0.6287841796875, 1.048095703125, 1.4674072265625, 1.88671875, 2.3060302734375, 2.725341796875, 3.1446533203125, 3.56396484375, 3.9832763671875, 4.402587890625, 4.8218994140625, 5.2412109375, 5.6605224609375, 6.079833984375, 6.4991455078125, 6.91845703125, 7.3377685546875, 7.757080078125, 8.1763916015625, 8.595703125, 9.0150146484375, 9.434326171875, 9.8536376953125, 10.27294921875, 10.6922607421875, 11.111572265625, 11.5308837890625, 11.9501953125, 12.3695068359375, 12.788818359375, 13.2081298828125, 13.62744140625, 14.0467529296875, 14.466064453125, 14.8853759765625, 15.3046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 5.0, 13.0, 14.0, 15.0, 27.0, 24.0, 42.0, 41.0, 66.0, 95.0, 107.0, 176.0, 237.0, 464.0, 1153.0, 11050.0, 1754956.0, 1365300.0, 9499.0, 1069.0, 420.0, 239.0, 165.0, 103.0, 93.0, 57.0, 45.0, 47.0, 39.0, 26.0, 25.0, 18.0, 19.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0], "bins": [-27.96875, -27.21240234375, -26.4560546875, -25.69970703125, -24.943359375, -24.18701171875, -23.4306640625, -22.67431640625, -21.91796875, -21.16162109375, -20.4052734375, -19.64892578125, -18.892578125, -18.13623046875, -17.3798828125, -16.62353515625, -15.8671875, -15.11083984375, -14.3544921875, -13.59814453125, -12.841796875, -12.08544921875, -11.3291015625, -10.57275390625, -9.81640625, -9.06005859375, -8.3037109375, -7.54736328125, -6.791015625, -6.03466796875, -5.2783203125, -4.52197265625, -3.765625, -3.00927734375, -2.2529296875, -1.49658203125, -0.740234375, 0.01611328125, 0.7724609375, 1.52880859375, 2.28515625, 3.04150390625, 3.7978515625, 4.55419921875, 5.310546875, 6.06689453125, 6.8232421875, 7.57958984375, 8.3359375, 9.09228515625, 9.8486328125, 10.60498046875, 11.361328125, 12.11767578125, 12.8740234375, 13.63037109375, 14.38671875, 15.14306640625, 15.8994140625, 16.65576171875, 17.412109375, 18.16845703125, 18.9248046875, 19.68115234375, 20.4375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 462.0, 535.0, 16.0, 1.0, 0.0, 0.0, 1.0], "bins": [-306.1728515625, -300.89447021484375, -295.6161193847656, -290.3377380371094, -285.0593566894531, -279.781005859375, -274.50262451171875, -269.2242431640625, -263.94586181640625, -258.66748046875, -253.3891143798828, -248.11074829101562, -242.83236694335938, -237.5540008544922, -232.275634765625, -226.99725341796875, -221.71890258789062, -216.44053649902344, -211.1621551513672, -205.8837890625, -200.60540771484375, -195.32704162597656, -190.04867553710938, -184.77029418945312, -179.49191284179688, -174.2135467529297, -168.93516540527344, -163.65679931640625, -158.37841796875, -153.1000518798828, -147.82168579101562, -142.54330444335938, -137.2649383544922, -131.986572265625, -126.70819091796875, -121.42982482910156, -116.15145111083984, -110.87307739257812, -105.5947036743164, -100.31632995605469, -95.0379638671875, -89.75959014892578, -84.48121643066406, -79.20285034179688, -73.92447662353516, -68.64610290527344, -63.36772918701172, -58.089359283447266, -52.81098556518555, -47.53261184692383, -42.254241943359375, -36.975868225097656, -31.69749641418457, -26.419124603271484, -21.140750885009766, -15.862380981445312, -10.584007263183594, -5.30563497543335, -0.02726268768310547, 5.251110076904297, 10.529481887817383, 15.807853698730469, 21.086227416992188, 26.36459732055664, 31.64297103881836]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 9.0, 20.0, 12.0, 14.0, 13.0, 18.0, 20.0, 28.0, 37.0, 30.0, 35.0, 33.0, 46.0, 36.0, 50.0, 36.0, 41.0, 49.0, 34.0, 50.0, 35.0, 43.0, 39.0, 32.0, 35.0, 28.0, 27.0, 27.0, 17.0, 12.0, 18.0, 11.0, 7.0, 6.0, 10.0, 7.0, 7.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.58615493774414, -33.50345993041992, -32.42076873779297, -31.33807373046875, -30.255380630493164, -29.172687530517578, -28.08999252319336, -27.007299423217773, -25.924606323242188, -24.8419132232666, -23.759220123291016, -22.676525115966797, -21.59383201599121, -20.511138916015625, -19.428443908691406, -18.34575080871582, -17.263057708740234, -16.18036460876465, -15.097670555114746, -14.014976501464844, -12.932283401489258, -11.849590301513672, -10.76689624786377, -9.684202194213867, -8.601509094238281, -7.518815517425537, -6.436121940612793, -5.353428363800049, -4.270734786987305, -3.1880412101745605, -2.1053476333618164, -1.0226540565490723, 0.0600433349609375, 1.1427369117736816, 2.225430488586426, 3.30812406539917, 4.390817642211914, 5.473511219024658, 6.556204795837402, 7.6388983726501465, 8.72159194946289, 9.804285049438477, 10.886979103088379, 11.969673156738281, 13.052366256713867, 14.135059356689453, 15.217753410339355, 16.300447463989258, 17.383140563964844, 18.46583366394043, 19.548526763916016, 20.631221771240234, 21.71391487121582, 22.796607971191406, 23.879302978515625, 24.96199607849121, 26.044689178466797, 27.127382278442383, 28.21007537841797, 29.292770385742188, 30.375463485717773, 31.45815658569336, 32.54085159301758, 33.62354278564453, 34.70623779296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 3.0, 6.0, 13.0, 18.0, 18.0, 15.0, 23.0, 19.0, 25.0, 22.0, 43.0, 35.0, 49.0, 34.0, 48.0, 54.0, 52.0, 46.0, 48.0, 42.0, 44.0, 50.0, 30.0, 37.0, 25.0, 31.0, 31.0, 23.0, 21.0, 12.0, 20.0, 15.0, 14.0, 7.0, 8.0, 8.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.930389404296875, -3.80609130859375, -3.681793212890625, -3.5574951171875, -3.433197021484375, -3.30889892578125, -3.184600830078125, -3.060302734375, -2.936004638671875, -2.81170654296875, -2.687408447265625, -2.5631103515625, -2.438812255859375, -2.31451416015625, -2.190216064453125, -2.06591796875, -1.941619873046875, -1.81732177734375, -1.693023681640625, -1.5687255859375, -1.444427490234375, -1.32012939453125, -1.195831298828125, -1.071533203125, -0.947235107421875, -0.82293701171875, -0.698638916015625, -0.5743408203125, -0.450042724609375, -0.32574462890625, -0.201446533203125, -0.0771484375, 0.047149658203125, 0.17144775390625, 0.295745849609375, 0.4200439453125, 0.544342041015625, 0.66864013671875, 0.792938232421875, 0.917236328125, 1.041534423828125, 1.16583251953125, 1.290130615234375, 1.4144287109375, 1.538726806640625, 1.66302490234375, 1.787322998046875, 1.91162109375, 2.035919189453125, 2.16021728515625, 2.284515380859375, 2.4088134765625, 2.533111572265625, 2.65740966796875, 2.781707763671875, 2.906005859375, 3.030303955078125, 3.15460205078125, 3.278900146484375, 3.4031982421875, 3.527496337890625, 3.65179443359375, 3.776092529296875, 3.900390625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 7.0, 2.0, 5.0, 19.0, 18.0, 26.0, 40.0, 64.0, 60.0, 95.0, 120.0, 168.0, 260.0, 424.0, 651.0, 1212.0, 2406.0, 6262.0, 24059.0, 214155.0, 2057688.0, 1700064.0, 157715.0, 19372.0, 4976.0, 1903.0, 950.0, 533.0, 333.0, 214.0, 140.0, 90.0, 69.0, 58.0, 39.0, 30.0, 18.0, 17.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4522705078125, -9.146728515625, -8.8411865234375, -8.53564453125, -8.2301025390625, -7.924560546875, -7.6190185546875, -7.3134765625, -7.0079345703125, -6.702392578125, -6.3968505859375, -6.09130859375, -5.7857666015625, -5.480224609375, -5.1746826171875, -4.869140625, -4.5635986328125, -4.258056640625, -3.9525146484375, -3.64697265625, -3.3414306640625, -3.035888671875, -2.7303466796875, -2.4248046875, -2.1192626953125, -1.813720703125, -1.5081787109375, -1.20263671875, -0.8970947265625, -0.591552734375, -0.2860107421875, 0.01953125, 0.3250732421875, 0.630615234375, 0.9361572265625, 1.24169921875, 1.5472412109375, 1.852783203125, 2.1583251953125, 2.4638671875, 2.7694091796875, 3.074951171875, 3.3804931640625, 3.68603515625, 3.9915771484375, 4.297119140625, 4.6026611328125, 4.908203125, 5.2137451171875, 5.519287109375, 5.8248291015625, 6.13037109375, 6.4359130859375, 6.741455078125, 7.0469970703125, 7.3525390625, 7.6580810546875, 7.963623046875, 8.2691650390625, 8.57470703125, 8.8802490234375, 9.185791015625, 9.4913330078125, 9.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 1.0, 6.0, 8.0, 8.0, 13.0, 18.0, 27.0, 46.0, 51.0, 56.0, 96.0, 107.0, 172.0, 223.0, 272.0, 365.0, 429.0, 390.0, 386.0, 337.0, 268.0, 192.0, 151.0, 108.0, 82.0, 61.0, 41.0, 34.0, 26.0, 22.0, 20.0, 13.0, 5.0, 5.0, 7.0, 2.0, 8.0, 2.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.2734375, -7.05560302734375, -6.8377685546875, -6.61993408203125, -6.402099609375, -6.18426513671875, -5.9664306640625, -5.74859619140625, -5.53076171875, -5.31292724609375, -5.0950927734375, -4.87725830078125, -4.659423828125, -4.44158935546875, -4.2237548828125, -4.00592041015625, -3.7880859375, -3.57025146484375, -3.3524169921875, -3.13458251953125, -2.916748046875, -2.69891357421875, -2.4810791015625, -2.26324462890625, -2.04541015625, -1.82757568359375, -1.6097412109375, -1.39190673828125, -1.174072265625, -0.95623779296875, -0.7384033203125, -0.52056884765625, -0.302734375, -0.08489990234375, 0.1329345703125, 0.35076904296875, 0.568603515625, 0.78643798828125, 1.0042724609375, 1.22210693359375, 1.43994140625, 1.65777587890625, 1.8756103515625, 2.09344482421875, 2.311279296875, 2.52911376953125, 2.7469482421875, 2.96478271484375, 3.1826171875, 3.40045166015625, 3.6182861328125, 3.83612060546875, 4.053955078125, 4.27178955078125, 4.4896240234375, 4.70745849609375, 4.92529296875, 5.14312744140625, 5.3609619140625, 5.57879638671875, 5.796630859375, 6.01446533203125, 6.2322998046875, 6.45013427734375, 6.66796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 14.0, 22.0, 23.0, 31.0, 43.0, 40.0, 67.0, 112.0, 171.0, 269.0, 513.0, 1453.0, 5289.0, 44109.0, 1575705.0, 2485933.0, 70370.0, 6938.0, 1690.0, 595.0, 303.0, 163.0, 107.0, 68.0, 54.0, 53.0, 30.0, 18.0, 16.0, 10.0, 11.0, 5.0, 3.0, 3.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.03125, -19.38671875, -18.7421875, -18.09765625, -17.453125, -16.80859375, -16.1640625, -15.51953125, -14.875, -14.23046875, -13.5859375, -12.94140625, -12.296875, -11.65234375, -11.0078125, -10.36328125, -9.71875, -9.07421875, -8.4296875, -7.78515625, -7.140625, -6.49609375, -5.8515625, -5.20703125, -4.5625, -3.91796875, -3.2734375, -2.62890625, -1.984375, -1.33984375, -0.6953125, -0.05078125, 0.59375, 1.23828125, 1.8828125, 2.52734375, 3.171875, 3.81640625, 4.4609375, 5.10546875, 5.75, 6.39453125, 7.0390625, 7.68359375, 8.328125, 8.97265625, 9.6171875, 10.26171875, 10.90625, 11.55078125, 12.1953125, 12.83984375, 13.484375, 14.12890625, 14.7734375, 15.41796875, 16.0625, 16.70703125, 17.3515625, 17.99609375, 18.640625, 19.28515625, 19.9296875, 20.57421875, 21.21875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 7.0, 12.0, 16.0, 21.0, 29.0, 32.0, 61.0, 53.0, 80.0, 74.0, 77.0, 88.0, 78.0, 58.0, 67.0, 55.0, 62.0, 28.0, 22.0, 14.0, 20.0, 12.0, 6.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.082929611206055, -30.205961227416992, -29.32899284362793, -28.452024459838867, -27.575057983398438, -26.698089599609375, -25.821121215820312, -24.94415283203125, -24.067184448242188, -23.190216064453125, -22.313247680664062, -21.436279296875, -20.559310913085938, -19.682342529296875, -18.805376052856445, -17.928407669067383, -17.05143928527832, -16.174470901489258, -15.297502517700195, -14.42053508758545, -13.543566703796387, -12.666598320007324, -11.789630889892578, -10.912662506103516, -10.035694122314453, -9.15872573852539, -8.281757354736328, -7.404789924621582, -6.5278215408325195, -5.650853157043457, -4.773885250091553, -3.8969173431396484, -3.0199508666992188, -2.1429827213287354, -1.266014575958252, -0.38904643058776855, 0.48792171478271484, 1.3648900985717773, 2.2418580055236816, 3.118825912475586, 3.9957942962646484, 4.872762680053711, 5.749730587005615, 6.6266984939575195, 7.503666877746582, 8.380635261535645, 9.25760269165039, 10.134571075439453, 11.011539459228516, 11.888507843017578, 12.76547622680664, 13.642443656921387, 14.51941204071045, 15.396380424499512, 16.273347854614258, 17.15031623840332, 18.027284622192383, 18.904253005981445, 19.781221389770508, 20.65818977355957, 21.53515625, 22.412124633789062, 23.289093017578125, 24.166061401367188, 25.04302978515625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 9.0, 9.0, 14.0, 12.0, 11.0, 19.0, 21.0, 18.0, 33.0, 27.0, 33.0, 46.0, 42.0, 37.0, 41.0, 50.0, 47.0, 50.0, 28.0, 50.0, 36.0, 33.0, 36.0, 36.0, 33.0, 31.0, 31.0, 22.0, 33.0, 13.0, 11.0, 9.0, 18.0, 12.0, 5.0, 7.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.095518112182617, -23.30828857421875, -22.52105712890625, -21.733827590942383, -20.946598052978516, -20.159366607666016, -19.37213706970215, -18.58490753173828, -17.79767608642578, -17.010446548461914, -16.223215103149414, -15.435985565185547, -14.64875602722168, -13.861525535583496, -13.074295043945312, -12.287065505981445, -11.499835968017578, -10.712605476379395, -9.925375938415527, -9.138145446777344, -8.350915908813477, -7.563685417175293, -6.776454925537109, -5.989224910736084, -5.201994895935059, -4.414764881134033, -3.6275346279144287, -2.840304374694824, -2.053074359893799, -1.2658443450927734, -0.47861385345458984, 0.30861616134643555, 1.0958480834960938, 1.8830782175064087, 2.6703083515167236, 3.457538604736328, 4.2447686195373535, 5.031998634338379, 5.8192291259765625, 6.606459140777588, 7.393689155578613, 8.180919647216797, 8.968149185180664, 9.755379676818848, 10.542610168457031, 11.329839706420898, 12.117070198059082, 12.904300689697266, 13.691530227661133, 14.478760719299316, 15.265990257263184, 16.053220748901367, 16.840450286865234, 17.627681732177734, 18.4149112701416, 19.20214080810547, 19.98937225341797, 20.776601791381836, 21.563833236694336, 22.351062774658203, 23.13829231262207, 23.925521850585938, 24.712753295898438, 25.499982833862305, 26.287212371826172]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 11.0, 11.0, 11.0, 14.0, 17.0, 30.0, 24.0, 33.0, 35.0, 35.0, 53.0, 48.0, 42.0, 49.0, 52.0, 40.0, 52.0, 48.0, 44.0, 35.0, 38.0, 37.0, 28.0, 30.0, 31.0, 25.0, 18.0, 16.0, 23.0, 12.0, 8.0, 9.0, 8.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.994140625, -3.871368408203125, -3.74859619140625, -3.625823974609375, -3.5030517578125, -3.380279541015625, -3.25750732421875, -3.134735107421875, -3.011962890625, -2.889190673828125, -2.76641845703125, -2.643646240234375, -2.5208740234375, -2.398101806640625, -2.27532958984375, -2.152557373046875, -2.02978515625, -1.907012939453125, -1.78424072265625, -1.661468505859375, -1.5386962890625, -1.415924072265625, -1.29315185546875, -1.170379638671875, -1.047607421875, -0.924835205078125, -0.80206298828125, -0.679290771484375, -0.5565185546875, -0.433746337890625, -0.31097412109375, -0.188201904296875, -0.0654296875, 0.057342529296875, 0.18011474609375, 0.302886962890625, 0.4256591796875, 0.548431396484375, 0.67120361328125, 0.793975830078125, 0.916748046875, 1.039520263671875, 1.16229248046875, 1.285064697265625, 1.4078369140625, 1.530609130859375, 1.65338134765625, 1.776153564453125, 1.89892578125, 2.021697998046875, 2.14447021484375, 2.267242431640625, 2.3900146484375, 2.512786865234375, 2.63555908203125, 2.758331298828125, 2.881103515625, 3.003875732421875, 3.12664794921875, 3.249420166015625, 3.3721923828125, 3.494964599609375, 3.61773681640625, 3.740509033203125, 3.86328125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 10.0, 19.0, 27.0, 38.0, 64.0, 96.0, 161.0, 236.0, 415.0, 705.0, 1214.0, 2469.0, 4877.0, 10272.0, 21936.0, 47147.0, 98479.0, 181620.0, 244307.0, 204961.0, 119300.0, 58322.0, 27114.0, 12568.0, 5789.0, 2934.0, 1498.0, 825.0, 442.0, 260.0, 166.0, 106.0, 57.0, 38.0, 29.0, 12.0, 10.0, 13.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7393951416015625, -0.718048095703125, -0.6967010498046875, -0.67535400390625, -0.6540069580078125, -0.632659912109375, -0.6113128662109375, -0.5899658203125, -0.5686187744140625, -0.547271728515625, -0.5259246826171875, -0.50457763671875, -0.4832305908203125, -0.461883544921875, -0.4405364990234375, -0.419189453125, -0.3978424072265625, -0.376495361328125, -0.3551483154296875, -0.33380126953125, -0.3124542236328125, -0.291107177734375, -0.2697601318359375, -0.2484130859375, -0.2270660400390625, -0.205718994140625, -0.1843719482421875, -0.16302490234375, -0.1416778564453125, -0.120330810546875, -0.0989837646484375, -0.07763671875, -0.0562896728515625, -0.034942626953125, -0.0135955810546875, 0.00775146484375, 0.0290985107421875, 0.050445556640625, 0.0717926025390625, 0.0931396484375, 0.1144866943359375, 0.135833740234375, 0.1571807861328125, 0.17852783203125, 0.1998748779296875, 0.221221923828125, 0.2425689697265625, 0.263916015625, 0.2852630615234375, 0.306610107421875, 0.3279571533203125, 0.34930419921875, 0.3706512451171875, 0.391998291015625, 0.4133453369140625, 0.4346923828125, 0.4560394287109375, 0.477386474609375, 0.4987335205078125, 0.52008056640625, 0.5414276123046875, 0.562774658203125, 0.5841217041015625, 0.60546875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 7.0, 10.0, 17.0, 15.0, 19.0, 16.0, 15.0, 23.0, 21.0, 29.0, 33.0, 41.0, 38.0, 34.0, 40.0, 26.0, 40.0, 41.0, 36.0, 1055.0, 46.0, 38.0, 38.0, 28.0, 47.0, 30.0, 22.0, 31.0, 25.0, 23.0, 24.0, 33.0, 18.0, 10.0, 11.0, 6.0, 6.0, 6.0, 11.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.4114990234375, -2.328857421875, -2.2462158203125, -2.16357421875, -2.0809326171875, -1.998291015625, -1.9156494140625, -1.8330078125, -1.7503662109375, -1.667724609375, -1.5850830078125, -1.50244140625, -1.4197998046875, -1.337158203125, -1.2545166015625, -1.171875, -1.0892333984375, -1.006591796875, -0.9239501953125, -0.84130859375, -0.7586669921875, -0.676025390625, -0.5933837890625, -0.5107421875, -0.4281005859375, -0.345458984375, -0.2628173828125, -0.18017578125, -0.0975341796875, -0.014892578125, 0.0677490234375, 0.150390625, 0.2330322265625, 0.315673828125, 0.3983154296875, 0.48095703125, 0.5635986328125, 0.646240234375, 0.7288818359375, 0.8115234375, 0.8941650390625, 0.976806640625, 1.0594482421875, 1.14208984375, 1.2247314453125, 1.307373046875, 1.3900146484375, 1.47265625, 1.5552978515625, 1.637939453125, 1.7205810546875, 1.80322265625, 1.8858642578125, 1.968505859375, 2.0511474609375, 2.1337890625, 2.2164306640625, 2.299072265625, 2.3817138671875, 2.46435546875, 2.5469970703125, 2.629638671875, 2.7122802734375, 2.794921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 7.0, 3.0, 10.0, 11.0, 26.0, 17.0, 25.0, 49.0, 73.0, 89.0, 115.0, 179.0, 294.0, 397.0, 637.0, 1060.0, 1590.0, 2740.0, 5126.0, 11205.0, 27204.0, 70125.0, 172058.0, 1223901.0, 364082.0, 127637.0, 50195.0, 19883.0, 8394.0, 4068.0, 2199.0, 1297.0, 789.0, 533.0, 335.0, 232.0, 176.0, 113.0, 82.0, 68.0, 40.0, 26.0, 16.0, 10.0, 9.0, 6.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.401611328125, -0.3900794982910156, -0.37854766845703125, -0.3670158386230469, -0.3554840087890625, -0.3439521789550781, -0.33242034912109375, -0.3208885192871094, -0.309356689453125, -0.2978248596191406, -0.28629302978515625, -0.2747611999511719, -0.2632293701171875, -0.2516975402832031, -0.24016571044921875, -0.22863388061523438, -0.21710205078125, -0.20557022094726562, -0.19403839111328125, -0.18250656127929688, -0.1709747314453125, -0.15944290161132812, -0.14791107177734375, -0.13637924194335938, -0.124847412109375, -0.11331558227539062, -0.10178375244140625, -0.09025192260742188, -0.0787200927734375, -0.06718826293945312, -0.05565643310546875, -0.044124603271484375, -0.0325927734375, -0.021060943603515625, -0.00952911376953125, 0.002002716064453125, 0.0135345458984375, 0.025066375732421875, 0.03659820556640625, 0.048130035400390625, 0.059661865234375, 0.07119369506835938, 0.08272552490234375, 0.09425735473632812, 0.1057891845703125, 0.11732101440429688, 0.12885284423828125, 0.14038467407226562, 0.15191650390625, 0.16344833374023438, 0.17498016357421875, 0.18651199340820312, 0.1980438232421875, 0.20957565307617188, 0.22110748291015625, 0.23263931274414062, 0.244171142578125, 0.2557029724121094, 0.26723480224609375, 0.2787666320800781, 0.2902984619140625, 0.3018302917480469, 0.31336212158203125, 0.3248939514160156, 0.33642578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 1.0, 4.0, 10.0, 9.0, 12.0, 11.0, 13.0, 23.0, 25.0, 46.0, 74.0, 98.0, 110.0, 120.0, 133.0, 90.0, 51.0, 42.0, 22.0, 20.0, 14.0, 13.0, 11.0, 9.0, 8.0, 7.0, 7.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08428955078125, -0.08183479309082031, -0.07938003540039062, -0.07692527770996094, -0.07447052001953125, -0.07201576232910156, -0.06956100463867188, -0.06710624694824219, -0.0646514892578125, -0.06219673156738281, -0.059741973876953125, -0.05728721618652344, -0.05483245849609375, -0.05237770080566406, -0.049922943115234375, -0.04746818542480469, -0.045013427734375, -0.04255867004394531, -0.040103912353515625, -0.03764915466308594, -0.03519439697265625, -0.03273963928222656, -0.030284881591796875, -0.027830123901367188, -0.0253753662109375, -0.022920608520507812, -0.020465850830078125, -0.018011093139648438, -0.01555633544921875, -0.013101577758789062, -0.010646820068359375, -0.008192062377929688, -0.0057373046875, -0.0032825469970703125, -0.000827789306640625, 0.0016269683837890625, 0.00408172607421875, 0.0065364837646484375, 0.008991241455078125, 0.011445999145507812, 0.0139007568359375, 0.016355514526367188, 0.018810272216796875, 0.021265029907226562, 0.02371978759765625, 0.026174545288085938, 0.028629302978515625, 0.031084060668945312, 0.033538818359375, 0.03599357604980469, 0.038448333740234375, 0.04090309143066406, 0.04335784912109375, 0.04581260681152344, 0.048267364501953125, 0.05072212219238281, 0.0531768798828125, 0.05563163757324219, 0.058086395263671875, 0.06054115295410156, 0.06299591064453125, 0.06545066833496094, 0.06790542602539062, 0.07036018371582031, 0.07281494140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 12.0, 15.0, 12.0, 28.0, 41.0, 80.0, 135.0, 442.0, 7773.0, 1032543.0, 6672.0, 405.0, 159.0, 65.0, 39.0, 24.0, 13.0, 13.0, 13.0, 8.0, 9.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.649139404296875, -1.59124755859375, -1.533355712890625, -1.4754638671875, -1.417572021484375, -1.35968017578125, -1.301788330078125, -1.243896484375, -1.186004638671875, -1.12811279296875, -1.070220947265625, -1.0123291015625, -0.954437255859375, -0.89654541015625, -0.838653564453125, -0.78076171875, -0.722869873046875, -0.66497802734375, -0.607086181640625, -0.5491943359375, -0.491302490234375, -0.43341064453125, -0.375518798828125, -0.317626953125, -0.259735107421875, -0.20184326171875, -0.143951416015625, -0.0860595703125, -0.028167724609375, 0.02972412109375, 0.087615966796875, 0.1455078125, 0.203399658203125, 0.26129150390625, 0.319183349609375, 0.3770751953125, 0.434967041015625, 0.49285888671875, 0.550750732421875, 0.608642578125, 0.666534423828125, 0.72442626953125, 0.782318115234375, 0.8402099609375, 0.898101806640625, 0.95599365234375, 1.013885498046875, 1.07177734375, 1.129669189453125, 1.18756103515625, 1.245452880859375, 1.3033447265625, 1.361236572265625, 1.41912841796875, 1.477020263671875, 1.534912109375, 1.592803955078125, 1.65069580078125, 1.708587646484375, 1.7664794921875, 1.824371337890625, 1.88226318359375, 1.940155029296875, 1.998046875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 19.0, 16.0, 26.0, 59.0, 102.0, 170.0, 229.0, 138.0, 101.0, 50.0, 25.0, 22.0, 15.0, 3.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30595648288726807, -0.29777663946151733, -0.2895967960357666, -0.28141695261001587, -0.27323710918426514, -0.2650572657585144, -0.25687742233276367, -0.24869756400585175, -0.24051770567893982, -0.2323378622531891, -0.22415801882743835, -0.21597817540168762, -0.2077983170747757, -0.19961847364902496, -0.19143863022327423, -0.1832587867975235, -0.17507894337177277, -0.16689909994602203, -0.1587192565202713, -0.15053939819335938, -0.14235955476760864, -0.1341797113418579, -0.12599986791610718, -0.11782002449035645, -0.10964017361402512, -0.10146033018827438, -0.09328047931194305, -0.08510063588619232, -0.07692079246044159, -0.06874094158411026, -0.06056109815835953, -0.0523812510073185, -0.044201403856277466, -0.036021556705236435, -0.027841711416840553, -0.01966186612844467, -0.01148201897740364, -0.00330217182636261, 0.0048776715993881226, 0.013057518750429153, 0.021237365901470184, 0.029417213052511215, 0.037597060203552246, 0.04577690362930298, 0.05395675078034401, 0.06213659793138504, 0.07031644135713577, 0.0784962922334671, 0.08667613565921783, 0.09485597908496857, 0.1030358299612999, 0.11121567338705063, 0.11939552426338196, 0.1275753676891327, 0.13575521111488342, 0.14393505454063416, 0.1521148979663849, 0.16029474139213562, 0.16847458481788635, 0.17665442824363708, 0.184834286570549, 0.19301412999629974, 0.20119397342205048, 0.2093738168478012, 0.21755367517471313]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 6.0, 5.0, 7.0, 12.0, 16.0, 17.0, 19.0, 18.0, 17.0, 20.0, 25.0, 32.0, 30.0, 26.0, 32.0, 40.0, 41.0, 42.0, 43.0, 43.0, 45.0, 47.0, 34.0, 37.0, 35.0, 37.0, 37.0, 25.0, 28.0, 20.0, 16.0, 21.0, 23.0, 12.0, 10.0, 10.0, 12.0, 10.0, 13.0, 6.0, 4.0, 4.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.10851395130157471, -0.10503684729337692, -0.10155974328517914, -0.09808264672756195, -0.09460554271936417, -0.09112843871116638, -0.0876513421535492, -0.08417423814535141, -0.08069713413715363, -0.07722003012895584, -0.07374292612075806, -0.07026582956314087, -0.06678872555494308, -0.0633116215467453, -0.059834521263837814, -0.05635742098093033, -0.052880316972732544, -0.04940321296453476, -0.045926112681627274, -0.04244901239871979, -0.038971908390522, -0.03549480438232422, -0.03201770409941673, -0.028540601953864098, -0.025063499808311462, -0.021586397662758827, -0.018109295517206192, -0.014632193371653557, -0.011155091226100922, -0.0076779890805482864, -0.004200886934995651, -0.000723784789443016, 0.002753317356109619, 0.006230419501662254, 0.00970752164721489, 0.013184623792767525, 0.01666172593832016, 0.020138828083872795, 0.02361593022942543, 0.027093032374978065, 0.0305701345205307, 0.034047238528728485, 0.03752433881163597, 0.04100143909454346, 0.04447854310274124, 0.047955647110939026, 0.05143274739384651, 0.054909847676754, 0.05838695168495178, 0.06186405569314957, 0.06534115970134735, 0.06881825625896454, 0.07229536026716232, 0.07577246427536011, 0.0792495608329773, 0.08272666484117508, 0.08620376884937286, 0.08968087285757065, 0.09315797686576843, 0.09663507342338562, 0.1001121774315834, 0.10358928143978119, 0.10706637799739838, 0.11054348200559616, 0.11402058601379395]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 17.0, 12.0, 13.0, 21.0, 17.0, 23.0, 29.0, 41.0, 42.0, 38.0, 57.0, 36.0, 56.0, 54.0, 58.0, 52.0, 51.0, 45.0, 35.0, 38.0, 41.0, 31.0, 37.0, 23.0, 24.0, 21.0, 19.0, 16.0, 8.0, 8.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.984375, -3.8572998046875, -3.730224609375, -3.6031494140625, -3.47607421875, -3.3489990234375, -3.221923828125, -3.0948486328125, -2.9677734375, -2.8406982421875, -2.713623046875, -2.5865478515625, -2.45947265625, -2.3323974609375, -2.205322265625, -2.0782470703125, -1.951171875, -1.8240966796875, -1.697021484375, -1.5699462890625, -1.44287109375, -1.3157958984375, -1.188720703125, -1.0616455078125, -0.9345703125, -0.8074951171875, -0.680419921875, -0.5533447265625, -0.42626953125, -0.2991943359375, -0.172119140625, -0.0450439453125, 0.08203125, 0.2091064453125, 0.336181640625, 0.4632568359375, 0.59033203125, 0.7174072265625, 0.844482421875, 0.9715576171875, 1.0986328125, 1.2257080078125, 1.352783203125, 1.4798583984375, 1.60693359375, 1.7340087890625, 1.861083984375, 1.9881591796875, 2.115234375, 2.2423095703125, 2.369384765625, 2.4964599609375, 2.62353515625, 2.7506103515625, 2.877685546875, 3.0047607421875, 3.1318359375, 3.2589111328125, 3.385986328125, 3.5130615234375, 3.64013671875, 3.7672119140625, 3.894287109375, 4.0213623046875, 4.1484375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 5.0, 9.0, 12.0, 28.0, 27.0, 37.0, 56.0, 72.0, 137.0, 203.0, 341.0, 582.0, 963.0, 1687.0, 3047.0, 5696.0, 11040.0, 21934.0, 44947.0, 90846.0, 174223.0, 300648.0, 190880.0, 100477.0, 50128.0, 24254.0, 12105.0, 6381.0, 3315.0, 1803.0, 1014.0, 646.0, 325.0, 234.0, 152.0, 97.0, 57.0, 49.0, 29.0, 15.0, 19.0, 7.0, 10.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.119140625, -3.017120361328125, -2.91510009765625, -2.813079833984375, -2.7110595703125, -2.609039306640625, -2.50701904296875, -2.404998779296875, -2.302978515625, -2.200958251953125, -2.09893798828125, -1.996917724609375, -1.8948974609375, -1.792877197265625, -1.69085693359375, -1.588836669921875, -1.48681640625, -1.384796142578125, -1.28277587890625, -1.180755615234375, -1.0787353515625, -0.976715087890625, -0.87469482421875, -0.772674560546875, -0.670654296875, -0.568634033203125, -0.46661376953125, -0.364593505859375, -0.2625732421875, -0.160552978515625, -0.05853271484375, 0.043487548828125, 0.1455078125, 0.247528076171875, 0.34954833984375, 0.451568603515625, 0.5535888671875, 0.655609130859375, 0.75762939453125, 0.859649658203125, 0.961669921875, 1.063690185546875, 1.16571044921875, 1.267730712890625, 1.3697509765625, 1.471771240234375, 1.57379150390625, 1.675811767578125, 1.77783203125, 1.879852294921875, 1.98187255859375, 2.083892822265625, 2.1859130859375, 2.287933349609375, 2.38995361328125, 2.491973876953125, 2.593994140625, 2.696014404296875, 2.79803466796875, 2.900054931640625, 3.0020751953125, 3.104095458984375, 3.20611572265625, 3.308135986328125, 3.41015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 7.0, 11.0, 8.0, 12.0, 15.0, 12.0, 25.0, 29.0, 25.0, 44.0, 35.0, 54.0, 57.0, 91.0, 117.0, 245.0, 1456.0, 227.0, 128.0, 72.0, 50.0, 47.0, 42.0, 32.0, 39.0, 26.0, 24.0, 15.0, 21.0, 18.0, 7.0, 16.0, 9.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.640625, -13.255615234375, -12.87060546875, -12.485595703125, -12.1005859375, -11.715576171875, -11.33056640625, -10.945556640625, -10.560546875, -10.175537109375, -9.79052734375, -9.405517578125, -9.0205078125, -8.635498046875, -8.25048828125, -7.865478515625, -7.48046875, -7.095458984375, -6.71044921875, -6.325439453125, -5.9404296875, -5.555419921875, -5.17041015625, -4.785400390625, -4.400390625, -4.015380859375, -3.63037109375, -3.245361328125, -2.8603515625, -2.475341796875, -2.09033203125, -1.705322265625, -1.3203125, -0.935302734375, -0.55029296875, -0.165283203125, 0.2197265625, 0.604736328125, 0.98974609375, 1.374755859375, 1.759765625, 2.144775390625, 2.52978515625, 2.914794921875, 3.2998046875, 3.684814453125, 4.06982421875, 4.454833984375, 4.83984375, 5.224853515625, 5.60986328125, 5.994873046875, 6.3798828125, 6.764892578125, 7.14990234375, 7.534912109375, 7.919921875, 8.304931640625, 8.68994140625, 9.074951171875, 9.4599609375, 9.844970703125, 10.22998046875, 10.614990234375, 11.0]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 7.0, 5.0, 7.0, 12.0, 17.0, 14.0, 33.0, 43.0, 71.0, 74.0, 122.0, 166.0, 291.0, 424.0, 900.0, 14025.0, 3051140.0, 75538.0, 1430.0, 515.0, 283.0, 172.0, 111.0, 89.0, 67.0, 49.0, 21.0, 27.0, 13.0, 12.0, 8.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.940673828125, -29.89697265625, -28.853271484375, -27.8095703125, -26.765869140625, -25.72216796875, -24.678466796875, -23.634765625, -22.591064453125, -21.54736328125, -20.503662109375, -19.4599609375, -18.416259765625, -17.37255859375, -16.328857421875, -15.28515625, -14.241455078125, -13.19775390625, -12.154052734375, -11.1103515625, -10.066650390625, -9.02294921875, -7.979248046875, -6.935546875, -5.891845703125, -4.84814453125, -3.804443359375, -2.7607421875, -1.717041015625, -0.67333984375, 0.370361328125, 1.4140625, 2.457763671875, 3.50146484375, 4.545166015625, 5.5888671875, 6.632568359375, 7.67626953125, 8.719970703125, 9.763671875, 10.807373046875, 11.85107421875, 12.894775390625, 13.9384765625, 14.982177734375, 16.02587890625, 17.069580078125, 18.11328125, 19.156982421875, 20.20068359375, 21.244384765625, 22.2880859375, 23.331787109375, 24.37548828125, 25.419189453125, 26.462890625, 27.506591796875, 28.55029296875, 29.593994140625, 30.6376953125, 31.681396484375, 32.72509765625, 33.768798828125, 34.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 59.0, 588.0, 353.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.212997436523438, -12.006647109985352, -7.800296783447266, -3.5939464569091797, 0.6124038696289062, 4.818754196166992, 9.025104522705078, 13.231454849243164, 17.43780517578125, 21.644155502319336, 25.850505828857422, 30.056856155395508, 34.263206481933594, 38.46955871582031, 42.675907135009766, 46.88225555419922, 51.08860778808594, 55.294960021972656, 59.50130844116211, 63.70765686035156, 67.91400909423828, 72.120361328125, 76.32670593261719, 80.5330581665039, 84.73941040039062, 88.94576263427734, 93.15211486816406, 97.35845947265625, 101.56481170654297, 105.77116394042969, 109.97750854492188, 114.1838607788086, 118.39021301269531, 122.59656524658203, 126.80291748046875, 131.00926208496094, 135.21560668945312, 139.42196655273438, 143.62831115722656, 147.8346710205078, 152.041015625, 156.2473602294922, 160.45372009277344, 164.66006469726562, 168.86642456054688, 173.07276916503906, 177.27911376953125, 181.4854736328125, 185.6918182373047, 189.89816284179688, 194.10452270507812, 198.3108673095703, 202.5172119140625, 206.72357177734375, 210.92991638183594, 215.1362762451172, 219.34262084960938, 223.54896545410156, 227.7553253173828, 231.961669921875, 236.16802978515625, 240.37437438964844, 244.58071899414062, 248.78707885742188, 252.99342346191406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 3.0, 6.0, 12.0, 11.0, 22.0, 23.0, 18.0, 22.0, 33.0, 25.0, 35.0, 43.0, 36.0, 26.0, 41.0, 49.0, 34.0, 29.0, 49.0, 38.0, 33.0, 35.0, 25.0, 25.0, 43.0, 37.0, 32.0, 22.0, 16.0, 19.0, 17.0, 16.0, 16.0, 15.0, 15.0, 14.0, 12.0, 9.0, 6.0, 4.0, 3.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-26.746265411376953, -25.83853530883789, -24.930803298950195, -24.0230712890625, -23.115341186523438, -22.207611083984375, -21.29987907409668, -20.392147064208984, -19.484416961669922, -18.57668685913086, -17.668954849243164, -16.76122283935547, -15.853492736816406, -14.945761680603027, -14.038030624389648, -13.13029956817627, -12.22256851196289, -11.314837455749512, -10.407106399536133, -9.499375343322754, -8.591644287109375, -7.683913230895996, -6.776182174682617, -5.868451118469238, -4.960720062255859, -4.0529890060424805, -3.1452579498291016, -2.2375268936157227, -1.3297958374023438, -0.42206478118896484, 0.48566627502441406, 1.393397331237793, 2.301128387451172, 3.208859443664551, 4.11659049987793, 5.024321556091309, 5.9320526123046875, 6.839783668518066, 7.747514724731445, 8.655245780944824, 9.562976837158203, 10.470707893371582, 11.378438949584961, 12.28617000579834, 13.193901062011719, 14.101632118225098, 15.009363174438477, 15.917094230651855, 16.824825286865234, 17.732555389404297, 18.640287399291992, 19.548019409179688, 20.45574951171875, 21.363479614257812, 22.271211624145508, 23.178943634033203, 24.086673736572266, 24.994403839111328, 25.902135848999023, 26.80986785888672, 27.71759796142578, 28.625328063964844, 29.53306007385254, 30.440792083740234, 31.348522186279297]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 5.0, 10.0, 14.0, 15.0, 14.0, 21.0, 20.0, 27.0, 36.0, 38.0, 38.0, 32.0, 48.0, 49.0, 66.0, 61.0, 51.0, 48.0, 41.0, 51.0, 36.0, 46.0, 40.0, 27.0, 30.0, 25.0, 19.0, 29.0, 20.0, 12.0, 7.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.00390625, -4.8623046875, -4.720703125, -4.5791015625, -4.4375, -4.2958984375, -4.154296875, -4.0126953125, -3.87109375, -3.7294921875, -3.587890625, -3.4462890625, -3.3046875, -3.1630859375, -3.021484375, -2.8798828125, -2.73828125, -2.5966796875, -2.455078125, -2.3134765625, -2.171875, -2.0302734375, -1.888671875, -1.7470703125, -1.60546875, -1.4638671875, -1.322265625, -1.1806640625, -1.0390625, -0.8974609375, -0.755859375, -0.6142578125, -0.47265625, -0.3310546875, -0.189453125, -0.0478515625, 0.09375, 0.2353515625, 0.376953125, 0.5185546875, 0.66015625, 0.8017578125, 0.943359375, 1.0849609375, 1.2265625, 1.3681640625, 1.509765625, 1.6513671875, 1.79296875, 1.9345703125, 2.076171875, 2.2177734375, 2.359375, 2.5009765625, 2.642578125, 2.7841796875, 2.92578125, 3.0673828125, 3.208984375, 3.3505859375, 3.4921875, 3.6337890625, 3.775390625, 3.9169921875, 4.05859375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 6.0, 13.0, 17.0, 25.0, 42.0, 37.0, 74.0, 102.0, 122.0, 164.0, 246.0, 323.0, 474.0, 729.0, 1078.0, 1729.0, 3121.0, 6414.0, 17330.0, 70247.0, 370300.0, 1553972.0, 1641944.0, 414546.0, 78610.0, 18798.0, 6329.0, 2915.0, 1541.0, 976.0, 644.0, 453.0, 284.0, 202.0, 153.0, 105.0, 54.0, 51.0, 38.0, 20.0, 19.0, 9.0, 12.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6767578125, -6.474609375, -6.2724609375, -6.0703125, -5.8681640625, -5.666015625, -5.4638671875, -5.26171875, -5.0595703125, -4.857421875, -4.6552734375, -4.453125, -4.2509765625, -4.048828125, -3.8466796875, -3.64453125, -3.4423828125, -3.240234375, -3.0380859375, -2.8359375, -2.6337890625, -2.431640625, -2.2294921875, -2.02734375, -1.8251953125, -1.623046875, -1.4208984375, -1.21875, -1.0166015625, -0.814453125, -0.6123046875, -0.41015625, -0.2080078125, -0.005859375, 0.1962890625, 0.3984375, 0.6005859375, 0.802734375, 1.0048828125, 1.20703125, 1.4091796875, 1.611328125, 1.8134765625, 2.015625, 2.2177734375, 2.419921875, 2.6220703125, 2.82421875, 3.0263671875, 3.228515625, 3.4306640625, 3.6328125, 3.8349609375, 4.037109375, 4.2392578125, 4.44140625, 4.6435546875, 4.845703125, 5.0478515625, 5.25, 5.4521484375, 5.654296875, 5.8564453125, 6.05859375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [6.0, 2.0, 0.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 13.0, 19.0, 13.0, 15.0, 17.0, 28.0, 24.0, 38.0, 27.0, 45.0, 56.0, 72.0, 84.0, 110.0, 137.0, 173.0, 228.0, 271.0, 284.0, 335.0, 315.0, 317.0, 256.0, 222.0, 176.0, 149.0, 122.0, 91.0, 81.0, 63.0, 53.0, 44.0, 32.0, 27.0, 20.0, 18.0, 15.0, 12.0, 12.0, 5.0, 8.0, 13.0, 4.0, 5.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.700927734375, -4.53857421875, -4.376220703125, -4.2138671875, -4.051513671875, -3.88916015625, -3.726806640625, -3.564453125, -3.402099609375, -3.23974609375, -3.077392578125, -2.9150390625, -2.752685546875, -2.59033203125, -2.427978515625, -2.265625, -2.103271484375, -1.94091796875, -1.778564453125, -1.6162109375, -1.453857421875, -1.29150390625, -1.129150390625, -0.966796875, -0.804443359375, -0.64208984375, -0.479736328125, -0.3173828125, -0.155029296875, 0.00732421875, 0.169677734375, 0.33203125, 0.494384765625, 0.65673828125, 0.819091796875, 0.9814453125, 1.143798828125, 1.30615234375, 1.468505859375, 1.630859375, 1.793212890625, 1.95556640625, 2.117919921875, 2.2802734375, 2.442626953125, 2.60498046875, 2.767333984375, 2.9296875, 3.092041015625, 3.25439453125, 3.416748046875, 3.5791015625, 3.741455078125, 3.90380859375, 4.066162109375, 4.228515625, 4.390869140625, 4.55322265625, 4.715576171875, 4.8779296875, 5.040283203125, 5.20263671875, 5.364990234375, 5.52734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 8.0, 9.0, 8.0, 5.0, 5.0, 11.0, 18.0, 12.0, 17.0, 27.0, 34.0, 46.0, 65.0, 76.0, 110.0, 110.0, 154.0, 258.0, 483.0, 1207.0, 4603.0, 32782.0, 593594.0, 3217991.0, 316108.0, 20982.0, 3363.0, 933.0, 405.0, 210.0, 147.0, 115.0, 73.0, 60.0, 42.0, 38.0, 40.0, 28.0, 20.0, 16.0, 14.0, 15.0, 13.0, 8.0, 3.0, 6.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0], "bins": [-18.125, -17.59814453125, -17.0712890625, -16.54443359375, -16.017578125, -15.49072265625, -14.9638671875, -14.43701171875, -13.91015625, -13.38330078125, -12.8564453125, -12.32958984375, -11.802734375, -11.27587890625, -10.7490234375, -10.22216796875, -9.6953125, -9.16845703125, -8.6416015625, -8.11474609375, -7.587890625, -7.06103515625, -6.5341796875, -6.00732421875, -5.48046875, -4.95361328125, -4.4267578125, -3.89990234375, -3.373046875, -2.84619140625, -2.3193359375, -1.79248046875, -1.265625, -0.73876953125, -0.2119140625, 0.31494140625, 0.841796875, 1.36865234375, 1.8955078125, 2.42236328125, 2.94921875, 3.47607421875, 4.0029296875, 4.52978515625, 5.056640625, 5.58349609375, 6.1103515625, 6.63720703125, 7.1640625, 7.69091796875, 8.2177734375, 8.74462890625, 9.271484375, 9.79833984375, 10.3251953125, 10.85205078125, 11.37890625, 11.90576171875, 12.4326171875, 12.95947265625, 13.486328125, 14.01318359375, 14.5400390625, 15.06689453125, 15.59375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 5.0, 16.0, 13.0, 23.0, 30.0, 30.0, 34.0, 46.0, 59.0, 59.0, 56.0, 67.0, 52.0, 79.0, 59.0, 60.0, 50.0, 50.0, 48.0, 34.0, 31.0, 24.0, 12.0, 14.0, 7.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.221803665161133, -26.56178855895996, -25.901775360107422, -25.24176025390625, -24.581745147705078, -23.92173194885254, -23.261716842651367, -22.601703643798828, -21.941688537597656, -21.281673431396484, -20.621660232543945, -19.961645126342773, -19.301631927490234, -18.641616821289062, -17.98160171508789, -17.32158660888672, -16.66157341003418, -16.001558303833008, -15.341545104980469, -14.681529998779297, -14.021515846252441, -13.361501693725586, -12.701486587524414, -12.041472434997559, -11.381458282470703, -10.721444129943848, -10.061429977416992, -9.40141487121582, -8.741400718688965, -8.08138656616211, -7.421371936798096, -6.761357307434082, -6.101341247558594, -5.441327095031738, -4.781312465667725, -4.121297836303711, -3.4612836837768555, -2.801269292831421, -2.1412549018859863, -1.4812402725219727, -0.8212261199951172, -0.16121172904968262, 0.49880266189575195, 1.1588170528411865, 1.818831443786621, 2.4788458347320557, 3.1388602256774902, 3.798874855041504, 4.458889007568359, 5.118903160095215, 5.7789177894592285, 6.438932418823242, 7.098946571350098, 7.758960723876953, 8.418975830078125, 9.07898998260498, 9.739004135131836, 10.399018287658691, 11.059032440185547, 11.719047546386719, 12.379061698913574, 13.03907585144043, 13.699090957641602, 14.359105110168457, 15.019119262695312]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 5.0, 8.0, 13.0, 10.0, 14.0, 13.0, 17.0, 26.0, 32.0, 35.0, 28.0, 24.0, 37.0, 35.0, 47.0, 42.0, 53.0, 34.0, 47.0, 59.0, 34.0, 34.0, 45.0, 39.0, 28.0, 28.0, 32.0, 27.0, 25.0, 13.0, 31.0, 13.0, 17.0, 6.0, 9.0, 8.0, 2.0, 12.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.955812454223633, -24.187835693359375, -23.419858932495117, -22.65188217163086, -21.8839054107666, -21.115928649902344, -20.347951889038086, -19.579975128173828, -18.81199836730957, -18.044021606445312, -17.276044845581055, -16.508068084716797, -15.740091323852539, -14.972114562988281, -14.204137802124023, -13.436161041259766, -12.668184280395508, -11.90020751953125, -11.132230758666992, -10.364253997802734, -9.596277236938477, -8.828300476074219, -8.060323715209961, -7.292346954345703, -6.524370193481445, -5.7563934326171875, -4.98841667175293, -4.220439910888672, -3.452463150024414, -2.6844863891601562, -1.9165096282958984, -1.1485328674316406, -0.3805561065673828, 0.387420654296875, 1.1553974151611328, 1.9233741760253906, 2.6913509368896484, 3.4593276977539062, 4.227304458618164, 4.995281219482422, 5.76325798034668, 6.5312347412109375, 7.299211502075195, 8.067188262939453, 8.835165023803711, 9.603141784667969, 10.371118545532227, 11.139095306396484, 11.907072067260742, 12.675048828125, 13.443025588989258, 14.211002349853516, 14.978979110717773, 15.746955871582031, 16.51493263244629, 17.282909393310547, 18.050886154174805, 18.818862915039062, 19.58683967590332, 20.354816436767578, 21.122793197631836, 21.890769958496094, 22.65874671936035, 23.42672348022461, 24.194700241088867]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 13.0, 13.0, 21.0, 17.0, 19.0, 38.0, 30.0, 44.0, 33.0, 35.0, 69.0, 54.0, 59.0, 68.0, 50.0, 35.0, 43.0, 57.0, 30.0, 32.0, 38.0, 30.0, 33.0, 29.0, 20.0, 16.0, 9.0, 13.0, 8.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.38934326171875, -4.2513427734375, -4.11334228515625, -3.975341796875, -3.83734130859375, -3.6993408203125, -3.56134033203125, -3.42333984375, -3.28533935546875, -3.1473388671875, -3.00933837890625, -2.871337890625, -2.73333740234375, -2.5953369140625, -2.45733642578125, -2.3193359375, -2.18133544921875, -2.0433349609375, -1.90533447265625, -1.767333984375, -1.62933349609375, -1.4913330078125, -1.35333251953125, -1.21533203125, -1.07733154296875, -0.9393310546875, -0.80133056640625, -0.663330078125, -0.52532958984375, -0.3873291015625, -0.24932861328125, -0.111328125, 0.02667236328125, 0.1646728515625, 0.30267333984375, 0.440673828125, 0.57867431640625, 0.7166748046875, 0.85467529296875, 0.99267578125, 1.13067626953125, 1.2686767578125, 1.40667724609375, 1.544677734375, 1.68267822265625, 1.8206787109375, 1.95867919921875, 2.0966796875, 2.23468017578125, 2.3726806640625, 2.51068115234375, 2.648681640625, 2.78668212890625, 2.9246826171875, 3.06268310546875, 3.20068359375, 3.33868408203125, 3.4766845703125, 3.61468505859375, 3.752685546875, 3.89068603515625, 4.0286865234375, 4.16668701171875, 4.3046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 11.0, 10.0, 14.0, 27.0, 32.0, 56.0, 93.0, 120.0, 207.0, 362.0, 587.0, 1004.0, 1866.0, 3307.0, 6334.0, 12327.0, 24769.0, 49433.0, 94789.0, 161484.0, 220089.0, 198889.0, 128575.0, 70602.0, 35838.0, 18047.0, 9041.0, 4710.0, 2566.0, 1343.0, 806.0, 448.0, 280.0, 182.0, 117.0, 61.0, 45.0, 26.0, 19.0, 13.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.69091796875, -0.6721267700195312, -0.6533355712890625, -0.6345443725585938, -0.615753173828125, -0.5969619750976562, -0.5781707763671875, -0.5593795776367188, -0.54058837890625, -0.5217971801757812, -0.5030059814453125, -0.48421478271484375, -0.465423583984375, -0.44663238525390625, -0.4278411865234375, -0.40904998779296875, -0.3902587890625, -0.37146759033203125, -0.3526763916015625, -0.33388519287109375, -0.315093994140625, -0.29630279541015625, -0.2775115966796875, -0.25872039794921875, -0.23992919921875, -0.22113800048828125, -0.2023468017578125, -0.18355560302734375, -0.164764404296875, -0.14597320556640625, -0.1271820068359375, -0.10839080810546875, -0.089599609375, -0.07080841064453125, -0.0520172119140625, -0.03322601318359375, -0.014434814453125, 0.00435638427734375, 0.0231475830078125, 0.04193878173828125, 0.06072998046875, 0.07952117919921875, 0.0983123779296875, 0.11710357666015625, 0.135894775390625, 0.15468597412109375, 0.1734771728515625, 0.19226837158203125, 0.2110595703125, 0.22985076904296875, 0.2486419677734375, 0.26743316650390625, 0.286224365234375, 0.30501556396484375, 0.3238067626953125, 0.34259796142578125, 0.36138916015625, 0.38018035888671875, 0.3989715576171875, 0.41776275634765625, 0.436553955078125, 0.45534515380859375, 0.4741363525390625, 0.49292755126953125, 0.51171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 8.0, 8.0, 6.0, 9.0, 11.0, 10.0, 16.0, 16.0, 25.0, 14.0, 14.0, 27.0, 28.0, 33.0, 29.0, 43.0, 40.0, 44.0, 32.0, 35.0, 39.0, 1072.0, 51.0, 34.0, 35.0, 30.0, 39.0, 24.0, 21.0, 26.0, 28.0, 21.0, 18.0, 14.0, 21.0, 10.0, 18.0, 14.0, 15.0, 8.0, 9.0, 7.0, 4.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.245361328125, -2.16845703125, -2.091552734375, -2.0146484375, -1.937744140625, -1.86083984375, -1.783935546875, -1.70703125, -1.630126953125, -1.55322265625, -1.476318359375, -1.3994140625, -1.322509765625, -1.24560546875, -1.168701171875, -1.091796875, -1.014892578125, -0.93798828125, -0.861083984375, -0.7841796875, -0.707275390625, -0.63037109375, -0.553466796875, -0.4765625, -0.399658203125, -0.32275390625, -0.245849609375, -0.1689453125, -0.092041015625, -0.01513671875, 0.061767578125, 0.138671875, 0.215576171875, 0.29248046875, 0.369384765625, 0.4462890625, 0.523193359375, 0.60009765625, 0.677001953125, 0.75390625, 0.830810546875, 0.90771484375, 0.984619140625, 1.0615234375, 1.138427734375, 1.21533203125, 1.292236328125, 1.369140625, 1.446044921875, 1.52294921875, 1.599853515625, 1.6767578125, 1.753662109375, 1.83056640625, 1.907470703125, 1.984375, 2.061279296875, 2.13818359375, 2.215087890625, 2.2919921875, 2.368896484375, 2.44580078125, 2.522705078125, 2.599609375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 19.0, 21.0, 25.0, 28.0, 38.0, 54.0, 83.0, 106.0, 172.0, 198.0, 336.0, 451.0, 646.0, 976.0, 1659.0, 2592.0, 4862.0, 9805.0, 23267.0, 57629.0, 144353.0, 650921.0, 939205.0, 151043.0, 61143.0, 24227.0, 10541.0, 5101.0, 2814.0, 1628.0, 1091.0, 633.0, 453.0, 316.0, 188.0, 130.0, 98.0, 87.0, 49.0, 39.0, 24.0, 16.0, 21.0, 10.0, 11.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.3597450256347656, -0.34815216064453125, -0.3365592956542969, -0.3249664306640625, -0.3133735656738281, -0.30178070068359375, -0.2901878356933594, -0.278594970703125, -0.2670021057128906, -0.25540924072265625, -0.24381637573242188, -0.2322235107421875, -0.22063064575195312, -0.20903778076171875, -0.19744491577148438, -0.18585205078125, -0.17425918579101562, -0.16266632080078125, -0.15107345581054688, -0.1394805908203125, -0.12788772583007812, -0.11629486083984375, -0.10470199584960938, -0.093109130859375, -0.08151626586914062, -0.06992340087890625, -0.058330535888671875, -0.0467376708984375, -0.035144805908203125, -0.02355194091796875, -0.011959075927734375, -0.0003662109375, 0.011226654052734375, 0.02281951904296875, 0.034412384033203125, 0.0460052490234375, 0.057598114013671875, 0.06919097900390625, 0.08078384399414062, 0.092376708984375, 0.10396957397460938, 0.11556243896484375, 0.12715530395507812, 0.1387481689453125, 0.15034103393554688, 0.16193389892578125, 0.17352676391601562, 0.18511962890625, 0.19671249389648438, 0.20830535888671875, 0.21989822387695312, 0.2314910888671875, 0.24308395385742188, 0.25467681884765625, 0.2662696838378906, 0.277862548828125, 0.2894554138183594, 0.30104827880859375, 0.3126411437988281, 0.3242340087890625, 0.3358268737792969, 0.34741973876953125, 0.3590126037597656, 0.37060546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 12.0, 8.0, 10.0, 11.0, 16.0, 19.0, 19.0, 40.0, 42.0, 57.0, 94.0, 112.0, 124.0, 92.0, 85.0, 48.0, 35.0, 34.0, 31.0, 17.0, 11.0, 11.0, 6.0, 12.0, 10.0, 5.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06097412109375, -0.058976173400878906, -0.05697822570800781, -0.05498027801513672, -0.052982330322265625, -0.05098438262939453, -0.04898643493652344, -0.046988487243652344, -0.04499053955078125, -0.042992591857910156, -0.04099464416503906, -0.03899669647216797, -0.036998748779296875, -0.03500080108642578, -0.03300285339355469, -0.031004905700683594, -0.0290069580078125, -0.027009010314941406, -0.025011062622070312, -0.02301311492919922, -0.021015167236328125, -0.01901721954345703, -0.017019271850585938, -0.015021324157714844, -0.01302337646484375, -0.011025428771972656, -0.009027481079101562, -0.007029533386230469, -0.005031585693359375, -0.0030336380004882812, -0.0010356903076171875, 0.0009622573852539062, 0.002960205078125, 0.004958152770996094, 0.0069561004638671875, 0.008954048156738281, 0.010951995849609375, 0.012949943542480469, 0.014947891235351562, 0.016945838928222656, 0.01894378662109375, 0.020941734313964844, 0.022939682006835938, 0.02493762969970703, 0.026935577392578125, 0.02893352508544922, 0.030931472778320312, 0.032929420471191406, 0.0349273681640625, 0.036925315856933594, 0.03892326354980469, 0.04092121124267578, 0.042919158935546875, 0.04491710662841797, 0.04691505432128906, 0.048913002014160156, 0.05091094970703125, 0.052908897399902344, 0.05490684509277344, 0.05690479278564453, 0.058902740478515625, 0.06090068817138672, 0.06289863586425781, 0.0648965835571289, 0.06689453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 9.0, 7.0, 12.0, 11.0, 9.0, 10.0, 15.0, 20.0, 37.0, 66.0, 86.0, 144.0, 480.0, 4675.0, 939239.0, 101110.0, 1933.0, 295.0, 125.0, 89.0, 47.0, 28.0, 24.0, 11.0, 11.0, 13.0, 11.0, 11.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4404296875, -1.3990936279296875, -1.357757568359375, -1.3164215087890625, -1.27508544921875, -1.2337493896484375, -1.192413330078125, -1.1510772705078125, -1.1097412109375, -1.0684051513671875, -1.027069091796875, -0.9857330322265625, -0.94439697265625, -0.9030609130859375, -0.861724853515625, -0.8203887939453125, -0.779052734375, -0.7377166748046875, -0.696380615234375, -0.6550445556640625, -0.61370849609375, -0.5723724365234375, -0.531036376953125, -0.4897003173828125, -0.4483642578125, -0.4070281982421875, -0.365692138671875, -0.3243560791015625, -0.28302001953125, -0.2416839599609375, -0.200347900390625, -0.1590118408203125, -0.11767578125, -0.0763397216796875, -0.035003662109375, 0.0063323974609375, 0.04766845703125, 0.0890045166015625, 0.130340576171875, 0.1716766357421875, 0.2130126953125, 0.2543487548828125, 0.295684814453125, 0.3370208740234375, 0.37835693359375, 0.4196929931640625, 0.461029052734375, 0.5023651123046875, 0.543701171875, 0.5850372314453125, 0.626373291015625, 0.6677093505859375, 0.70904541015625, 0.7503814697265625, 0.791717529296875, 0.8330535888671875, 0.8743896484375, 0.9157257080078125, 0.957061767578125, 0.9983978271484375, 1.03973388671875, 1.0810699462890625, 1.122406005859375, 1.1637420654296875, 1.205078125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 24.0, 52.0, 95.0, 284.0, 300.0, 115.0, 67.0, 35.0, 12.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28749316930770874, -0.2755560576915741, -0.26361894607543945, -0.2516818344593048, -0.23974472284317017, -0.22780761122703552, -0.21587051451206207, -0.20393340289592743, -0.19199629127979279, -0.18005917966365814, -0.1681220680475235, -0.15618497133255005, -0.1442478597164154, -0.13231074810028076, -0.12037363648414612, -0.10843652486801147, -0.09649941325187683, -0.08456230163574219, -0.07262519001960754, -0.0606880858540535, -0.048750974237918854, -0.03681386262178421, -0.024876758456230164, -0.01293964684009552, -0.0010025352239608765, 0.010934574529528618, 0.022871684283018112, 0.03480879217386246, 0.0467459037899971, 0.058683015406131744, 0.07062011957168579, 0.08255723118782043, 0.09449434280395508, 0.10643145442008972, 0.11836856603622437, 0.130305677652359, 0.14224278926849365, 0.1541799008846283, 0.16611699759960175, 0.1780541092157364, 0.18999122083187103, 0.20192833244800568, 0.21386544406414032, 0.22580254077911377, 0.2377396523952484, 0.24967676401138306, 0.2616138756275177, 0.27355098724365234, 0.285488098859787, 0.29742521047592163, 0.3093623220920563, 0.3212994337081909, 0.33323654532432556, 0.3451736569404602, 0.35711073875427246, 0.3690478801727295, 0.38098496198654175, 0.3929220736026764, 0.40485918521881104, 0.4167962968349457, 0.4287334084510803, 0.44067052006721497, 0.4526076316833496, 0.46454471349716187, 0.4764818549156189]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 8.0, 3.0, 4.0, 7.0, 8.0, 7.0, 7.0, 10.0, 22.0, 14.0, 22.0, 15.0, 20.0, 36.0, 25.0, 35.0, 32.0, 35.0, 34.0, 37.0, 42.0, 51.0, 43.0, 35.0, 38.0, 39.0, 34.0, 29.0, 34.0, 26.0, 30.0, 20.0, 30.0, 23.0, 19.0, 20.0, 19.0, 13.0, 11.0, 12.0, 11.0, 10.0, 11.0, 2.0, 3.0, 7.0, 4.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.13358747959136963, -0.12956584990024567, -0.1255442202091217, -0.12152259051799774, -0.11750096082687378, -0.11347933113574982, -0.10945770144462585, -0.10543607175350189, -0.10141444206237793, -0.09739281237125397, -0.09337118268013, -0.08934955298900604, -0.08532792329788208, -0.08130629360675812, -0.07728466391563416, -0.07326303422451019, -0.06924140453338623, -0.06521977484226227, -0.061198145151138306, -0.05717651546001434, -0.05315488576889038, -0.04913325607776642, -0.045111626386642456, -0.041089996695518494, -0.03706836700439453, -0.03304673731327057, -0.029025107622146606, -0.025003477931022644, -0.02098184823989868, -0.01696021854877472, -0.012938588857650757, -0.008916959166526794, -0.004895329475402832, -0.0008736997842788696, 0.0031479299068450928, 0.007169559597969055, 0.011191189289093018, 0.01521281898021698, 0.019234448671340942, 0.023256078362464905, 0.027277708053588867, 0.03129933774471283, 0.03532096743583679, 0.039342597126960754, 0.04336422681808472, 0.04738585650920868, 0.05140748620033264, 0.055429115891456604, 0.059450745582580566, 0.06347237527370453, 0.06749400496482849, 0.07151563465595245, 0.07553726434707642, 0.07955889403820038, 0.08358052372932434, 0.0876021534204483, 0.09162378311157227, 0.09564541280269623, 0.09966704249382019, 0.10368867218494415, 0.10771030187606812, 0.11173193156719208, 0.11575356125831604, 0.11977519094944, 0.12379682064056396]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 0.0, 8.0, 15.0, 16.0, 12.0, 26.0, 27.0, 24.0, 37.0, 49.0, 26.0, 50.0, 44.0, 60.0, 47.0, 73.0, 51.0, 59.0, 44.0, 43.0, 33.0, 50.0, 44.0, 31.0, 31.0, 24.0, 18.0, 13.0, 12.0, 13.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78125, -4.6356201171875, -4.489990234375, -4.3443603515625, -4.19873046875, -4.0531005859375, -3.907470703125, -3.7618408203125, -3.6162109375, -3.4705810546875, -3.324951171875, -3.1793212890625, -3.03369140625, -2.8880615234375, -2.742431640625, -2.5968017578125, -2.451171875, -2.3055419921875, -2.159912109375, -2.0142822265625, -1.86865234375, -1.7230224609375, -1.577392578125, -1.4317626953125, -1.2861328125, -1.1405029296875, -0.994873046875, -0.8492431640625, -0.70361328125, -0.5579833984375, -0.412353515625, -0.2667236328125, -0.12109375, 0.0245361328125, 0.170166015625, 0.3157958984375, 0.46142578125, 0.6070556640625, 0.752685546875, 0.8983154296875, 1.0439453125, 1.1895751953125, 1.335205078125, 1.4808349609375, 1.62646484375, 1.7720947265625, 1.917724609375, 2.0633544921875, 2.208984375, 2.3546142578125, 2.500244140625, 2.6458740234375, 2.79150390625, 2.9371337890625, 3.082763671875, 3.2283935546875, 3.3740234375, 3.5196533203125, 3.665283203125, 3.8109130859375, 3.95654296875, 4.1021728515625, 4.247802734375, 4.3934326171875, 4.5390625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 14.0, 25.0, 46.0, 70.0, 105.0, 152.0, 232.0, 407.0, 583.0, 922.0, 1530.0, 2441.0, 4301.0, 9060.0, 21000.0, 54413.0, 146861.0, 374915.0, 266516.0, 98266.0, 36512.0, 14691.0, 6520.0, 3520.0, 2036.0, 1231.0, 784.0, 507.0, 309.0, 215.0, 121.0, 68.0, 64.0, 22.0, 34.0, 11.0, 12.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3515625, -4.21026611328125, -4.0689697265625, -3.92767333984375, -3.786376953125, -3.64508056640625, -3.5037841796875, -3.36248779296875, -3.22119140625, -3.07989501953125, -2.9385986328125, -2.79730224609375, -2.656005859375, -2.51470947265625, -2.3734130859375, -2.23211669921875, -2.0908203125, -1.94952392578125, -1.8082275390625, -1.66693115234375, -1.525634765625, -1.38433837890625, -1.2430419921875, -1.10174560546875, -0.96044921875, -0.81915283203125, -0.6778564453125, -0.53656005859375, -0.395263671875, -0.25396728515625, -0.1126708984375, 0.02862548828125, 0.169921875, 0.31121826171875, 0.4525146484375, 0.59381103515625, 0.735107421875, 0.87640380859375, 1.0177001953125, 1.15899658203125, 1.30029296875, 1.44158935546875, 1.5828857421875, 1.72418212890625, 1.865478515625, 2.00677490234375, 2.1480712890625, 2.28936767578125, 2.4306640625, 2.57196044921875, 2.7132568359375, 2.85455322265625, 2.995849609375, 3.13714599609375, 3.2784423828125, 3.41973876953125, 3.56103515625, 3.70233154296875, 3.8436279296875, 3.98492431640625, 4.126220703125, 4.26751708984375, 4.4088134765625, 4.55010986328125, 4.69140625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 14.0, 14.0, 9.0, 16.0, 14.0, 18.0, 22.0, 27.0, 30.0, 33.0, 40.0, 50.0, 49.0, 56.0, 81.0, 164.0, 1488.0, 336.0, 143.0, 75.0, 36.0, 38.0, 45.0, 45.0, 37.0, 26.0, 24.0, 21.0, 16.0, 14.0, 8.0, 14.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.588134765625, -10.16064453125, -9.733154296875, -9.3056640625, -8.878173828125, -8.45068359375, -8.023193359375, -7.595703125, -7.168212890625, -6.74072265625, -6.313232421875, -5.8857421875, -5.458251953125, -5.03076171875, -4.603271484375, -4.17578125, -3.748291015625, -3.32080078125, -2.893310546875, -2.4658203125, -2.038330078125, -1.61083984375, -1.183349609375, -0.755859375, -0.328369140625, 0.09912109375, 0.526611328125, 0.9541015625, 1.381591796875, 1.80908203125, 2.236572265625, 2.6640625, 3.091552734375, 3.51904296875, 3.946533203125, 4.3740234375, 4.801513671875, 5.22900390625, 5.656494140625, 6.083984375, 6.511474609375, 6.93896484375, 7.366455078125, 7.7939453125, 8.221435546875, 8.64892578125, 9.076416015625, 9.50390625, 9.931396484375, 10.35888671875, 10.786376953125, 11.2138671875, 11.641357421875, 12.06884765625, 12.496337890625, 12.923828125, 13.351318359375, 13.77880859375, 14.206298828125, 14.6337890625, 15.061279296875, 15.48876953125, 15.916259765625, 16.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 9.0, 10.0, 19.0, 16.0, 26.0, 29.0, 51.0, 62.0, 82.0, 124.0, 167.0, 288.0, 547.0, 1867.0, 39984.0, 3077291.0, 22214.0, 1541.0, 519.0, 237.0, 156.0, 122.0, 81.0, 66.0, 33.0, 28.0, 30.0, 31.0, 25.0, 11.0, 7.0, 8.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -34.10498046875, -33.0537109375, -32.00244140625, -30.951171875, -29.89990234375, -28.8486328125, -27.79736328125, -26.74609375, -25.69482421875, -24.6435546875, -23.59228515625, -22.541015625, -21.48974609375, -20.4384765625, -19.38720703125, -18.3359375, -17.28466796875, -16.2333984375, -15.18212890625, -14.130859375, -13.07958984375, -12.0283203125, -10.97705078125, -9.92578125, -8.87451171875, -7.8232421875, -6.77197265625, -5.720703125, -4.66943359375, -3.6181640625, -2.56689453125, -1.515625, -0.46435546875, 0.5869140625, 1.63818359375, 2.689453125, 3.74072265625, 4.7919921875, 5.84326171875, 6.89453125, 7.94580078125, 8.9970703125, 10.04833984375, 11.099609375, 12.15087890625, 13.2021484375, 14.25341796875, 15.3046875, 16.35595703125, 17.4072265625, 18.45849609375, 19.509765625, 20.56103515625, 21.6123046875, 22.66357421875, 23.71484375, 24.76611328125, 25.8173828125, 26.86865234375, 27.919921875, 28.97119140625, 30.0224609375, 31.07373046875, 32.125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [810.0, 208.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.450361728668213, 1.4019050598144531, 9.254171371459961, 17.1064395904541, 24.95870590209961, 32.810970306396484, 40.663238525390625, 48.5155029296875, 56.36777114868164, 64.22003936767578, 72.07230377197266, 79.92457580566406, 87.77684020996094, 95.62910461425781, 103.48136901855469, 111.33363342285156, 119.18590545654297, 127.03816986083984, 134.89044189453125, 142.74270629882812, 150.594970703125, 158.44723510742188, 166.29949951171875, 174.15176391601562, 182.00404357910156, 189.85630798339844, 197.7085723876953, 205.56085205078125, 213.41311645507812, 221.265380859375, 229.11764526367188, 236.96990966796875, 244.8221893310547, 252.67445373535156, 260.5267333984375, 268.3789978027344, 276.23126220703125, 284.0835266113281, 291.935791015625, 299.7880554199219, 307.64031982421875, 315.4925842285156, 323.3448486328125, 331.1971130371094, 339.04937744140625, 346.9016418457031, 354.75390625, 362.606201171875, 370.4584655761719, 378.31072998046875, 386.1629943847656, 394.0152587890625, 401.8675231933594, 409.71978759765625, 417.57208251953125, 425.42431640625, 433.2765808105469, 441.12884521484375, 448.9811096191406, 456.8333740234375, 464.6856384277344, 472.53790283203125, 480.39019775390625, 488.242431640625, 496.0947265625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 6.0, 10.0, 13.0, 14.0, 15.0, 21.0, 13.0, 28.0, 41.0, 30.0, 34.0, 43.0, 37.0, 34.0, 43.0, 41.0, 47.0, 35.0, 53.0, 38.0, 43.0, 41.0, 42.0, 31.0, 36.0, 31.0, 25.0, 14.0, 16.0, 16.0, 18.0, 11.0, 9.0, 13.0, 8.0, 7.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.454742431640625, -32.42708969116211, -31.399438858032227, -30.371788024902344, -29.344135284423828, -28.316482543945312, -27.28883171081543, -26.261180877685547, -25.23352813720703, -24.205875396728516, -23.178224563598633, -22.15057373046875, -21.122920989990234, -20.09526824951172, -19.067617416381836, -18.039966583251953, -17.012313842773438, -15.984662055969238, -14.957010269165039, -13.92935848236084, -12.90170669555664, -11.874054908752441, -10.846403121948242, -9.818751335144043, -8.791099548339844, -7.7634477615356445, -6.735795974731445, -5.708144187927246, -4.680492401123047, -3.6528406143188477, -2.6251888275146484, -1.5975370407104492, -0.56988525390625, 0.4577665328979492, 1.4854183197021484, 2.5130701065063477, 3.540721893310547, 4.568373680114746, 5.596025466918945, 6.6236772537231445, 7.651329040527344, 8.678980827331543, 9.706632614135742, 10.734284400939941, 11.76193618774414, 12.78958797454834, 13.817239761352539, 14.844891548156738, 15.872543334960938, 16.900196075439453, 17.927846908569336, 18.95549774169922, 19.983150482177734, 21.01080322265625, 22.038454055786133, 23.066104888916016, 24.09375762939453, 25.121410369873047, 26.14906120300293, 27.176712036132812, 28.204364776611328, 29.232017517089844, 30.259668350219727, 31.28731918334961, 32.314971923828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 7.0, 13.0, 11.0, 21.0, 18.0, 20.0, 26.0, 24.0, 42.0, 32.0, 35.0, 41.0, 38.0, 59.0, 68.0, 42.0, 45.0, 36.0, 52.0, 45.0, 45.0, 37.0, 29.0, 35.0, 27.0, 24.0, 27.0, 15.0, 23.0, 12.0, 5.0, 6.0, 10.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.6876220703125, -3.551025390625, -3.4144287109375, -3.27783203125, -3.1412353515625, -3.004638671875, -2.8680419921875, -2.7314453125, -2.5948486328125, -2.458251953125, -2.3216552734375, -2.18505859375, -2.0484619140625, -1.911865234375, -1.7752685546875, -1.638671875, -1.5020751953125, -1.365478515625, -1.2288818359375, -1.09228515625, -0.9556884765625, -0.819091796875, -0.6824951171875, -0.5458984375, -0.4093017578125, -0.272705078125, -0.1361083984375, 0.00048828125, 0.1370849609375, 0.273681640625, 0.4102783203125, 0.546875, 0.6834716796875, 0.820068359375, 0.9566650390625, 1.09326171875, 1.2298583984375, 1.366455078125, 1.5030517578125, 1.6396484375, 1.7762451171875, 1.912841796875, 2.0494384765625, 2.18603515625, 2.3226318359375, 2.459228515625, 2.5958251953125, 2.732421875, 2.8690185546875, 3.005615234375, 3.1422119140625, 3.27880859375, 3.4154052734375, 3.552001953125, 3.6885986328125, 3.8251953125, 3.9617919921875, 4.098388671875, 4.2349853515625, 4.37158203125, 4.5081787109375, 4.644775390625, 4.7813720703125, 4.91796875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 4.0, 8.0, 21.0, 22.0, 40.0, 52.0, 81.0, 104.0, 136.0, 209.0, 382.0, 668.0, 1238.0, 2549.0, 5975.0, 17617.0, 70994.0, 337081.0, 1334789.0, 1730888.0, 538563.0, 111592.0, 26267.0, 8028.0, 3214.0, 1546.0, 822.0, 449.0, 279.0, 178.0, 132.0, 96.0, 67.0, 43.0, 35.0, 18.0, 26.0, 13.0, 11.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.5234375, -5.333984375, -5.14453125, -4.955078125, -4.765625, -4.576171875, -4.38671875, -4.197265625, -4.0078125, -3.818359375, -3.62890625, -3.439453125, -3.25, -3.060546875, -2.87109375, -2.681640625, -2.4921875, -2.302734375, -2.11328125, -1.923828125, -1.734375, -1.544921875, -1.35546875, -1.166015625, -0.9765625, -0.787109375, -0.59765625, -0.408203125, -0.21875, -0.029296875, 0.16015625, 0.349609375, 0.5390625, 0.728515625, 0.91796875, 1.107421875, 1.296875, 1.486328125, 1.67578125, 1.865234375, 2.0546875, 2.244140625, 2.43359375, 2.623046875, 2.8125, 3.001953125, 3.19140625, 3.380859375, 3.5703125, 3.759765625, 3.94921875, 4.138671875, 4.328125, 4.517578125, 4.70703125, 4.896484375, 5.0859375, 5.275390625, 5.46484375, 5.654296875, 5.84375, 6.033203125, 6.22265625, 6.412109375, 6.6015625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 11.0, 10.0, 20.0, 31.0, 41.0, 58.0, 79.0, 143.0, 205.0, 243.0, 379.0, 490.0, 503.0, 474.0, 387.0, 303.0, 207.0, 146.0, 82.0, 64.0, 55.0, 29.0, 29.0, 18.0, 15.0, 9.0, 9.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.33984375, -7.08233642578125, -6.8248291015625, -6.56732177734375, -6.309814453125, -6.05230712890625, -5.7947998046875, -5.53729248046875, -5.27978515625, -5.02227783203125, -4.7647705078125, -4.50726318359375, -4.249755859375, -3.99224853515625, -3.7347412109375, -3.47723388671875, -3.2197265625, -2.96221923828125, -2.7047119140625, -2.44720458984375, -2.189697265625, -1.93218994140625, -1.6746826171875, -1.41717529296875, -1.15966796875, -0.90216064453125, -0.6446533203125, -0.38714599609375, -0.129638671875, 0.12786865234375, 0.3853759765625, 0.64288330078125, 0.900390625, 1.15789794921875, 1.4154052734375, 1.67291259765625, 1.930419921875, 2.18792724609375, 2.4454345703125, 2.70294189453125, 2.96044921875, 3.21795654296875, 3.4754638671875, 3.73297119140625, 3.990478515625, 4.24798583984375, 4.5054931640625, 4.76300048828125, 5.0205078125, 5.27801513671875, 5.5355224609375, 5.79302978515625, 6.050537109375, 6.30804443359375, 6.5655517578125, 6.82305908203125, 7.08056640625, 7.33807373046875, 7.5955810546875, 7.85308837890625, 8.110595703125, 8.36810302734375, 8.6256103515625, 8.88311767578125, 9.140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 4.0, 12.0, 13.0, 11.0, 17.0, 27.0, 41.0, 53.0, 69.0, 104.0, 172.0, 250.0, 506.0, 2434.0, 157156.0, 3989166.0, 41759.0, 1492.0, 342.0, 231.0, 139.0, 81.0, 58.0, 43.0, 29.0, 20.0, 9.0, 11.0, 10.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.4375, -38.322998046875, -37.20849609375, -36.093994140625, -34.9794921875, -33.864990234375, -32.75048828125, -31.635986328125, -30.521484375, -29.406982421875, -28.29248046875, -27.177978515625, -26.0634765625, -24.948974609375, -23.83447265625, -22.719970703125, -21.60546875, -20.490966796875, -19.37646484375, -18.261962890625, -17.1474609375, -16.032958984375, -14.91845703125, -13.803955078125, -12.689453125, -11.574951171875, -10.46044921875, -9.345947265625, -8.2314453125, -7.116943359375, -6.00244140625, -4.887939453125, -3.7734375, -2.658935546875, -1.54443359375, -0.429931640625, 0.6845703125, 1.799072265625, 2.91357421875, 4.028076171875, 5.142578125, 6.257080078125, 7.37158203125, 8.486083984375, 9.6005859375, 10.715087890625, 11.82958984375, 12.944091796875, 14.05859375, 15.173095703125, 16.28759765625, 17.402099609375, 18.5166015625, 19.631103515625, 20.74560546875, 21.860107421875, 22.974609375, 24.089111328125, 25.20361328125, 26.318115234375, 27.4326171875, 28.547119140625, 29.66162109375, 30.776123046875, 31.890625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 15.0, 76.0, 183.0, 303.0, 256.0, 128.0, 37.0, 12.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.10205078125, -130.24700927734375, -127.39196014404297, -124.53691864013672, -121.68187713623047, -118.82683563232422, -115.97178649902344, -113.11674499511719, -110.26170349121094, -107.40666198730469, -104.5516128540039, -101.69657135009766, -98.8415298461914, -95.98648834228516, -93.13143920898438, -90.27639770507812, -87.42135620117188, -84.56631469726562, -81.71126556396484, -78.8562240600586, -76.00118255615234, -73.1461410522461, -70.29109191894531, -67.43605041503906, -64.58100128173828, -61.725955963134766, -58.870914459228516, -56.015869140625, -53.16082763671875, -50.305782318115234, -47.45073699951172, -44.59569549560547, -41.74065399169922, -38.8856086730957, -36.03056716918945, -33.17552185058594, -30.320480346679688, -27.465435028076172, -24.61039161682129, -21.755348205566406, -18.900304794311523, -16.04526138305664, -13.190217971801758, -10.335173606872559, -7.480130195617676, -4.625086784362793, -1.7700424194335938, 1.085000991821289, 3.940044403076172, 6.795087814331055, 9.650131225585938, 12.505175590515137, 15.36021900177002, 18.21526336669922, 21.0703067779541, 23.925350189208984, 26.780393600463867, 29.63543701171875, 32.490482330322266, 35.345523834228516, 38.20056915283203, 41.05561065673828, 43.9106559753418, 46.76570129394531, 49.62074279785156]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 12.0, 7.0, 9.0, 13.0, 6.0, 14.0, 13.0, 19.0, 26.0, 29.0, 29.0, 33.0, 32.0, 30.0, 27.0, 30.0, 36.0, 50.0, 41.0, 45.0, 30.0, 38.0, 37.0, 35.0, 46.0, 34.0, 35.0, 29.0, 35.0, 24.0, 14.0, 19.0, 22.0, 20.0, 20.0, 17.0, 12.0, 0.0, 6.0, 6.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.638463973999023, -22.94504165649414, -22.251617431640625, -21.55819320678711, -20.864770889282227, -20.171348571777344, -19.477924346923828, -18.784500122070312, -18.09107780456543, -17.397655487060547, -16.70423126220703, -16.010807037353516, -15.317384719848633, -14.623961448669434, -13.930538177490234, -13.237114906311035, -12.543691635131836, -11.850268363952637, -11.156845092773438, -10.463421821594238, -9.769998550415039, -9.07657527923584, -8.38315200805664, -7.689728736877441, -6.996305465698242, -6.302882194519043, -5.609458923339844, -4.9160356521606445, -4.222612380981445, -3.529189109802246, -2.835765838623047, -2.1423425674438477, -1.4489173889160156, -0.7554941177368164, -0.06207084655761719, 0.631352424621582, 1.3247756958007812, 2.0181989669799805, 2.7116222381591797, 3.405045509338379, 4.098468780517578, 4.791892051696777, 5.485315322875977, 6.178738594055176, 6.872161865234375, 7.565585136413574, 8.259008407592773, 8.952431678771973, 9.645854949951172, 10.339278221130371, 11.03270149230957, 11.72612476348877, 12.419548034667969, 13.112971305847168, 13.806394577026367, 14.499817848205566, 15.193241119384766, 15.886664390563965, 16.580087661743164, 17.273509979248047, 17.966934204101562, 18.660358428955078, 19.35378074645996, 20.047203063964844, 20.74062728881836]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 10.0, 13.0, 18.0, 24.0, 17.0, 27.0, 36.0, 48.0, 32.0, 56.0, 41.0, 50.0, 64.0, 50.0, 56.0, 47.0, 56.0, 47.0, 54.0, 36.0, 33.0, 29.0, 20.0, 36.0, 20.0, 16.0, 15.0, 16.0, 12.0, 8.0, 0.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.7545166015625, -4.606689453125, -4.4588623046875, -4.31103515625, -4.1632080078125, -4.015380859375, -3.8675537109375, -3.7197265625, -3.5718994140625, -3.424072265625, -3.2762451171875, -3.12841796875, -2.9805908203125, -2.832763671875, -2.6849365234375, -2.537109375, -2.3892822265625, -2.241455078125, -2.0936279296875, -1.94580078125, -1.7979736328125, -1.650146484375, -1.5023193359375, -1.3544921875, -1.2066650390625, -1.058837890625, -0.9110107421875, -0.76318359375, -0.6153564453125, -0.467529296875, -0.3197021484375, -0.171875, -0.0240478515625, 0.123779296875, 0.2716064453125, 0.41943359375, 0.5672607421875, 0.715087890625, 0.8629150390625, 1.0107421875, 1.1585693359375, 1.306396484375, 1.4542236328125, 1.60205078125, 1.7498779296875, 1.897705078125, 2.0455322265625, 2.193359375, 2.3411865234375, 2.489013671875, 2.6368408203125, 2.78466796875, 2.9324951171875, 3.080322265625, 3.2281494140625, 3.3759765625, 3.5238037109375, 3.671630859375, 3.8194580078125, 3.96728515625, 4.1151123046875, 4.262939453125, 4.4107666015625, 4.55859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 4.0, 13.0, 8.0, 15.0, 22.0, 26.0, 59.0, 63.0, 110.0, 147.0, 217.0, 342.0, 465.0, 674.0, 995.0, 1549.0, 2881.0, 9367.0, 56012.0, 333029.0, 497586.0, 117525.0, 17680.0, 4239.0, 1898.0, 1122.0, 776.0, 516.0, 373.0, 289.0, 158.0, 125.0, 82.0, 69.0, 37.0, 31.0, 20.0, 14.0, 4.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.33355712890625, -1.2862548828125, -1.23895263671875, -1.191650390625, -1.14434814453125, -1.0970458984375, -1.04974365234375, -1.00244140625, -0.95513916015625, -0.9078369140625, -0.86053466796875, -0.813232421875, -0.76593017578125, -0.7186279296875, -0.67132568359375, -0.6240234375, -0.57672119140625, -0.5294189453125, -0.48211669921875, -0.434814453125, -0.38751220703125, -0.3402099609375, -0.29290771484375, -0.24560546875, -0.19830322265625, -0.1510009765625, -0.10369873046875, -0.056396484375, -0.00909423828125, 0.0382080078125, 0.08551025390625, 0.1328125, 0.18011474609375, 0.2274169921875, 0.27471923828125, 0.322021484375, 0.36932373046875, 0.4166259765625, 0.46392822265625, 0.51123046875, 0.55853271484375, 0.6058349609375, 0.65313720703125, 0.700439453125, 0.74774169921875, 0.7950439453125, 0.84234619140625, 0.8896484375, 0.93695068359375, 0.9842529296875, 1.03155517578125, 1.078857421875, 1.12615966796875, 1.1734619140625, 1.22076416015625, 1.26806640625, 1.31536865234375, 1.3626708984375, 1.40997314453125, 1.457275390625, 1.50457763671875, 1.5518798828125, 1.59918212890625, 1.646484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 6.0, 5.0, 11.0, 19.0, 21.0, 13.0, 11.0, 23.0, 18.0, 24.0, 23.0, 28.0, 31.0, 29.0, 36.0, 30.0, 43.0, 39.0, 40.0, 1067.0, 30.0, 32.0, 30.0, 31.0, 30.0, 30.0, 35.0, 32.0, 27.0, 24.0, 24.0, 27.0, 16.0, 16.0, 16.0, 18.0, 8.0, 6.0, 15.0, 4.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 4.0], "bins": [-2.57421875, -2.50164794921875, -2.4290771484375, -2.35650634765625, -2.283935546875, -2.21136474609375, -2.1387939453125, -2.06622314453125, -1.99365234375, -1.92108154296875, -1.8485107421875, -1.77593994140625, -1.703369140625, -1.63079833984375, -1.5582275390625, -1.48565673828125, -1.4130859375, -1.34051513671875, -1.2679443359375, -1.19537353515625, -1.122802734375, -1.05023193359375, -0.9776611328125, -0.90509033203125, -0.83251953125, -0.75994873046875, -0.6873779296875, -0.61480712890625, -0.542236328125, -0.46966552734375, -0.3970947265625, -0.32452392578125, -0.251953125, -0.17938232421875, -0.1068115234375, -0.03424072265625, 0.038330078125, 0.11090087890625, 0.1834716796875, 0.25604248046875, 0.32861328125, 0.40118408203125, 0.4737548828125, 0.54632568359375, 0.618896484375, 0.69146728515625, 0.7640380859375, 0.83660888671875, 0.9091796875, 0.98175048828125, 1.0543212890625, 1.12689208984375, 1.199462890625, 1.27203369140625, 1.3446044921875, 1.41717529296875, 1.48974609375, 1.56231689453125, 1.6348876953125, 1.70745849609375, 1.780029296875, 1.85260009765625, 1.9251708984375, 1.99774169921875, 2.0703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 14.0, 5.0, 8.0, 20.0, 23.0, 40.0, 46.0, 65.0, 111.0, 186.0, 316.0, 532.0, 1076.0, 2507.0, 10152.0, 98974.0, 1683910.0, 268108.0, 23505.0, 4261.0, 1464.0, 740.0, 397.0, 245.0, 128.0, 81.0, 47.0, 39.0, 35.0, 21.0, 18.0, 7.0, 3.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9186782836914062, -0.8866729736328125, -0.8546676635742188, -0.822662353515625, -0.7906570434570312, -0.7586517333984375, -0.7266464233398438, -0.69464111328125, -0.6626358032226562, -0.6306304931640625, -0.5986251831054688, -0.566619873046875, -0.5346145629882812, -0.5026092529296875, -0.47060394287109375, -0.4385986328125, -0.40659332275390625, -0.3745880126953125, -0.34258270263671875, -0.310577392578125, -0.27857208251953125, -0.2465667724609375, -0.21456146240234375, -0.18255615234375, -0.15055084228515625, -0.1185455322265625, -0.08654022216796875, -0.054534912109375, -0.02252960205078125, 0.0094757080078125, 0.04148101806640625, 0.073486328125, 0.10549163818359375, 0.1374969482421875, 0.16950225830078125, 0.201507568359375, 0.23351287841796875, 0.2655181884765625, 0.29752349853515625, 0.32952880859375, 0.36153411865234375, 0.3935394287109375, 0.42554473876953125, 0.457550048828125, 0.48955535888671875, 0.5215606689453125, 0.5535659790039062, 0.5855712890625, 0.6175765991210938, 0.6495819091796875, 0.6815872192382812, 0.713592529296875, 0.7455978393554688, 0.7776031494140625, 0.8096084594726562, 0.84161376953125, 0.8736190795898438, 0.9056243896484375, 0.9376296997070312, 0.969635009765625, 1.0016403198242188, 1.0336456298828125, 1.0656509399414062, 1.09765625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 11.0, 7.0, 19.0, 25.0, 47.0, 70.0, 89.0, 130.0, 144.0, 124.0, 91.0, 74.0, 47.0, 34.0, 22.0, 6.0, 8.0, 5.0, 12.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.060760498046875, -0.05846834182739258, -0.056176185607910156, -0.053884029388427734, -0.05159187316894531, -0.04929971694946289, -0.04700756072998047, -0.04471540451049805, -0.042423248291015625, -0.0401310920715332, -0.03783893585205078, -0.03554677963256836, -0.03325462341308594, -0.030962467193603516, -0.028670310974121094, -0.026378154754638672, -0.02408599853515625, -0.021793842315673828, -0.019501686096191406, -0.017209529876708984, -0.014917373657226562, -0.01262521743774414, -0.010333061218261719, -0.008040904998779297, -0.005748748779296875, -0.003456592559814453, -0.0011644363403320312, 0.0011277198791503906, 0.0034198760986328125, 0.005712032318115234, 0.008004188537597656, 0.010296344757080078, 0.0125885009765625, 0.014880657196044922, 0.017172813415527344, 0.019464969635009766, 0.021757125854492188, 0.02404928207397461, 0.02634143829345703, 0.028633594512939453, 0.030925750732421875, 0.0332179069519043, 0.03551006317138672, 0.03780221939086914, 0.04009437561035156, 0.042386531829833984, 0.044678688049316406, 0.04697084426879883, 0.04926300048828125, 0.05155515670776367, 0.053847312927246094, 0.056139469146728516, 0.05843162536621094, 0.06072378158569336, 0.06301593780517578, 0.0653080940246582, 0.06760025024414062, 0.06989240646362305, 0.07218456268310547, 0.07447671890258789, 0.07676887512207031, 0.07906103134155273, 0.08135318756103516, 0.08364534378051758, 0.0859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 10.0, 8.0, 6.0, 15.0, 33.0, 47.0, 69.0, 137.0, 337.0, 5033.0, 1037821.0, 4362.0, 328.0, 126.0, 87.0, 30.0, 25.0, 20.0, 9.0, 10.0, 9.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.919921875, -1.8686981201171875, -1.817474365234375, -1.7662506103515625, -1.71502685546875, -1.6638031005859375, -1.612579345703125, -1.5613555908203125, -1.5101318359375, -1.4589080810546875, -1.407684326171875, -1.3564605712890625, -1.30523681640625, -1.2540130615234375, -1.202789306640625, -1.1515655517578125, -1.100341796875, -1.0491180419921875, -0.997894287109375, -0.9466705322265625, -0.89544677734375, -0.8442230224609375, -0.792999267578125, -0.7417755126953125, -0.6905517578125, -0.6393280029296875, -0.588104248046875, -0.5368804931640625, -0.48565673828125, -0.4344329833984375, -0.383209228515625, -0.3319854736328125, -0.28076171875, -0.2295379638671875, -0.178314208984375, -0.1270904541015625, -0.07586669921875, -0.0246429443359375, 0.026580810546875, 0.0778045654296875, 0.1290283203125, 0.1802520751953125, 0.231475830078125, 0.2826995849609375, 0.33392333984375, 0.3851470947265625, 0.436370849609375, 0.4875946044921875, 0.538818359375, 0.5900421142578125, 0.641265869140625, 0.6924896240234375, 0.74371337890625, 0.7949371337890625, 0.846160888671875, 0.8973846435546875, 0.9486083984375, 0.9998321533203125, 1.051055908203125, 1.1022796630859375, 1.15350341796875, 1.2047271728515625, 1.255950927734375, 1.3071746826171875, 1.3583984375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 17.0, 26.0, 93.0, 276.0, 354.0, 142.0, 53.0, 20.0, 14.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43858426809310913, -0.4298347234725952, -0.4210851788520813, -0.4123356342315674, -0.40358611941337585, -0.39483657479286194, -0.386087030172348, -0.3773374855518341, -0.3685879409313202, -0.3598383963108063, -0.35108885169029236, -0.34233933687210083, -0.3335897922515869, -0.324840247631073, -0.3160907030105591, -0.30734115839004517, -0.29859161376953125, -0.28984206914901733, -0.2810925245285034, -0.2723429799079895, -0.263593465089798, -0.25484392046928406, -0.24609437584877014, -0.23734483122825623, -0.2285953164100647, -0.21984577178955078, -0.21109624207019806, -0.20234669744968414, -0.19359715282917023, -0.1848476231098175, -0.1760980784893036, -0.16734853386878967, -0.15859898924827576, -0.14984944462776184, -0.14109991490840912, -0.1323503702878952, -0.12360082566738129, -0.11485128849744797, -0.10610175132751465, -0.09735220670700073, -0.08860266953706741, -0.0798531323671341, -0.07110358774662018, -0.06235405057668686, -0.05360450968146324, -0.044854968786239624, -0.036105431616306305, -0.027355890721082687, -0.01860634982585907, -0.009856809861958027, -0.001107269898056984, 0.007642269134521484, 0.016391810029745102, 0.02514135092496872, 0.03389088809490204, 0.042640428990125656, 0.051389969885349274, 0.06013951078057289, 0.06888905167579651, 0.07763858884572983, 0.08638812601566315, 0.09513767063617706, 0.10388720780611038, 0.1126367449760437, 0.12138628959655762]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 5.0, 8.0, 1.0, 4.0, 8.0, 7.0, 9.0, 13.0, 16.0, 14.0, 18.0, 21.0, 24.0, 24.0, 19.0, 35.0, 39.0, 35.0, 43.0, 39.0, 40.0, 36.0, 38.0, 36.0, 38.0, 45.0, 34.0, 34.0, 28.0, 34.0, 33.0, 27.0, 27.0, 22.0, 18.0, 14.0, 17.0, 14.0, 18.0, 17.0, 12.0, 4.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0], "bins": [-0.1093643307685852, -0.10626395046710968, -0.10316357016563416, -0.10006318241357803, -0.09696280211210251, -0.09386242181062698, -0.09076203405857086, -0.08766165375709534, -0.08456127345561981, -0.08146089315414429, -0.07836051285266876, -0.07526012510061264, -0.07215974479913712, -0.06905936449766159, -0.06595897674560547, -0.06285859644412994, -0.05975821614265442, -0.056657835841178894, -0.05355745181441307, -0.05045706778764725, -0.04735668748617172, -0.0442563071846962, -0.041155923157930374, -0.03805553913116455, -0.034955158829689026, -0.0318547785282135, -0.028754394501447678, -0.025654012337327003, -0.02255363017320633, -0.019453248009085655, -0.01635286584496498, -0.013252483680844307, -0.010152101516723633, -0.007051719352602959, -0.0039513371884822845, -0.0008509550243616104, 0.0022494271397590637, 0.005349809303879738, 0.008450191468000412, 0.011550573632121086, 0.01465095579624176, 0.017751337960362434, 0.02085172012448311, 0.023952102288603783, 0.027052484452724457, 0.03015286661684513, 0.033253248780965805, 0.03635363280773163, 0.03945401310920715, 0.04255439341068268, 0.0456547774374485, 0.048755161464214325, 0.05185554176568985, 0.054955922067165375, 0.0580563060939312, 0.06115669012069702, 0.06425707042217255, 0.06735745072364807, 0.0704578310251236, 0.07355821877717972, 0.07665859907865524, 0.07975897938013077, 0.08285936713218689, 0.08595974743366241, 0.08906012773513794]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 8.0, 13.0, 13.0, 14.0, 18.0, 18.0, 26.0, 32.0, 45.0, 44.0, 50.0, 48.0, 50.0, 46.0, 57.0, 53.0, 45.0, 50.0, 40.0, 56.0, 51.0, 33.0, 22.0, 23.0, 27.0, 16.0, 20.0, 23.0, 13.0, 10.0, 9.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.8828125, -4.74432373046875, -4.6058349609375, -4.46734619140625, -4.328857421875, -4.19036865234375, -4.0518798828125, -3.91339111328125, -3.77490234375, -3.63641357421875, -3.4979248046875, -3.35943603515625, -3.220947265625, -3.08245849609375, -2.9439697265625, -2.80548095703125, -2.6669921875, -2.52850341796875, -2.3900146484375, -2.25152587890625, -2.113037109375, -1.97454833984375, -1.8360595703125, -1.69757080078125, -1.55908203125, -1.42059326171875, -1.2821044921875, -1.14361572265625, -1.005126953125, -0.86663818359375, -0.7281494140625, -0.58966064453125, -0.451171875, -0.31268310546875, -0.1741943359375, -0.03570556640625, 0.102783203125, 0.24127197265625, 0.3797607421875, 0.51824951171875, 0.65673828125, 0.79522705078125, 0.9337158203125, 1.07220458984375, 1.210693359375, 1.34918212890625, 1.4876708984375, 1.62615966796875, 1.7646484375, 1.90313720703125, 2.0416259765625, 2.18011474609375, 2.318603515625, 2.45709228515625, 2.5955810546875, 2.73406982421875, 2.87255859375, 3.01104736328125, 3.1495361328125, 3.28802490234375, 3.426513671875, 3.56500244140625, 3.7034912109375, 3.84197998046875, 3.98046875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 9.0, 11.0, 16.0, 21.0, 40.0, 68.0, 96.0, 161.0, 251.0, 566.0, 1027.0, 2135.0, 4492.0, 9747.0, 20836.0, 48904.0, 139405.0, 400524.0, 268345.0, 89204.0, 33626.0, 15165.0, 7129.0, 3376.0, 1578.0, 806.0, 401.0, 230.0, 119.0, 89.0, 56.0, 35.0, 25.0, 14.0, 18.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.8828125, -5.7137451171875, -5.544677734375, -5.3756103515625, -5.20654296875, -5.0374755859375, -4.868408203125, -4.6993408203125, -4.5302734375, -4.3612060546875, -4.192138671875, -4.0230712890625, -3.85400390625, -3.6849365234375, -3.515869140625, -3.3468017578125, -3.177734375, -3.0086669921875, -2.839599609375, -2.6705322265625, -2.50146484375, -2.3323974609375, -2.163330078125, -1.9942626953125, -1.8251953125, -1.6561279296875, -1.487060546875, -1.3179931640625, -1.14892578125, -0.9798583984375, -0.810791015625, -0.6417236328125, -0.47265625, -0.3035888671875, -0.134521484375, 0.0345458984375, 0.20361328125, 0.3726806640625, 0.541748046875, 0.7108154296875, 0.8798828125, 1.0489501953125, 1.218017578125, 1.3870849609375, 1.55615234375, 1.7252197265625, 1.894287109375, 2.0633544921875, 2.232421875, 2.4014892578125, 2.570556640625, 2.7396240234375, 2.90869140625, 3.0777587890625, 3.246826171875, 3.4158935546875, 3.5849609375, 3.7540283203125, 3.923095703125, 4.0921630859375, 4.26123046875, 4.4302978515625, 4.599365234375, 4.7684326171875, 4.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 2.0, 6.0, 11.0, 9.0, 7.0, 16.0, 15.0, 21.0, 19.0, 28.0, 26.0, 38.0, 34.0, 41.0, 61.0, 73.0, 116.0, 295.0, 1503.0, 251.0, 88.0, 60.0, 43.0, 44.0, 39.0, 28.0, 29.0, 29.0, 25.0, 20.0, 17.0, 14.0, 7.0, 9.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.21875, -12.7686767578125, -12.318603515625, -11.8685302734375, -11.41845703125, -10.9683837890625, -10.518310546875, -10.0682373046875, -9.6181640625, -9.1680908203125, -8.718017578125, -8.2679443359375, -7.81787109375, -7.3677978515625, -6.917724609375, -6.4676513671875, -6.017578125, -5.5675048828125, -5.117431640625, -4.6673583984375, -4.21728515625, -3.7672119140625, -3.317138671875, -2.8670654296875, -2.4169921875, -1.9669189453125, -1.516845703125, -1.0667724609375, -0.61669921875, -0.1666259765625, 0.283447265625, 0.7335205078125, 1.18359375, 1.6336669921875, 2.083740234375, 2.5338134765625, 2.98388671875, 3.4339599609375, 3.884033203125, 4.3341064453125, 4.7841796875, 5.2342529296875, 5.684326171875, 6.1343994140625, 6.58447265625, 7.0345458984375, 7.484619140625, 7.9346923828125, 8.384765625, 8.8348388671875, 9.284912109375, 9.7349853515625, 10.18505859375, 10.6351318359375, 11.085205078125, 11.5352783203125, 11.9853515625, 12.4354248046875, 12.885498046875, 13.3355712890625, 13.78564453125, 14.2357177734375, 14.685791015625, 15.1358642578125, 15.5859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 5.0, 7.0, 5.0, 14.0, 7.0, 18.0, 18.0, 27.0, 40.0, 40.0, 52.0, 66.0, 97.0, 126.0, 168.0, 272.0, 498.0, 2113.0, 97792.0, 3003356.0, 38226.0, 1389.0, 438.0, 237.0, 161.0, 138.0, 80.0, 68.0, 57.0, 39.0, 37.0, 26.0, 17.0, 13.0, 9.0, 6.0, 13.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.828125, -27.9384765625, -27.048828125, -26.1591796875, -25.26953125, -24.3798828125, -23.490234375, -22.6005859375, -21.7109375, -20.8212890625, -19.931640625, -19.0419921875, -18.15234375, -17.2626953125, -16.373046875, -15.4833984375, -14.59375, -13.7041015625, -12.814453125, -11.9248046875, -11.03515625, -10.1455078125, -9.255859375, -8.3662109375, -7.4765625, -6.5869140625, -5.697265625, -4.8076171875, -3.91796875, -3.0283203125, -2.138671875, -1.2490234375, -0.359375, 0.5302734375, 1.419921875, 2.3095703125, 3.19921875, 4.0888671875, 4.978515625, 5.8681640625, 6.7578125, 7.6474609375, 8.537109375, 9.4267578125, 10.31640625, 11.2060546875, 12.095703125, 12.9853515625, 13.875, 14.7646484375, 15.654296875, 16.5439453125, 17.43359375, 18.3232421875, 19.212890625, 20.1025390625, 20.9921875, 21.8818359375, 22.771484375, 23.6611328125, 24.55078125, 25.4404296875, 26.330078125, 27.2197265625, 28.109375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 44.0, 123.0, 241.0, 300.0, 179.0, 95.0, 17.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1440658569336, -69.6980209350586, -68.25196838378906, -66.80592346191406, -65.35987854003906, -63.91383361816406, -62.4677848815918, -61.02173614501953, -59.57569122314453, -58.12964630126953, -56.683597564697266, -55.237548828125, -53.79150390625, -52.345458984375, -50.899410247802734, -49.45336151123047, -48.00731658935547, -46.56127166748047, -45.1152229309082, -43.66917419433594, -42.22312927246094, -40.77708435058594, -39.33103561401367, -37.884986877441406, -36.438941955566406, -34.992897033691406, -33.54684829711914, -32.100799560546875, -30.654754638671875, -29.208707809448242, -27.76266098022461, -26.316614151000977, -24.870569229125977, -23.424522399902344, -21.97847557067871, -20.532428741455078, -19.086381912231445, -17.640335083007812, -16.19428825378418, -14.748241424560547, -13.302194595336914, -11.856147766113281, -10.410100936889648, -8.964054107666016, -7.518007278442383, -6.07196044921875, -4.625913619995117, -3.1798667907714844, -1.7338199615478516, -0.28777313232421875, 1.158273696899414, 2.604320526123047, 4.05036735534668, 5.4964141845703125, 6.942461013793945, 8.388507843017578, 9.834554672241211, 11.280601501464844, 12.726648330688477, 14.17269515991211, 15.618741989135742, 17.064788818359375, 18.510835647583008, 19.95688247680664, 21.402929306030273]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 12.0, 6.0, 19.0, 15.0, 29.0, 27.0, 20.0, 25.0, 38.0, 36.0, 28.0, 43.0, 33.0, 42.0, 43.0, 52.0, 50.0, 42.0, 48.0, 47.0, 35.0, 32.0, 36.0, 39.0, 37.0, 28.0, 25.0, 20.0, 17.0, 20.0, 13.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.60454559326172, -33.4927864074707, -32.38103103637695, -31.269271850585938, -30.157514572143555, -29.045757293701172, -27.93400001525879, -26.822242736816406, -25.71048355102539, -24.598726272583008, -23.486968994140625, -22.37520980834961, -21.263452529907227, -20.151695251464844, -19.03993797302246, -17.928180694580078, -16.816423416137695, -15.704666137695312, -14.592907905578613, -13.48115062713623, -12.369392395019531, -11.257635116577148, -10.145877838134766, -9.034120559692383, -7.922362327575684, -6.810604572296143, -5.698846817016602, -4.587089538574219, -3.4753317832946777, -2.3635740280151367, -1.251816749572754, -0.1400589942932129, 0.9716987609863281, 2.083456516265869, 3.195214033126831, 4.306971549987793, 5.418729305267334, 6.530487060546875, 7.642244338989258, 8.75400161743164, 9.86575984954834, 10.977517127990723, 12.089275360107422, 13.201032638549805, 14.312789916992188, 15.424548149108887, 16.536304473876953, 17.64806365966797, 18.75982093811035, 19.871578216552734, 20.983335494995117, 22.0950927734375, 23.206851959228516, 24.3186092376709, 25.43036651611328, 26.542123794555664, 27.653881072998047, 28.76563835144043, 29.877395629882812, 30.989154815673828, 32.10091018676758, 33.212669372558594, 34.324424743652344, 35.43618392944336, 36.547943115234375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 13.0, 11.0, 19.0, 17.0, 21.0, 17.0, 24.0, 24.0, 35.0, 40.0, 42.0, 39.0, 46.0, 37.0, 47.0, 59.0, 51.0, 42.0, 45.0, 40.0, 43.0, 37.0, 33.0, 30.0, 24.0, 32.0, 19.0, 19.0, 17.0, 19.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.90625, -4.769012451171875, -4.63177490234375, -4.494537353515625, -4.3572998046875, -4.220062255859375, -4.08282470703125, -3.945587158203125, -3.808349609375, -3.671112060546875, -3.53387451171875, -3.396636962890625, -3.2593994140625, -3.122161865234375, -2.98492431640625, -2.847686767578125, -2.71044921875, -2.573211669921875, -2.43597412109375, -2.298736572265625, -2.1614990234375, -2.024261474609375, -1.88702392578125, -1.749786376953125, -1.612548828125, -1.475311279296875, -1.33807373046875, -1.200836181640625, -1.0635986328125, -0.926361083984375, -0.78912353515625, -0.651885986328125, -0.5146484375, -0.377410888671875, -0.24017333984375, -0.102935791015625, 0.0343017578125, 0.171539306640625, 0.30877685546875, 0.446014404296875, 0.583251953125, 0.720489501953125, 0.85772705078125, 0.994964599609375, 1.1322021484375, 1.269439697265625, 1.40667724609375, 1.543914794921875, 1.68115234375, 1.818389892578125, 1.95562744140625, 2.092864990234375, 2.2301025390625, 2.367340087890625, 2.50457763671875, 2.641815185546875, 2.779052734375, 2.916290283203125, 3.05352783203125, 3.190765380859375, 3.3280029296875, 3.465240478515625, 3.60247802734375, 3.739715576171875, 3.876953125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 1.0, 11.0, 12.0, 14.0, 20.0, 24.0, 29.0, 37.0, 64.0, 87.0, 131.0, 197.0, 346.0, 636.0, 1529.0, 3997.0, 15175.0, 99736.0, 813094.0, 2435430.0, 717249.0, 86040.0, 13635.0, 3674.0, 1357.0, 685.0, 369.0, 226.0, 131.0, 102.0, 54.0, 48.0, 33.0, 25.0, 24.0, 17.0, 10.0, 9.0, 8.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.8125, -8.5491943359375, -8.285888671875, -8.0225830078125, -7.75927734375, -7.4959716796875, -7.232666015625, -6.9693603515625, -6.7060546875, -6.4427490234375, -6.179443359375, -5.9161376953125, -5.65283203125, -5.3895263671875, -5.126220703125, -4.8629150390625, -4.599609375, -4.3363037109375, -4.072998046875, -3.8096923828125, -3.54638671875, -3.2830810546875, -3.019775390625, -2.7564697265625, -2.4931640625, -2.2298583984375, -1.966552734375, -1.7032470703125, -1.43994140625, -1.1766357421875, -0.913330078125, -0.6500244140625, -0.38671875, -0.1234130859375, 0.139892578125, 0.4031982421875, 0.66650390625, 0.9298095703125, 1.193115234375, 1.4564208984375, 1.7197265625, 1.9830322265625, 2.246337890625, 2.5096435546875, 2.77294921875, 3.0362548828125, 3.299560546875, 3.5628662109375, 3.826171875, 4.0894775390625, 4.352783203125, 4.6160888671875, 4.87939453125, 5.1427001953125, 5.406005859375, 5.6693115234375, 5.9326171875, 6.1959228515625, 6.459228515625, 6.7225341796875, 6.98583984375, 7.2491455078125, 7.512451171875, 7.7757568359375, 8.0390625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 6.0, 11.0, 12.0, 13.0, 19.0, 23.0, 35.0, 37.0, 41.0, 95.0, 109.0, 119.0, 155.0, 215.0, 308.0, 379.0, 402.0, 400.0, 352.0, 308.0, 267.0, 191.0, 138.0, 113.0, 74.0, 59.0, 41.0, 29.0, 32.0, 13.0, 9.0, 10.0, 11.0, 13.0, 6.0, 4.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.46484375, -7.264404296875, -7.06396484375, -6.863525390625, -6.6630859375, -6.462646484375, -6.26220703125, -6.061767578125, -5.861328125, -5.660888671875, -5.46044921875, -5.260009765625, -5.0595703125, -4.859130859375, -4.65869140625, -4.458251953125, -4.2578125, -4.057373046875, -3.85693359375, -3.656494140625, -3.4560546875, -3.255615234375, -3.05517578125, -2.854736328125, -2.654296875, -2.453857421875, -2.25341796875, -2.052978515625, -1.8525390625, -1.652099609375, -1.45166015625, -1.251220703125, -1.05078125, -0.850341796875, -0.64990234375, -0.449462890625, -0.2490234375, -0.048583984375, 0.15185546875, 0.352294921875, 0.552734375, 0.753173828125, 0.95361328125, 1.154052734375, 1.3544921875, 1.554931640625, 1.75537109375, 1.955810546875, 2.15625, 2.356689453125, 2.55712890625, 2.757568359375, 2.9580078125, 3.158447265625, 3.35888671875, 3.559326171875, 3.759765625, 3.960205078125, 4.16064453125, 4.361083984375, 4.5615234375, 4.761962890625, 4.96240234375, 5.162841796875, 5.36328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 9.0, 8.0, 13.0, 16.0, 36.0, 36.0, 43.0, 72.0, 93.0, 143.0, 186.0, 325.0, 710.0, 3316.0, 126616.0, 3885839.0, 171106.0, 3820.0, 793.0, 330.0, 181.0, 146.0, 123.0, 84.0, 39.0, 40.0, 32.0, 25.0, 8.0, 14.0, 17.0, 7.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.5498046875, -22.662109375, -21.7744140625, -20.88671875, -19.9990234375, -19.111328125, -18.2236328125, -17.3359375, -16.4482421875, -15.560546875, -14.6728515625, -13.78515625, -12.8974609375, -12.009765625, -11.1220703125, -10.234375, -9.3466796875, -8.458984375, -7.5712890625, -6.68359375, -5.7958984375, -4.908203125, -4.0205078125, -3.1328125, -2.2451171875, -1.357421875, -0.4697265625, 0.41796875, 1.3056640625, 2.193359375, 3.0810546875, 3.96875, 4.8564453125, 5.744140625, 6.6318359375, 7.51953125, 8.4072265625, 9.294921875, 10.1826171875, 11.0703125, 11.9580078125, 12.845703125, 13.7333984375, 14.62109375, 15.5087890625, 16.396484375, 17.2841796875, 18.171875, 19.0595703125, 19.947265625, 20.8349609375, 21.72265625, 22.6103515625, 23.498046875, 24.3857421875, 25.2734375, 26.1611328125, 27.048828125, 27.9365234375, 28.82421875, 29.7119140625, 30.599609375, 31.4873046875, 32.375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 82.0, 210.0, 294.0, 277.0, 108.0, 20.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.97957229614258, -34.079280853271484, -31.17898941040039, -28.278697967529297, -25.378406524658203, -22.47811508178711, -19.577821731567383, -16.67753028869629, -13.777238845825195, -10.876947402954102, -7.97665548324585, -5.076363563537598, -2.176072120666504, 0.7242193222045898, 3.62451171875, 6.524803161621094, 9.425094604492188, 12.325386047363281, 15.225677490234375, 18.12596893310547, 21.026260375976562, 23.926551818847656, 26.826845169067383, 29.727136611938477, 32.62742614746094, 35.52771759033203, 38.428009033203125, 41.32830047607422, 44.22859191894531, 47.128883361816406, 50.0291748046875, 52.929466247558594, 55.82976531982422, 58.73005676269531, 61.630348205566406, 64.5306396484375, 67.4309310913086, 70.33122253417969, 73.23151397705078, 76.13180541992188, 79.03209686279297, 81.93238830566406, 84.83267974853516, 87.73297119140625, 90.63326263427734, 93.53355407714844, 96.43384552001953, 99.33413696289062, 102.23443603515625, 105.13472747802734, 108.03501892089844, 110.93531036376953, 113.83560180664062, 116.73589324951172, 119.63618469238281, 122.5364761352539, 125.436767578125, 128.33706665039062, 131.2373504638672, 134.1376495361328, 137.03793334960938, 139.938232421875, 142.83851623535156, 145.7388153076172, 148.63909912109375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 7.0, 9.0, 13.0, 12.0, 17.0, 10.0, 19.0, 15.0, 27.0, 27.0, 24.0, 27.0, 33.0, 27.0, 30.0, 22.0, 38.0, 33.0, 26.0, 49.0, 38.0, 37.0, 35.0, 30.0, 31.0, 28.0, 25.0, 30.0, 31.0, 20.0, 31.0, 19.0, 24.0, 16.0, 14.0, 14.0, 25.0, 15.0, 7.0, 4.0, 6.0, 8.0, 3.0, 9.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.96987533569336, -18.367971420288086, -17.766067504882812, -17.16416358947754, -16.562259674072266, -15.960355758666992, -15.358450889587402, -14.756546974182129, -14.154643058776855, -13.552739143371582, -12.950835227966309, -12.348931312561035, -11.747026443481445, -11.145122528076172, -10.543218612670898, -9.941314697265625, -9.339410781860352, -8.737506866455078, -8.135602951049805, -7.533698558807373, -6.9317946434021, -6.329890727996826, -5.7279863357543945, -5.126082420349121, -4.524178504943848, -3.922274589538574, -3.3203704357147217, -2.718466281890869, -2.1165623664855957, -1.5146584510803223, -0.9127542972564697, -0.3108501434326172, 0.29105186462402344, 0.8929558992385864, 1.4948599338531494, 2.096764087677002, 2.6986680030822754, 3.300571918487549, 3.9024760723114014, 4.504380226135254, 5.106284141540527, 5.708188056945801, 6.310091972351074, 6.911996364593506, 7.513900279998779, 8.115804672241211, 8.717708587646484, 9.319612503051758, 9.921516418457031, 10.523420333862305, 11.125324249267578, 11.727228164672852, 12.329132080078125, 12.931035995483398, 13.532940864562988, 14.134844779968262, 14.736748695373535, 15.338652610778809, 15.940556526184082, 16.542461395263672, 17.144365310668945, 17.74626922607422, 18.348173141479492, 18.950077056884766, 19.55198097229004]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 12.0, 14.0, 17.0, 17.0, 16.0, 25.0, 30.0, 26.0, 39.0, 41.0, 41.0, 46.0, 41.0, 53.0, 57.0, 55.0, 55.0, 55.0, 30.0, 46.0, 36.0, 32.0, 33.0, 31.0, 20.0, 21.0, 17.0, 19.0, 16.0, 13.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.42578125, -4.29241943359375, -4.1590576171875, -4.02569580078125, -3.892333984375, -3.75897216796875, -3.6256103515625, -3.49224853515625, -3.35888671875, -3.22552490234375, -3.0921630859375, -2.95880126953125, -2.825439453125, -2.69207763671875, -2.5587158203125, -2.42535400390625, -2.2919921875, -2.15863037109375, -2.0252685546875, -1.89190673828125, -1.758544921875, -1.62518310546875, -1.4918212890625, -1.35845947265625, -1.22509765625, -1.09173583984375, -0.9583740234375, -0.82501220703125, -0.691650390625, -0.55828857421875, -0.4249267578125, -0.29156494140625, -0.158203125, -0.02484130859375, 0.1085205078125, 0.24188232421875, 0.375244140625, 0.50860595703125, 0.6419677734375, 0.77532958984375, 0.90869140625, 1.04205322265625, 1.1754150390625, 1.30877685546875, 1.442138671875, 1.57550048828125, 1.7088623046875, 1.84222412109375, 1.9755859375, 2.10894775390625, 2.2423095703125, 2.37567138671875, 2.509033203125, 2.64239501953125, 2.7757568359375, 2.90911865234375, 3.04248046875, 3.17584228515625, 3.3092041015625, 3.44256591796875, 3.575927734375, 3.70928955078125, 3.8426513671875, 3.97601318359375, 4.109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 11.0, 13.0, 26.0, 34.0, 43.0, 53.0, 90.0, 160.0, 214.0, 377.0, 513.0, 863.0, 1435.0, 2408.0, 3779.0, 6322.0, 10607.0, 17875.0, 28915.0, 45621.0, 69992.0, 101121.0, 132298.0, 152796.0, 141552.0, 111630.0, 79972.0, 53031.0, 33886.0, 20824.0, 12577.0, 7583.0, 4539.0, 2799.0, 1702.0, 1019.0, 675.0, 440.0, 281.0, 134.0, 125.0, 75.0, 46.0, 42.0, 23.0, 12.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.337860107421875, -0.32684326171875, -0.315826416015625, -0.3048095703125, -0.293792724609375, -0.28277587890625, -0.271759033203125, -0.2607421875, -0.249725341796875, -0.23870849609375, -0.227691650390625, -0.2166748046875, -0.205657958984375, -0.19464111328125, -0.183624267578125, -0.172607421875, -0.161590576171875, -0.15057373046875, -0.139556884765625, -0.1285400390625, -0.117523193359375, -0.10650634765625, -0.095489501953125, -0.08447265625, -0.073455810546875, -0.06243896484375, -0.051422119140625, -0.0404052734375, -0.029388427734375, -0.01837158203125, -0.007354736328125, 0.003662109375, 0.014678955078125, 0.02569580078125, 0.036712646484375, 0.0477294921875, 0.058746337890625, 0.06976318359375, 0.080780029296875, 0.091796875, 0.102813720703125, 0.11383056640625, 0.124847412109375, 0.1358642578125, 0.146881103515625, 0.15789794921875, 0.168914794921875, 0.179931640625, 0.190948486328125, 0.20196533203125, 0.212982177734375, 0.2239990234375, 0.235015869140625, 0.24603271484375, 0.257049560546875, 0.26806640625, 0.279083251953125, 0.29010009765625, 0.301116943359375, 0.3121337890625, 0.323150634765625, 0.33416748046875, 0.345184326171875, 0.356201171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 10.0, 13.0, 17.0, 20.0, 16.0, 21.0, 33.0, 31.0, 24.0, 27.0, 30.0, 35.0, 30.0, 39.0, 39.0, 45.0, 1071.0, 45.0, 43.0, 34.0, 32.0, 40.0, 39.0, 38.0, 30.0, 34.0, 23.0, 18.0, 22.0, 14.0, 22.0, 12.0, 10.0, 11.0, 9.0, 5.0, 0.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6640625, -2.5802001953125, -2.496337890625, -2.4124755859375, -2.32861328125, -2.2447509765625, -2.160888671875, -2.0770263671875, -1.9931640625, -1.9093017578125, -1.825439453125, -1.7415771484375, -1.65771484375, -1.5738525390625, -1.489990234375, -1.4061279296875, -1.322265625, -1.2384033203125, -1.154541015625, -1.0706787109375, -0.98681640625, -0.9029541015625, -0.819091796875, -0.7352294921875, -0.6513671875, -0.5675048828125, -0.483642578125, -0.3997802734375, -0.31591796875, -0.2320556640625, -0.148193359375, -0.0643310546875, 0.01953125, 0.1033935546875, 0.187255859375, 0.2711181640625, 0.35498046875, 0.4388427734375, 0.522705078125, 0.6065673828125, 0.6904296875, 0.7742919921875, 0.858154296875, 0.9420166015625, 1.02587890625, 1.1097412109375, 1.193603515625, 1.2774658203125, 1.361328125, 1.4451904296875, 1.529052734375, 1.6129150390625, 1.69677734375, 1.7806396484375, 1.864501953125, 1.9483642578125, 2.0322265625, 2.1160888671875, 2.199951171875, 2.2838134765625, 2.36767578125, 2.4515380859375, 2.535400390625, 2.6192626953125, 2.703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 5.0, 13.0, 19.0, 17.0, 18.0, 21.0, 37.0, 73.0, 76.0, 147.0, 221.0, 318.0, 488.0, 757.0, 1444.0, 2624.0, 4514.0, 8807.0, 17474.0, 35231.0, 70267.0, 130126.0, 289671.0, 1174457.0, 167477.0, 94612.0, 48424.0, 23847.0, 11972.0, 6138.0, 3190.0, 1888.0, 972.0, 612.0, 416.0, 256.0, 150.0, 106.0, 92.0, 39.0, 43.0, 17.0, 15.0, 14.0, 10.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.27978515625, -0.2711029052734375, -0.262420654296875, -0.2537384033203125, -0.24505615234375, -0.2363739013671875, -0.227691650390625, -0.2190093994140625, -0.2103271484375, -0.2016448974609375, -0.192962646484375, -0.1842803955078125, -0.17559814453125, -0.1669158935546875, -0.158233642578125, -0.1495513916015625, -0.140869140625, -0.1321868896484375, -0.123504638671875, -0.1148223876953125, -0.10614013671875, -0.0974578857421875, -0.088775634765625, -0.0800933837890625, -0.0714111328125, -0.0627288818359375, -0.054046630859375, -0.0453643798828125, -0.03668212890625, -0.0279998779296875, -0.019317626953125, -0.0106353759765625, -0.001953125, 0.0067291259765625, 0.015411376953125, 0.0240936279296875, 0.03277587890625, 0.0414581298828125, 0.050140380859375, 0.0588226318359375, 0.0675048828125, 0.0761871337890625, 0.084869384765625, 0.0935516357421875, 0.10223388671875, 0.1109161376953125, 0.119598388671875, 0.1282806396484375, 0.136962890625, 0.1456451416015625, 0.154327392578125, 0.1630096435546875, 0.17169189453125, 0.1803741455078125, 0.189056396484375, 0.1977386474609375, 0.2064208984375, 0.2151031494140625, 0.223785400390625, 0.2324676513671875, 0.24114990234375, 0.2498321533203125, 0.258514404296875, 0.2671966552734375, 0.27587890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 6.0, 7.0, 4.0, 5.0, 13.0, 17.0, 20.0, 25.0, 41.0, 47.0, 68.0, 89.0, 83.0, 108.0, 81.0, 99.0, 73.0, 57.0, 43.0, 28.0, 14.0, 14.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043365478515625, -0.04194307327270508, -0.040520668029785156, -0.039098262786865234, -0.03767585754394531, -0.03625345230102539, -0.03483104705810547, -0.03340864181518555, -0.031986236572265625, -0.030563831329345703, -0.02914142608642578, -0.02771902084350586, -0.026296615600585938, -0.024874210357666016, -0.023451805114746094, -0.022029399871826172, -0.02060699462890625, -0.019184589385986328, -0.017762184143066406, -0.016339778900146484, -0.014917373657226562, -0.01349496841430664, -0.012072563171386719, -0.010650157928466797, -0.009227752685546875, -0.007805347442626953, -0.006382942199707031, -0.004960536956787109, -0.0035381317138671875, -0.0021157264709472656, -0.0006933212280273438, 0.0007290840148925781, 0.0021514892578125, 0.003573894500732422, 0.004996299743652344, 0.006418704986572266, 0.007841110229492188, 0.00926351547241211, 0.010685920715332031, 0.012108325958251953, 0.013530731201171875, 0.014953136444091797, 0.01637554168701172, 0.01779794692993164, 0.019220352172851562, 0.020642757415771484, 0.022065162658691406, 0.023487567901611328, 0.02490997314453125, 0.026332378387451172, 0.027754783630371094, 0.029177188873291016, 0.030599594116210938, 0.03202199935913086, 0.03344440460205078, 0.0348668098449707, 0.036289215087890625, 0.03771162033081055, 0.03913402557373047, 0.04055643081665039, 0.04197883605957031, 0.043401241302490234, 0.044823646545410156, 0.04624605178833008, 0.04766845703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 5.0, 3.0, 6.0, 10.0, 9.0, 17.0, 14.0, 17.0, 42.0, 60.0, 99.0, 166.0, 456.0, 6153.0, 1027245.0, 13211.0, 520.0, 197.0, 96.0, 69.0, 35.0, 30.0, 20.0, 9.0, 17.0, 7.0, 6.0, 4.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0263671875, -0.99578857421875, -0.9652099609375, -0.93463134765625, -0.904052734375, -0.87347412109375, -0.8428955078125, -0.81231689453125, -0.78173828125, -0.75115966796875, -0.7205810546875, -0.69000244140625, -0.659423828125, -0.62884521484375, -0.5982666015625, -0.56768798828125, -0.537109375, -0.50653076171875, -0.4759521484375, -0.44537353515625, -0.414794921875, -0.38421630859375, -0.3536376953125, -0.32305908203125, -0.29248046875, -0.26190185546875, -0.2313232421875, -0.20074462890625, -0.170166015625, -0.13958740234375, -0.1090087890625, -0.07843017578125, -0.0478515625, -0.01727294921875, 0.0133056640625, 0.04388427734375, 0.074462890625, 0.10504150390625, 0.1356201171875, 0.16619873046875, 0.19677734375, 0.22735595703125, 0.2579345703125, 0.28851318359375, 0.319091796875, 0.34967041015625, 0.3802490234375, 0.41082763671875, 0.44140625, 0.47198486328125, 0.5025634765625, 0.53314208984375, 0.563720703125, 0.59429931640625, 0.6248779296875, 0.65545654296875, 0.68603515625, 0.71661376953125, 0.7471923828125, 0.77777099609375, 0.808349609375, 0.83892822265625, 0.8695068359375, 0.90008544921875, 0.9306640625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 16.0, 23.0, 41.0, 72.0, 128.0, 204.0, 203.0, 130.0, 68.0, 46.0, 26.0, 14.0, 14.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21625910699367523, -0.21156220138072968, -0.2068653106689453, -0.20216840505599976, -0.1974715143442154, -0.19277460873126984, -0.18807771801948547, -0.18338081240653992, -0.17868392169475555, -0.17398701608181, -0.16929012537002563, -0.16459321975708008, -0.15989632904529572, -0.15519942343235016, -0.1505025327205658, -0.14580562710762024, -0.14110872149467468, -0.13641181588172913, -0.13171492516994476, -0.1270180195569992, -0.12232112884521484, -0.11762423068284988, -0.11292733252048492, -0.10823042690753937, -0.103533536195755, -0.09883663803339005, -0.09413973987102509, -0.08944284170866013, -0.08474594354629517, -0.0800490453839302, -0.07535214722156525, -0.07065524160861969, -0.06595835834741592, -0.061261460185050964, -0.056564562022686005, -0.051867663860321045, -0.047170765697956085, -0.042473867535591125, -0.03777696564793587, -0.03308006748557091, -0.028383169323205948, -0.023686271160840988, -0.01898937299847603, -0.01429247297346592, -0.00959557481110096, -0.004898676648736, -0.0002017766237258911, 0.004495121538639069, 0.009192019701004028, 0.013888917863368988, 0.018585816025733948, 0.023282716050744057, 0.027979614213109016, 0.03267651051282883, 0.037373412400484085, 0.042070310562849045, 0.046767208725214005, 0.051464106887578964, 0.056161005049943924, 0.06085790693759918, 0.06555480509996414, 0.0702517032623291, 0.07494860142469406, 0.07964549958705902, 0.08434239774942398]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 11.0, 8.0, 3.0, 12.0, 11.0, 17.0, 19.0, 20.0, 18.0, 19.0, 19.0, 44.0, 37.0, 32.0, 36.0, 30.0, 31.0, 33.0, 42.0, 36.0, 44.0, 40.0, 38.0, 34.0, 43.0, 30.0, 32.0, 26.0, 30.0, 22.0, 24.0, 21.0, 21.0, 17.0, 18.0, 15.0, 15.0, 13.0, 8.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06199944019317627, -0.05991858243942261, -0.057837724685668945, -0.055756863206624985, -0.05367600545287132, -0.05159514769911766, -0.0495142862200737, -0.04743342846632004, -0.045352570712566376, -0.043271712958812714, -0.04119085520505905, -0.03910999372601509, -0.03702913597226143, -0.03494827821850777, -0.032867416739463806, -0.030786558985710144, -0.028705701231956482, -0.02662484347820282, -0.02454398386180401, -0.022463124245405197, -0.020382266491651535, -0.018301408737897873, -0.01622054912149906, -0.014139690436422825, -0.012058831751346588, -0.009977973066270351, -0.007897114381194115, -0.005816255696117878, -0.0037353970110416412, -0.0016545383259654045, 0.0004263203591108322, 0.002507179044187069, 0.004588037729263306, 0.006668896414339542, 0.008749755099415779, 0.010830613784492016, 0.012911472469568253, 0.01499233115464449, 0.017073189839720726, 0.019154049456119537, 0.0212349072098732, 0.02331576496362686, 0.025396624580025673, 0.027477484196424484, 0.029558341950178146, 0.03163919970393181, 0.03372006118297577, 0.03580091893672943, 0.03788177669048309, 0.039962634444236755, 0.04204349219799042, 0.04412435367703438, 0.04620521143078804, 0.0482860691845417, 0.05036693066358566, 0.052447788417339325, 0.05452864617109299, 0.05660950392484665, 0.05869036167860031, 0.06077122315764427, 0.06285208463668823, 0.0649329423904419, 0.06701380014419556, 0.06909465789794922, 0.07117551565170288]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 9.0, 10.0, 12.0, 21.0, 16.0, 14.0, 18.0, 38.0, 34.0, 37.0, 34.0, 28.0, 43.0, 44.0, 47.0, 50.0, 51.0, 53.0, 38.0, 44.0, 46.0, 39.0, 39.0, 25.0, 34.0, 19.0, 24.0, 23.0, 23.0, 14.0, 8.0, 12.0, 10.0, 5.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.19921875, -4.073394775390625, -3.94757080078125, -3.821746826171875, -3.6959228515625, -3.570098876953125, -3.44427490234375, -3.318450927734375, -3.192626953125, -3.066802978515625, -2.94097900390625, -2.815155029296875, -2.6893310546875, -2.563507080078125, -2.43768310546875, -2.311859130859375, -2.18603515625, -2.060211181640625, -1.93438720703125, -1.808563232421875, -1.6827392578125, -1.556915283203125, -1.43109130859375, -1.305267333984375, -1.179443359375, -1.053619384765625, -0.92779541015625, -0.801971435546875, -0.6761474609375, -0.550323486328125, -0.42449951171875, -0.298675537109375, -0.1728515625, -0.047027587890625, 0.07879638671875, 0.204620361328125, 0.3304443359375, 0.456268310546875, 0.58209228515625, 0.707916259765625, 0.833740234375, 0.959564208984375, 1.08538818359375, 1.211212158203125, 1.3370361328125, 1.462860107421875, 1.58868408203125, 1.714508056640625, 1.84033203125, 1.966156005859375, 2.09197998046875, 2.217803955078125, 2.3436279296875, 2.469451904296875, 2.59527587890625, 2.721099853515625, 2.846923828125, 2.972747802734375, 3.09857177734375, 3.224395751953125, 3.3502197265625, 3.476043701171875, 3.60186767578125, 3.727691650390625, 3.853515625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 14.0, 18.0, 20.0, 37.0, 36.0, 67.0, 101.0, 183.0, 380.0, 710.0, 1444.0, 3026.0, 6043.0, 12870.0, 28133.0, 65140.0, 156580.0, 362840.0, 237081.0, 97891.0, 40856.0, 18334.0, 8520.0, 4073.0, 2004.0, 987.0, 518.0, 242.0, 126.0, 94.0, 55.0, 37.0, 14.0, 16.0, 16.0, 9.0, 8.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9921875, -4.84417724609375, -4.6961669921875, -4.54815673828125, -4.400146484375, -4.25213623046875, -4.1041259765625, -3.95611572265625, -3.80810546875, -3.66009521484375, -3.5120849609375, -3.36407470703125, -3.216064453125, -3.06805419921875, -2.9200439453125, -2.77203369140625, -2.6240234375, -2.47601318359375, -2.3280029296875, -2.17999267578125, -2.031982421875, -1.88397216796875, -1.7359619140625, -1.58795166015625, -1.43994140625, -1.29193115234375, -1.1439208984375, -0.99591064453125, -0.847900390625, -0.69989013671875, -0.5518798828125, -0.40386962890625, -0.255859375, -0.10784912109375, 0.0401611328125, 0.18817138671875, 0.336181640625, 0.48419189453125, 0.6322021484375, 0.78021240234375, 0.92822265625, 1.07623291015625, 1.2242431640625, 1.37225341796875, 1.520263671875, 1.66827392578125, 1.8162841796875, 1.96429443359375, 2.1123046875, 2.26031494140625, 2.4083251953125, 2.55633544921875, 2.704345703125, 2.85235595703125, 3.0003662109375, 3.14837646484375, 3.29638671875, 3.44439697265625, 3.5924072265625, 3.74041748046875, 3.888427734375, 4.03643798828125, 4.1844482421875, 4.33245849609375, 4.48046875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 6.0, 11.0, 17.0, 22.0, 15.0, 24.0, 34.0, 35.0, 33.0, 34.0, 41.0, 62.0, 78.0, 122.0, 334.0, 1484.0, 216.0, 81.0, 57.0, 67.0, 43.0, 35.0, 37.0, 35.0, 28.0, 17.0, 17.0, 18.0, 7.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8408203125, -12.416015625, -11.9912109375, -11.56640625, -11.1416015625, -10.716796875, -10.2919921875, -9.8671875, -9.4423828125, -9.017578125, -8.5927734375, -8.16796875, -7.7431640625, -7.318359375, -6.8935546875, -6.46875, -6.0439453125, -5.619140625, -5.1943359375, -4.76953125, -4.3447265625, -3.919921875, -3.4951171875, -3.0703125, -2.6455078125, -2.220703125, -1.7958984375, -1.37109375, -0.9462890625, -0.521484375, -0.0966796875, 0.328125, 0.7529296875, 1.177734375, 1.6025390625, 2.02734375, 2.4521484375, 2.876953125, 3.3017578125, 3.7265625, 4.1513671875, 4.576171875, 5.0009765625, 5.42578125, 5.8505859375, 6.275390625, 6.7001953125, 7.125, 7.5498046875, 7.974609375, 8.3994140625, 8.82421875, 9.2490234375, 9.673828125, 10.0986328125, 10.5234375, 10.9482421875, 11.373046875, 11.7978515625, 12.22265625, 12.6474609375, 13.072265625, 13.4970703125, 13.921875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 17.0, 12.0, 12.0, 16.0, 25.0, 22.0, 40.0, 41.0, 54.0, 82.0, 111.0, 168.0, 247.0, 473.0, 1054.0, 4955.0, 524856.0, 2598222.0, 12350.0, 1379.0, 569.0, 283.0, 184.0, 124.0, 107.0, 74.0, 47.0, 40.0, 34.0, 27.0, 18.0, 13.0, 12.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.109375, -23.220947265625, -22.33251953125, -21.444091796875, -20.5556640625, -19.667236328125, -18.77880859375, -17.890380859375, -17.001953125, -16.113525390625, -15.22509765625, -14.336669921875, -13.4482421875, -12.559814453125, -11.67138671875, -10.782958984375, -9.89453125, -9.006103515625, -8.11767578125, -7.229248046875, -6.3408203125, -5.452392578125, -4.56396484375, -3.675537109375, -2.787109375, -1.898681640625, -1.01025390625, -0.121826171875, 0.7666015625, 1.655029296875, 2.54345703125, 3.431884765625, 4.3203125, 5.208740234375, 6.09716796875, 6.985595703125, 7.8740234375, 8.762451171875, 9.65087890625, 10.539306640625, 11.427734375, 12.316162109375, 13.20458984375, 14.093017578125, 14.9814453125, 15.869873046875, 16.75830078125, 17.646728515625, 18.53515625, 19.423583984375, 20.31201171875, 21.200439453125, 22.0888671875, 22.977294921875, 23.86572265625, 24.754150390625, 25.642578125, 26.531005859375, 27.41943359375, 28.307861328125, 29.1962890625, 30.084716796875, 30.97314453125, 31.861572265625, 32.75]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [3.0, 22.0, 180.0, 447.0, 293.0, 64.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.095093727111816, -5.907675743103027, -3.72025728225708, -1.5328388214111328, 0.6545791625976562, 2.8419971466064453, 5.029416084289551, 7.21683406829834, 9.404252052307129, 11.591670036315918, 13.779088973999023, 15.966506958007812, 18.1539249420166, 20.34134292602539, 22.528762817382812, 24.71617889404297, 26.90359878540039, 29.09101676940918, 31.27843475341797, 33.46585464477539, 35.65327072143555, 37.84069061279297, 40.028106689453125, 42.21552658081055, 44.4029426574707, 46.590362548828125, 48.77777862548828, 50.9651985168457, 53.15261459350586, 55.34003448486328, 57.52745056152344, 59.71487045288086, 61.90229034423828, 64.08970642089844, 66.27713012695312, 68.46454620361328, 70.65196228027344, 72.8393783569336, 75.02680206298828, 77.21421813964844, 79.4016342163086, 81.58905029296875, 83.77647399902344, 85.9638900756836, 88.15130615234375, 90.3387222290039, 92.5261459350586, 94.71356201171875, 96.90098571777344, 99.0884017944336, 101.27582550048828, 103.46324157714844, 105.6506576538086, 107.83807373046875, 110.02549743652344, 112.2129135131836, 114.40032958984375, 116.5877456665039, 118.7751693725586, 120.96258544921875, 123.1500015258789, 125.33741760253906, 127.52484130859375, 129.71224975585938, 131.89967346191406]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 6.0, 7.0, 5.0, 19.0, 13.0, 16.0, 14.0, 23.0, 17.0, 26.0, 29.0, 33.0, 35.0, 49.0, 34.0, 56.0, 41.0, 44.0, 45.0, 48.0, 39.0, 36.0, 46.0, 32.0, 27.0, 44.0, 31.0, 28.0, 15.0, 19.0, 23.0, 14.0, 15.0, 14.0, 6.0, 13.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.439697265625, -26.487749099731445, -25.53580093383789, -24.583852767944336, -23.63190460205078, -22.67995834350586, -21.728008270263672, -20.77606201171875, -19.824113845825195, -18.87216567993164, -17.920217514038086, -16.96826934814453, -16.016321182250977, -15.064373970031738, -14.112425804138184, -13.160478591918945, -12.208529472351074, -11.25658130645752, -10.304633140563965, -9.352685928344727, -8.400737762451172, -7.448789596557617, -6.4968414306640625, -5.544893741607666, -4.592945575714111, -3.6409976482391357, -2.68904972076416, -1.7371015548706055, -0.7851536273956299, 0.1667943000793457, 1.1187424659729004, 2.070690155029297, 3.0226383209228516, 3.974586248397827, 4.926534175872803, 5.878482341766357, 6.830430030822754, 7.782378196716309, 8.734326362609863, 9.686273574829102, 10.638221740722656, 11.590169906616211, 12.542118072509766, 13.49406623840332, 14.446013450622559, 15.397961616516113, 16.349910736083984, 17.301856994628906, 18.253807067871094, 19.20575523376465, 20.157703399658203, 21.109651565551758, 22.061599731445312, 23.013545989990234, 23.965496063232422, 24.917442321777344, 25.8693904876709, 26.821338653564453, 27.773286819458008, 28.725234985351562, 29.677183151245117, 30.629131317138672, 31.581077575683594, 32.53302764892578, 33.4849739074707]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 10.0, 12.0, 9.0, 19.0, 18.0, 22.0, 19.0, 24.0, 21.0, 39.0, 37.0, 42.0, 38.0, 34.0, 40.0, 53.0, 48.0, 47.0, 52.0, 58.0, 31.0, 45.0, 35.0, 30.0, 26.0, 25.0, 17.0, 24.0, 21.0, 25.0, 15.0, 9.0, 14.0, 5.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-4.79296875, -4.66033935546875, -4.5277099609375, -4.39508056640625, -4.262451171875, -4.12982177734375, -3.9971923828125, -3.86456298828125, -3.73193359375, -3.59930419921875, -3.4666748046875, -3.33404541015625, -3.201416015625, -3.06878662109375, -2.9361572265625, -2.80352783203125, -2.6708984375, -2.53826904296875, -2.4056396484375, -2.27301025390625, -2.140380859375, -2.00775146484375, -1.8751220703125, -1.74249267578125, -1.60986328125, -1.47723388671875, -1.3446044921875, -1.21197509765625, -1.079345703125, -0.94671630859375, -0.8140869140625, -0.68145751953125, -0.548828125, -0.41619873046875, -0.2835693359375, -0.15093994140625, -0.018310546875, 0.11431884765625, 0.2469482421875, 0.37957763671875, 0.51220703125, 0.64483642578125, 0.7774658203125, 0.91009521484375, 1.042724609375, 1.17535400390625, 1.3079833984375, 1.44061279296875, 1.5732421875, 1.70587158203125, 1.8385009765625, 1.97113037109375, 2.103759765625, 2.23638916015625, 2.3690185546875, 2.50164794921875, 2.63427734375, 2.76690673828125, 2.8995361328125, 3.03216552734375, 3.164794921875, 3.29742431640625, 3.4300537109375, 3.56268310546875, 3.6953125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 11.0, 11.0, 19.0, 23.0, 26.0, 39.0, 44.0, 55.0, 98.0, 216.0, 401.0, 1219.0, 5276.0, 49359.0, 772097.0, 2881957.0, 448400.0, 29599.0, 3661.0, 923.0, 357.0, 156.0, 101.0, 58.0, 36.0, 19.0, 17.0, 19.0, 25.0, 11.0, 11.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.20361328125, -10.8681640625, -10.53271484375, -10.197265625, -9.86181640625, -9.5263671875, -9.19091796875, -8.85546875, -8.52001953125, -8.1845703125, -7.84912109375, -7.513671875, -7.17822265625, -6.8427734375, -6.50732421875, -6.171875, -5.83642578125, -5.5009765625, -5.16552734375, -4.830078125, -4.49462890625, -4.1591796875, -3.82373046875, -3.48828125, -3.15283203125, -2.8173828125, -2.48193359375, -2.146484375, -1.81103515625, -1.4755859375, -1.14013671875, -0.8046875, -0.46923828125, -0.1337890625, 0.20166015625, 0.537109375, 0.87255859375, 1.2080078125, 1.54345703125, 1.87890625, 2.21435546875, 2.5498046875, 2.88525390625, 3.220703125, 3.55615234375, 3.8916015625, 4.22705078125, 4.5625, 4.89794921875, 5.2333984375, 5.56884765625, 5.904296875, 6.23974609375, 6.5751953125, 6.91064453125, 7.24609375, 7.58154296875, 7.9169921875, 8.25244140625, 8.587890625, 8.92333984375, 9.2587890625, 9.59423828125, 9.9296875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 13.0, 22.0, 29.0, 30.0, 46.0, 63.0, 100.0, 141.0, 202.0, 299.0, 422.0, 471.0, 515.0, 401.0, 385.0, 257.0, 203.0, 122.0, 95.0, 66.0, 43.0, 35.0, 27.0, 19.0, 18.0, 13.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62890625, -6.40301513671875, -6.1771240234375, -5.95123291015625, -5.725341796875, -5.49945068359375, -5.2735595703125, -5.04766845703125, -4.82177734375, -4.59588623046875, -4.3699951171875, -4.14410400390625, -3.918212890625, -3.69232177734375, -3.4664306640625, -3.24053955078125, -3.0146484375, -2.78875732421875, -2.5628662109375, -2.33697509765625, -2.111083984375, -1.88519287109375, -1.6593017578125, -1.43341064453125, -1.20751953125, -0.98162841796875, -0.7557373046875, -0.52984619140625, -0.303955078125, -0.07806396484375, 0.1478271484375, 0.37371826171875, 0.599609375, 0.82550048828125, 1.0513916015625, 1.27728271484375, 1.503173828125, 1.72906494140625, 1.9549560546875, 2.18084716796875, 2.40673828125, 2.63262939453125, 2.8585205078125, 3.08441162109375, 3.310302734375, 3.53619384765625, 3.7620849609375, 3.98797607421875, 4.2138671875, 4.43975830078125, 4.6656494140625, 4.89154052734375, 5.117431640625, 5.34332275390625, 5.5692138671875, 5.79510498046875, 6.02099609375, 6.24688720703125, 6.4727783203125, 6.69866943359375, 6.924560546875, 7.15045166015625, 7.3763427734375, 7.60223388671875, 7.828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 3.0, 15.0, 14.0, 14.0, 24.0, 35.0, 46.0, 52.0, 97.0, 123.0, 219.0, 317.0, 779.0, 13339.0, 3906639.0, 269558.0, 1808.0, 475.0, 233.0, 165.0, 89.0, 67.0, 54.0, 34.0, 26.0, 14.0, 15.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.306640625, -40.08203125, -38.857421875, -37.6328125, -36.408203125, -35.18359375, -33.958984375, -32.734375, -31.509765625, -30.28515625, -29.060546875, -27.8359375, -26.611328125, -25.38671875, -24.162109375, -22.9375, -21.712890625, -20.48828125, -19.263671875, -18.0390625, -16.814453125, -15.58984375, -14.365234375, -13.140625, -11.916015625, -10.69140625, -9.466796875, -8.2421875, -7.017578125, -5.79296875, -4.568359375, -3.34375, -2.119140625, -0.89453125, 0.330078125, 1.5546875, 2.779296875, 4.00390625, 5.228515625, 6.453125, 7.677734375, 8.90234375, 10.126953125, 11.3515625, 12.576171875, 13.80078125, 15.025390625, 16.25, 17.474609375, 18.69921875, 19.923828125, 21.1484375, 22.373046875, 23.59765625, 24.822265625, 26.046875, 27.271484375, 28.49609375, 29.720703125, 30.9453125, 32.169921875, 33.39453125, 34.619140625, 35.84375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 21.0, 44.0, 76.0, 83.0, 133.0, 143.0, 180.0, 131.0, 91.0, 53.0, 26.0, 15.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.183042526245117, -21.878612518310547, -20.574180603027344, -19.269750595092773, -17.965320587158203, -16.660890579223633, -15.356459617614746, -14.05202865600586, -12.747598648071289, -11.443168640136719, -10.138737678527832, -8.834306716918945, -7.529876708984375, -6.2254462242126465, -4.921015739440918, -3.6165847778320312, -2.312154769897461, -1.0077242851257324, 0.2967061996459961, 1.6011366844177246, 2.905567169189453, 4.209997653961182, 5.51442813873291, 6.818859100341797, 8.123289108276367, 9.427719116210938, 10.732150077819824, 12.036581039428711, 13.341011047363281, 14.645441055297852, 15.949872016906738, 17.254302978515625, 18.558734893798828, 19.8631649017334, 21.16759490966797, 22.472026824951172, 23.776456832885742, 25.080886840820312, 26.385318756103516, 27.689748764038086, 28.994178771972656, 30.298608779907227, 31.603038787841797, 32.907470703125, 34.21189880371094, 35.51633071899414, 36.820762634277344, 38.12519073486328, 39.429622650146484, 40.73405456542969, 42.038482666015625, 43.34291458129883, 44.64734649658203, 45.95177459716797, 47.25620651245117, 48.560638427734375, 49.86506652832031, 51.169498443603516, 52.47392654418945, 53.778358459472656, 55.082786560058594, 56.3872184753418, 57.691650390625, 58.99607849121094, 60.30051040649414]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 8.0, 9.0, 10.0, 8.0, 12.0, 10.0, 25.0, 15.0, 21.0, 11.0, 30.0, 20.0, 32.0, 29.0, 33.0, 47.0, 34.0, 47.0, 49.0, 48.0, 38.0, 54.0, 46.0, 37.0, 40.0, 38.0, 28.0, 36.0, 29.0, 28.0, 15.0, 18.0, 17.0, 12.0, 21.0, 9.0, 8.0, 8.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.20796012878418, -22.537710189819336, -21.867462158203125, -21.19721221923828, -20.526962280273438, -19.856712341308594, -19.186464309692383, -18.51621437072754, -17.845964431762695, -17.17571449279785, -16.50546646118164, -15.835216522216797, -15.164966583251953, -14.494717597961426, -13.824468612670898, -13.154218673706055, -12.483969688415527, -11.813720703125, -11.143470764160156, -10.473221778869629, -9.802971839904785, -9.132722854614258, -8.462472915649414, -7.792223930358887, -7.121974468231201, -6.451725006103516, -5.78147554397583, -5.1112260818481445, -4.440977096557617, -3.7707273960113525, -3.100478172302246, -2.4302287101745605, -1.759979248046875, -1.0897297859191895, -0.41948044300079346, 0.25076889991760254, 0.9210183620452881, 1.5912678241729736, 2.26151704788208, 2.9317665100097656, 3.602015972137451, 4.272265434265137, 4.942514896392822, 5.612764358520508, 6.283013343811035, 6.953263282775879, 7.623512268066406, 8.29376220703125, 8.964011192321777, 9.634260177612305, 10.304510116577148, 10.974759101867676, 11.64500904083252, 12.315258026123047, 12.98550796508789, 13.655756950378418, 14.326005935668945, 14.996254920959473, 15.666504859924316, 16.336753845214844, 17.007003784179688, 17.67725372314453, 18.347501754760742, 19.017751693725586, 19.68800163269043]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 10.0, 10.0, 12.0, 19.0, 21.0, 19.0, 23.0, 37.0, 40.0, 30.0, 39.0, 39.0, 27.0, 44.0, 44.0, 51.0, 45.0, 55.0, 44.0, 40.0, 45.0, 40.0, 39.0, 21.0, 36.0, 23.0, 25.0, 23.0, 20.0, 14.0, 15.0, 9.0, 11.0, 7.0, 8.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.444671630859375, -4.31121826171875, -4.177764892578125, -4.0443115234375, -3.910858154296875, -3.77740478515625, -3.643951416015625, -3.510498046875, -3.377044677734375, -3.24359130859375, -3.110137939453125, -2.9766845703125, -2.843231201171875, -2.70977783203125, -2.576324462890625, -2.44287109375, -2.309417724609375, -2.17596435546875, -2.042510986328125, -1.9090576171875, -1.775604248046875, -1.64215087890625, -1.508697509765625, -1.375244140625, -1.241790771484375, -1.10833740234375, -0.974884033203125, -0.8414306640625, -0.707977294921875, -0.57452392578125, -0.441070556640625, -0.3076171875, -0.174163818359375, -0.04071044921875, 0.092742919921875, 0.2261962890625, 0.359649658203125, 0.49310302734375, 0.626556396484375, 0.760009765625, 0.893463134765625, 1.02691650390625, 1.160369873046875, 1.2938232421875, 1.427276611328125, 1.56072998046875, 1.694183349609375, 1.82763671875, 1.961090087890625, 2.09454345703125, 2.227996826171875, 2.3614501953125, 2.494903564453125, 2.62835693359375, 2.761810302734375, 2.895263671875, 3.028717041015625, 3.16217041015625, 3.295623779296875, 3.4290771484375, 3.562530517578125, 3.69598388671875, 3.829437255859375, 3.962890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 8.0, 7.0, 12.0, 14.0, 22.0, 14.0, 43.0, 55.0, 81.0, 128.0, 195.0, 282.0, 448.0, 723.0, 1176.0, 2139.0, 3593.0, 6575.0, 12446.0, 23940.0, 45068.0, 82955.0, 139796.0, 197036.0, 200046.0, 144443.0, 85778.0, 47404.0, 24939.0, 12970.0, 7074.0, 3763.0, 2105.0, 1189.0, 744.0, 474.0, 278.0, 195.0, 123.0, 77.0, 67.0, 38.0, 33.0, 18.0, 9.0, 12.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.474853515625, -0.4595527648925781, -0.44425201416015625, -0.4289512634277344, -0.4136505126953125, -0.3983497619628906, -0.38304901123046875, -0.3677482604980469, -0.352447509765625, -0.3371467590332031, -0.32184600830078125, -0.3065452575683594, -0.2912445068359375, -0.2759437561035156, -0.26064300537109375, -0.24534225463867188, -0.23004150390625, -0.21474075317382812, -0.19944000244140625, -0.18413925170898438, -0.1688385009765625, -0.15353775024414062, -0.13823699951171875, -0.12293624877929688, -0.107635498046875, -0.09233474731445312, -0.07703399658203125, -0.061733245849609375, -0.0464324951171875, -0.031131744384765625, -0.01583099365234375, -0.000530242919921875, 0.0147705078125, 0.030071258544921875, 0.04537200927734375, 0.060672760009765625, 0.0759735107421875, 0.09127426147460938, 0.10657501220703125, 0.12187576293945312, 0.137176513671875, 0.15247726440429688, 0.16777801513671875, 0.18307876586914062, 0.1983795166015625, 0.21368026733398438, 0.22898101806640625, 0.24428176879882812, 0.25958251953125, 0.2748832702636719, 0.29018402099609375, 0.3054847717285156, 0.3207855224609375, 0.3360862731933594, 0.35138702392578125, 0.3666877746582031, 0.381988525390625, 0.3972892761230469, 0.41259002685546875, 0.4278907775878906, 0.4431915283203125, 0.4584922790527344, 0.47379302978515625, 0.4890937805175781, 0.50439453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 8.0, 12.0, 14.0, 11.0, 17.0, 20.0, 27.0, 19.0, 21.0, 26.0, 32.0, 27.0, 38.0, 37.0, 46.0, 39.0, 45.0, 40.0, 1058.0, 32.0, 37.0, 45.0, 28.0, 43.0, 31.0, 37.0, 29.0, 34.0, 22.0, 29.0, 14.0, 14.0, 9.0, 12.0, 9.0, 15.0, 9.0, 8.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.531982421875, -2.44482421875, -2.357666015625, -2.2705078125, -2.183349609375, -2.09619140625, -2.009033203125, -1.921875, -1.834716796875, -1.74755859375, -1.660400390625, -1.5732421875, -1.486083984375, -1.39892578125, -1.311767578125, -1.224609375, -1.137451171875, -1.05029296875, -0.963134765625, -0.8759765625, -0.788818359375, -0.70166015625, -0.614501953125, -0.52734375, -0.440185546875, -0.35302734375, -0.265869140625, -0.1787109375, -0.091552734375, -0.00439453125, 0.082763671875, 0.169921875, 0.257080078125, 0.34423828125, 0.431396484375, 0.5185546875, 0.605712890625, 0.69287109375, 0.780029296875, 0.8671875, 0.954345703125, 1.04150390625, 1.128662109375, 1.2158203125, 1.302978515625, 1.39013671875, 1.477294921875, 1.564453125, 1.651611328125, 1.73876953125, 1.825927734375, 1.9130859375, 2.000244140625, 2.08740234375, 2.174560546875, 2.26171875, 2.348876953125, 2.43603515625, 2.523193359375, 2.6103515625, 2.697509765625, 2.78466796875, 2.871826171875, 2.958984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 11.0, 18.0, 20.0, 27.0, 53.0, 63.0, 105.0, 160.0, 262.0, 430.0, 724.0, 1158.0, 2231.0, 4291.0, 8789.0, 19111.0, 44203.0, 98803.0, 200956.0, 1292774.0, 222702.0, 109484.0, 48907.0, 21555.0, 9585.0, 4676.0, 2512.0, 1377.0, 754.0, 485.0, 297.0, 196.0, 134.0, 98.0, 63.0, 39.0, 19.0, 11.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3356971740722656, -0.32471466064453125, -0.3137321472167969, -0.3027496337890625, -0.2917671203613281, -0.28078460693359375, -0.2698020935058594, -0.258819580078125, -0.24783706665039062, -0.23685455322265625, -0.22587203979492188, -0.2148895263671875, -0.20390701293945312, -0.19292449951171875, -0.18194198608398438, -0.17095947265625, -0.15997695922851562, -0.14899444580078125, -0.13801193237304688, -0.1270294189453125, -0.11604690551757812, -0.10506439208984375, -0.09408187866210938, -0.083099365234375, -0.07211685180664062, -0.06113433837890625, -0.050151824951171875, -0.0391693115234375, -0.028186798095703125, -0.01720428466796875, -0.006221771240234375, 0.0047607421875, 0.015743255615234375, 0.02672576904296875, 0.037708282470703125, 0.0486907958984375, 0.059673309326171875, 0.07065582275390625, 0.08163833618164062, 0.092620849609375, 0.10360336303710938, 0.11458587646484375, 0.12556838989257812, 0.1365509033203125, 0.14753341674804688, 0.15851593017578125, 0.16949844360351562, 0.18048095703125, 0.19146347045898438, 0.20244598388671875, 0.21342849731445312, 0.2244110107421875, 0.23539352416992188, 0.24637603759765625, 0.2573585510253906, 0.268341064453125, 0.2793235778808594, 0.29030609130859375, 0.3012886047363281, 0.3122711181640625, 0.3232536315917969, 0.33423614501953125, 0.3452186584472656, 0.356201171875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 3.0, 8.0, 7.0, 11.0, 6.0, 13.0, 12.0, 19.0, 17.0, 23.0, 33.0, 39.0, 49.0, 78.0, 70.0, 77.0, 66.0, 77.0, 72.0, 55.0, 55.0, 35.0, 27.0, 19.0, 19.0, 22.0, 10.0, 10.0, 10.0, 6.0, 8.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.04196357727050781, -0.040775299072265625, -0.03958702087402344, -0.03839874267578125, -0.03721046447753906, -0.036022186279296875, -0.03483390808105469, -0.0336456298828125, -0.03245735168457031, -0.031269073486328125, -0.030080795288085938, -0.02889251708984375, -0.027704238891601562, -0.026515960693359375, -0.025327682495117188, -0.024139404296875, -0.022951126098632812, -0.021762847900390625, -0.020574569702148438, -0.01938629150390625, -0.018198013305664062, -0.017009735107421875, -0.015821456909179688, -0.0146331787109375, -0.013444900512695312, -0.012256622314453125, -0.011068344116210938, -0.00988006591796875, -0.008691787719726562, -0.007503509521484375, -0.0063152313232421875, -0.005126953125, -0.0039386749267578125, -0.002750396728515625, -0.0015621185302734375, -0.00037384033203125, 0.0008144378662109375, 0.002002716064453125, 0.0031909942626953125, 0.0043792724609375, 0.0055675506591796875, 0.006755828857421875, 0.007944107055664062, 0.00913238525390625, 0.010320663452148438, 0.011508941650390625, 0.012697219848632812, 0.013885498046875, 0.015073776245117188, 0.016262054443359375, 0.017450332641601562, 0.01863861083984375, 0.019826889038085938, 0.021015167236328125, 0.022203445434570312, 0.0233917236328125, 0.024580001831054688, 0.025768280029296875, 0.026956558227539062, 0.02814483642578125, 0.029333114624023438, 0.030521392822265625, 0.03170967102050781, 0.03289794921875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 2.0, 6.0, 5.0, 4.0, 9.0, 15.0, 9.0, 19.0, 23.0, 27.0, 38.0, 36.0, 68.0, 121.0, 186.0, 491.0, 3762.0, 705268.0, 334373.0, 3005.0, 484.0, 195.0, 109.0, 66.0, 49.0, 32.0, 21.0, 28.0, 17.0, 11.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.7123489379882812, -0.6859283447265625, -0.6595077514648438, -0.633087158203125, -0.6066665649414062, -0.5802459716796875, -0.5538253784179688, -0.52740478515625, -0.5009841918945312, -0.4745635986328125, -0.44814300537109375, -0.421722412109375, -0.39530181884765625, -0.3688812255859375, -0.34246063232421875, -0.3160400390625, -0.28961944580078125, -0.2631988525390625, -0.23677825927734375, -0.210357666015625, -0.18393707275390625, -0.1575164794921875, -0.13109588623046875, -0.10467529296875, -0.07825469970703125, -0.0518341064453125, -0.02541351318359375, 0.001007080078125, 0.02742767333984375, 0.0538482666015625, 0.08026885986328125, 0.106689453125, 0.13311004638671875, 0.1595306396484375, 0.18595123291015625, 0.212371826171875, 0.23879241943359375, 0.2652130126953125, 0.29163360595703125, 0.31805419921875, 0.34447479248046875, 0.3708953857421875, 0.39731597900390625, 0.423736572265625, 0.45015716552734375, 0.4765777587890625, 0.5029983520507812, 0.5294189453125, 0.5558395385742188, 0.5822601318359375, 0.6086807250976562, 0.635101318359375, 0.6615219116210938, 0.6879425048828125, 0.7143630981445312, 0.74078369140625, 0.7672042846679688, 0.7936248779296875, 0.8200454711914062, 0.846466064453125, 0.8728866577148438, 0.8993072509765625, 0.9257278442382812, 0.9521484375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 12.0, 25.0, 63.0, 175.0, 427.0, 233.0, 46.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12484331429004669, -0.11492905765771866, -0.10501480102539062, -0.09510055184364319, -0.08518628776073456, -0.07527203857898712, -0.06535778194665909, -0.055443525314331055, -0.04552926868200302, -0.03561501204967499, -0.025700757279992104, -0.01578650251030922, -0.005872245877981186, 0.0040420107543468475, 0.013956263661384583, 0.023870520293712616, 0.03378477692604065, 0.04369903355836868, 0.053613290190696716, 0.06352753937244415, 0.07344180345535278, 0.08335605263710022, 0.09327030926942825, 0.10318456590175629, 0.11309882253408432, 0.12301307916641235, 0.1329273283481598, 0.14284159243106842, 0.15275584161281586, 0.1626701056957245, 0.17258435487747192, 0.18249860405921936, 0.19241288304328918, 0.20232713222503662, 0.21224139630794525, 0.2221556454896927, 0.23206990957260132, 0.24198415875434875, 0.2518984079360962, 0.261812686920166, 0.27172693610191345, 0.2816411852836609, 0.2915554344654083, 0.30146971344947815, 0.3113839626312256, 0.321298211812973, 0.33121246099472046, 0.3411267399787903, 0.35104095935821533, 0.36095520853996277, 0.3708694577217102, 0.38078373670578003, 0.39069798588752747, 0.4006122350692749, 0.41052648425102234, 0.4204407334327698, 0.4303550124168396, 0.44026926159858704, 0.4501835107803345, 0.4600977897644043, 0.47001203894615173, 0.47992628812789917, 0.4898405373096466, 0.49975478649139404, 0.5096690654754639]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 6.0, 7.0, 10.0, 12.0, 17.0, 10.0, 14.0, 24.0, 23.0, 28.0, 33.0, 41.0, 16.0, 29.0, 34.0, 31.0, 29.0, 36.0, 32.0, 36.0, 39.0, 43.0, 36.0, 49.0, 34.0, 46.0, 32.0, 20.0, 33.0, 24.0, 27.0, 24.0, 16.0, 25.0, 12.0, 12.0, 9.0, 6.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.03079885244369507, -0.029816828668117523, -0.028834804892539978, -0.027852781116962433, -0.026870757341384888, -0.025888733565807343, -0.024906709790229797, -0.023924686014652252, -0.022942662239074707, -0.021960638463497162, -0.020978614687919617, -0.01999659091234207, -0.019014567136764526, -0.01803254336118698, -0.017050519585609436, -0.01606849581003189, -0.015086472034454346, -0.0141044482588768, -0.013122424483299255, -0.01214040070772171, -0.011158376932144165, -0.01017635315656662, -0.009194329380989075, -0.00821230560541153, -0.007230281829833984, -0.006248258054256439, -0.005266234278678894, -0.004284210503101349, -0.0033021867275238037, -0.0023201629519462585, -0.0013381391763687134, -0.0003561154007911682, 0.000625908374786377, 0.0016079321503639221, 0.0025899559259414673, 0.0035719797015190125, 0.004554003477096558, 0.005536027252674103, 0.006518051028251648, 0.007500074803829193, 0.008482098579406738, 0.009464122354984283, 0.010446146130561829, 0.011428169906139374, 0.012410193681716919, 0.013392217457294464, 0.01437424123287201, 0.015356265008449554, 0.0163382887840271, 0.017320312559604645, 0.01830233633518219, 0.019284360110759735, 0.02026638388633728, 0.021248407661914825, 0.02223043143749237, 0.023212455213069916, 0.02419447898864746, 0.025176502764225006, 0.02615852653980255, 0.027140550315380096, 0.02812257409095764, 0.029104597866535187, 0.030086621642112732, 0.031068645417690277, 0.03205066919326782]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 0.0, 6.0, 11.0, 10.0, 10.0, 12.0, 19.0, 18.0, 16.0, 25.0, 25.0, 26.0, 26.0, 33.0, 37.0, 34.0, 37.0, 32.0, 44.0, 42.0, 43.0, 34.0, 42.0, 45.0, 41.0, 39.0, 30.0, 24.0, 20.0, 34.0, 24.0, 26.0, 19.0, 15.0, 18.0, 14.0, 13.0, 11.0, 17.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.24798583984375, -3.1346435546875, -3.02130126953125, -2.907958984375, -2.79461669921875, -2.6812744140625, -2.56793212890625, -2.45458984375, -2.34124755859375, -2.2279052734375, -2.11456298828125, -2.001220703125, -1.88787841796875, -1.7745361328125, -1.66119384765625, -1.5478515625, -1.43450927734375, -1.3211669921875, -1.20782470703125, -1.094482421875, -0.98114013671875, -0.8677978515625, -0.75445556640625, -0.64111328125, -0.52777099609375, -0.4144287109375, -0.30108642578125, -0.187744140625, -0.07440185546875, 0.0389404296875, 0.15228271484375, 0.265625, 0.37896728515625, 0.4923095703125, 0.60565185546875, 0.718994140625, 0.83233642578125, 0.9456787109375, 1.05902099609375, 1.17236328125, 1.28570556640625, 1.3990478515625, 1.51239013671875, 1.625732421875, 1.73907470703125, 1.8524169921875, 1.96575927734375, 2.0791015625, 2.19244384765625, 2.3057861328125, 2.41912841796875, 2.532470703125, 2.64581298828125, 2.7591552734375, 2.87249755859375, 2.98583984375, 3.09918212890625, 3.2125244140625, 3.32586669921875, 3.439208984375, 3.55255126953125, 3.6658935546875, 3.77923583984375, 3.892578125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 9.0, 11.0, 15.0, 15.0, 16.0, 21.0, 18.0, 21.0, 39.0, 51.0, 90.0, 153.0, 258.0, 643.0, 1539.0, 4220.0, 11755.0, 33157.0, 92250.0, 269935.0, 409540.0, 143920.0, 51782.0, 18345.0, 6602.0, 2316.0, 891.0, 363.0, 199.0, 86.0, 59.0, 53.0, 37.0, 34.0, 19.0, 15.0, 10.0, 16.0, 15.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.76654052734375, -4.6033935546875, -4.44024658203125, -4.277099609375, -4.11395263671875, -3.9508056640625, -3.78765869140625, -3.62451171875, -3.46136474609375, -3.2982177734375, -3.13507080078125, -2.971923828125, -2.80877685546875, -2.6456298828125, -2.48248291015625, -2.3193359375, -2.15618896484375, -1.9930419921875, -1.82989501953125, -1.666748046875, -1.50360107421875, -1.3404541015625, -1.17730712890625, -1.01416015625, -0.85101318359375, -0.6878662109375, -0.52471923828125, -0.361572265625, -0.19842529296875, -0.0352783203125, 0.12786865234375, 0.291015625, 0.45416259765625, 0.6173095703125, 0.78045654296875, 0.943603515625, 1.10675048828125, 1.2698974609375, 1.43304443359375, 1.59619140625, 1.75933837890625, 1.9224853515625, 2.08563232421875, 2.248779296875, 2.41192626953125, 2.5750732421875, 2.73822021484375, 2.9013671875, 3.06451416015625, 3.2276611328125, 3.39080810546875, 3.553955078125, 3.71710205078125, 3.8802490234375, 4.04339599609375, 4.20654296875, 4.36968994140625, 4.5328369140625, 4.69598388671875, 4.859130859375, 5.02227783203125, 5.1854248046875, 5.34857177734375, 5.51171875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 4.0, 5.0, 2.0, 6.0, 7.0, 9.0, 8.0, 13.0, 8.0, 14.0, 19.0, 21.0, 33.0, 27.0, 40.0, 25.0, 41.0, 32.0, 54.0, 64.0, 139.0, 215.0, 1385.0, 254.0, 133.0, 82.0, 62.0, 45.0, 33.0, 41.0, 31.0, 26.0, 36.0, 25.0, 20.0, 13.0, 18.0, 12.0, 8.0, 5.0, 6.0, 6.0, 6.0, 9.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.15625, -7.8385009765625, -7.520751953125, -7.2030029296875, -6.88525390625, -6.5675048828125, -6.249755859375, -5.9320068359375, -5.6142578125, -5.2965087890625, -4.978759765625, -4.6610107421875, -4.34326171875, -4.0255126953125, -3.707763671875, -3.3900146484375, -3.072265625, -2.7545166015625, -2.436767578125, -2.1190185546875, -1.80126953125, -1.4835205078125, -1.165771484375, -0.8480224609375, -0.5302734375, -0.2125244140625, 0.105224609375, 0.4229736328125, 0.74072265625, 1.0584716796875, 1.376220703125, 1.6939697265625, 2.01171875, 2.3294677734375, 2.647216796875, 2.9649658203125, 3.28271484375, 3.6004638671875, 3.918212890625, 4.2359619140625, 4.5537109375, 4.8714599609375, 5.189208984375, 5.5069580078125, 5.82470703125, 6.1424560546875, 6.460205078125, 6.7779541015625, 7.095703125, 7.4134521484375, 7.731201171875, 8.0489501953125, 8.36669921875, 8.6844482421875, 9.002197265625, 9.3199462890625, 9.6376953125, 9.9554443359375, 10.273193359375, 10.5909423828125, 10.90869140625, 11.2264404296875, 11.544189453125, 11.8619384765625, 12.1796875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 3.0, 8.0, 6.0, 4.0, 6.0, 15.0, 19.0, 21.0, 18.0, 27.0, 39.0, 44.0, 61.0, 78.0, 97.0, 135.0, 189.0, 302.0, 643.0, 2312.0, 41139.0, 2901967.0, 192334.0, 4138.0, 896.0, 365.0, 224.0, 132.0, 122.0, 62.0, 54.0, 48.0, 40.0, 29.0, 23.0, 20.0, 14.0, 12.0, 11.0, 8.0, 8.0, 4.0, 7.0, 3.0, 5.0, 4.0, 2.0, 4.0, 1.0], "bins": [-25.796875, -25.093017578125, -24.38916015625, -23.685302734375, -22.9814453125, -22.277587890625, -21.57373046875, -20.869873046875, -20.166015625, -19.462158203125, -18.75830078125, -18.054443359375, -17.3505859375, -16.646728515625, -15.94287109375, -15.239013671875, -14.53515625, -13.831298828125, -13.12744140625, -12.423583984375, -11.7197265625, -11.015869140625, -10.31201171875, -9.608154296875, -8.904296875, -8.200439453125, -7.49658203125, -6.792724609375, -6.0888671875, -5.385009765625, -4.68115234375, -3.977294921875, -3.2734375, -2.569580078125, -1.86572265625, -1.161865234375, -0.4580078125, 0.245849609375, 0.94970703125, 1.653564453125, 2.357421875, 3.061279296875, 3.76513671875, 4.468994140625, 5.1728515625, 5.876708984375, 6.58056640625, 7.284423828125, 7.98828125, 8.692138671875, 9.39599609375, 10.099853515625, 10.8037109375, 11.507568359375, 12.21142578125, 12.915283203125, 13.619140625, 14.322998046875, 15.02685546875, 15.730712890625, 16.4345703125, 17.138427734375, 17.84228515625, 18.546142578125, 19.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 65.0, 889.0, 64.0], "bins": [-323.33575439453125, -318.1600646972656, -312.984375, -307.8086853027344, -302.63299560546875, -297.457275390625, -292.2815856933594, -287.10589599609375, -281.9302062988281, -276.7545166015625, -271.5788269042969, -266.40313720703125, -261.2274475097656, -256.0517578125, -250.8760528564453, -245.7003631591797, -240.52467346191406, -235.34898376464844, -230.1732940673828, -224.99758911132812, -219.8218994140625, -214.64620971679688, -209.47052001953125, -204.29483032226562, -199.119140625, -193.94345092773438, -188.76776123046875, -183.59205627441406, -178.41636657714844, -173.2406768798828, -168.0649871826172, -162.88929748535156, -157.7135772705078, -152.5378875732422, -147.36219787597656, -142.18649291992188, -137.01080322265625, -131.83511352539062, -126.659423828125, -121.48373413085938, -116.30803680419922, -111.1323471069336, -105.95664978027344, -100.78096008300781, -95.60527038574219, -90.42957305908203, -85.2538833618164, -80.07818603515625, -74.90249633789062, -69.726806640625, -64.55110931396484, -59.37541961669922, -54.19972610473633, -49.02403259277344, -43.84834289550781, -38.67264938354492, -33.49695587158203, -28.32126235961914, -23.145570755004883, -17.969879150390625, -12.794185638427734, -7.618492126464844, -2.442800521850586, 2.732891082763672, 7.908584117889404]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 4.0, 8.0, 5.0, 9.0, 15.0, 13.0, 12.0, 18.0, 31.0, 24.0, 22.0, 28.0, 29.0, 37.0, 32.0, 33.0, 29.0, 43.0, 26.0, 34.0, 47.0, 51.0, 39.0, 45.0, 39.0, 42.0, 23.0, 33.0, 32.0, 33.0, 22.0, 25.0, 20.0, 21.0, 16.0, 11.0, 9.0, 7.0, 5.0, 6.0, 7.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.113819122314453, -29.2221622467041, -28.33050537109375, -27.438846588134766, -26.547189712524414, -25.655532836914062, -24.76387596130371, -23.87221908569336, -22.980560302734375, -22.088903427124023, -21.197246551513672, -20.305587768554688, -19.413930892944336, -18.522274017333984, -17.630617141723633, -16.73896026611328, -15.847302436828613, -14.955645561218262, -14.063987731933594, -13.172330856323242, -12.280673027038574, -11.389016151428223, -10.497358322143555, -9.605701446533203, -8.714044570922852, -7.822387218475342, -6.930729866027832, -6.0390729904174805, -5.1474151611328125, -4.255758285522461, -3.364100933074951, -2.4724435806274414, -1.5807857513427734, -0.6891284584999084, 0.20252883434295654, 1.0941860675811768, 1.9858434200286865, 2.877500534057617, 3.769157886505127, 4.660815238952637, 5.5524725914001465, 6.444129943847656, 7.335787296295166, 8.227444648742676, 9.119101524353027, 10.010759353637695, 10.902416229248047, 11.794073104858398, 12.685730934143066, 13.577387809753418, 14.469045639038086, 15.360702514648438, 16.25235939025879, 17.14401626586914, 18.035675048828125, 18.927331924438477, 19.818988800048828, 20.71064567565918, 21.60230255126953, 22.493961334228516, 23.385618209838867, 24.27727508544922, 25.16893196105957, 26.060588836669922, 26.952247619628906]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 11.0, 6.0, 15.0, 12.0, 12.0, 17.0, 10.0, 13.0, 17.0, 20.0, 33.0, 27.0, 38.0, 21.0, 28.0, 30.0, 38.0, 36.0, 31.0, 38.0, 49.0, 33.0, 37.0, 34.0, 41.0, 33.0, 33.0, 26.0, 22.0, 27.0, 29.0, 27.0, 25.0, 15.0, 20.0, 13.0, 12.0, 8.0, 9.0, 9.0, 8.0, 10.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.31640625, -3.205047607421875, -3.09368896484375, -2.982330322265625, -2.8709716796875, -2.759613037109375, -2.64825439453125, -2.536895751953125, -2.425537109375, -2.314178466796875, -2.20281982421875, -2.091461181640625, -1.9801025390625, -1.868743896484375, -1.75738525390625, -1.646026611328125, -1.53466796875, -1.423309326171875, -1.31195068359375, -1.200592041015625, -1.0892333984375, -0.977874755859375, -0.86651611328125, -0.755157470703125, -0.643798828125, -0.532440185546875, -0.42108154296875, -0.309722900390625, -0.1983642578125, -0.087005615234375, 0.02435302734375, 0.135711669921875, 0.2470703125, 0.358428955078125, 0.46978759765625, 0.581146240234375, 0.6925048828125, 0.803863525390625, 0.91522216796875, 1.026580810546875, 1.137939453125, 1.249298095703125, 1.36065673828125, 1.472015380859375, 1.5833740234375, 1.694732666015625, 1.80609130859375, 1.917449951171875, 2.02880859375, 2.140167236328125, 2.25152587890625, 2.362884521484375, 2.4742431640625, 2.585601806640625, 2.69696044921875, 2.808319091796875, 2.919677734375, 3.031036376953125, 3.14239501953125, 3.253753662109375, 3.3651123046875, 3.476470947265625, 3.58782958984375, 3.699188232421875, 3.810546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 10.0, 17.0, 36.0, 42.0, 46.0, 57.0, 78.0, 115.0, 162.0, 310.0, 414.0, 694.0, 1333.0, 2919.0, 7257.0, 21183.0, 70347.0, 237554.0, 707150.0, 1408628.0, 1106873.0, 435767.0, 132985.0, 38769.0, 12451.0, 4446.0, 1984.0, 969.0, 540.0, 339.0, 213.0, 156.0, 110.0, 77.0, 52.0, 39.0, 40.0, 22.0, 27.0, 17.0, 4.0, 7.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.17388916015625, -4.0235595703125, -3.87322998046875, -3.722900390625, -3.57257080078125, -3.4222412109375, -3.27191162109375, -3.12158203125, -2.97125244140625, -2.8209228515625, -2.67059326171875, -2.520263671875, -2.36993408203125, -2.2196044921875, -2.06927490234375, -1.9189453125, -1.76861572265625, -1.6182861328125, -1.46795654296875, -1.317626953125, -1.16729736328125, -1.0169677734375, -0.86663818359375, -0.71630859375, -0.56597900390625, -0.4156494140625, -0.26531982421875, -0.114990234375, 0.03533935546875, 0.1856689453125, 0.33599853515625, 0.486328125, 0.63665771484375, 0.7869873046875, 0.93731689453125, 1.087646484375, 1.23797607421875, 1.3883056640625, 1.53863525390625, 1.68896484375, 1.83929443359375, 1.9896240234375, 2.13995361328125, 2.290283203125, 2.44061279296875, 2.5909423828125, 2.74127197265625, 2.8916015625, 3.04193115234375, 3.1922607421875, 3.34259033203125, 3.492919921875, 3.64324951171875, 3.7935791015625, 3.94390869140625, 4.09423828125, 4.24456787109375, 4.3948974609375, 4.54522705078125, 4.695556640625, 4.84588623046875, 4.9962158203125, 5.14654541015625, 5.296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 15.0, 8.0, 5.0, 14.0, 20.0, 26.0, 42.0, 52.0, 71.0, 92.0, 135.0, 175.0, 215.0, 278.0, 320.0, 445.0, 479.0, 405.0, 289.0, 271.0, 207.0, 143.0, 94.0, 66.0, 54.0, 36.0, 28.0, 27.0, 13.0, 14.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.4620361328125, -6.248291015625, -6.0345458984375, -5.82080078125, -5.6070556640625, -5.393310546875, -5.1795654296875, -4.9658203125, -4.7520751953125, -4.538330078125, -4.3245849609375, -4.11083984375, -3.8970947265625, -3.683349609375, -3.4696044921875, -3.255859375, -3.0421142578125, -2.828369140625, -2.6146240234375, -2.40087890625, -2.1871337890625, -1.973388671875, -1.7596435546875, -1.5458984375, -1.3321533203125, -1.118408203125, -0.9046630859375, -0.69091796875, -0.4771728515625, -0.263427734375, -0.0496826171875, 0.1640625, 0.3778076171875, 0.591552734375, 0.8052978515625, 1.01904296875, 1.2327880859375, 1.446533203125, 1.6602783203125, 1.8740234375, 2.0877685546875, 2.301513671875, 2.5152587890625, 2.72900390625, 2.9427490234375, 3.156494140625, 3.3702392578125, 3.583984375, 3.7977294921875, 4.011474609375, 4.2252197265625, 4.43896484375, 4.6527099609375, 4.866455078125, 5.0802001953125, 5.2939453125, 5.5076904296875, 5.721435546875, 5.9351806640625, 6.14892578125, 6.3626708984375, 6.576416015625, 6.7901611328125, 7.00390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 15.0, 24.0, 24.0, 36.0, 43.0, 85.0, 109.0, 197.0, 333.0, 608.0, 1599.0, 12819.0, 1191056.0, 2952641.0, 30588.0, 2276.0, 730.0, 380.0, 232.0, 136.0, 91.0, 70.0, 37.0, 35.0, 33.0, 9.0, 8.0, 9.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.3125, -25.51806640625, -24.7236328125, -23.92919921875, -23.134765625, -22.34033203125, -21.5458984375, -20.75146484375, -19.95703125, -19.16259765625, -18.3681640625, -17.57373046875, -16.779296875, -15.98486328125, -15.1904296875, -14.39599609375, -13.6015625, -12.80712890625, -12.0126953125, -11.21826171875, -10.423828125, -9.62939453125, -8.8349609375, -8.04052734375, -7.24609375, -6.45166015625, -5.6572265625, -4.86279296875, -4.068359375, -3.27392578125, -2.4794921875, -1.68505859375, -0.890625, -0.09619140625, 0.6982421875, 1.49267578125, 2.287109375, 3.08154296875, 3.8759765625, 4.67041015625, 5.46484375, 6.25927734375, 7.0537109375, 7.84814453125, 8.642578125, 9.43701171875, 10.2314453125, 11.02587890625, 11.8203125, 12.61474609375, 13.4091796875, 14.20361328125, 14.998046875, 15.79248046875, 16.5869140625, 17.38134765625, 18.17578125, 18.97021484375, 19.7646484375, 20.55908203125, 21.353515625, 22.14794921875, 22.9423828125, 23.73681640625, 24.53125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 105.0, 462.0, 377.0, 63.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-235.35316467285156, -230.33905029296875, -225.32492065429688, -220.31080627441406, -215.29669189453125, -210.28256225585938, -205.26844787597656, -200.25433349609375, -195.24020385742188, -190.22608947753906, -185.2119598388672, -180.19784545898438, -175.1837158203125, -170.1696014404297, -165.15548706054688, -160.141357421875, -155.1272430419922, -150.11312866210938, -145.0989990234375, -140.0848846435547, -135.07077026367188, -130.056640625, -125.04252624511719, -120.02840423583984, -115.0142822265625, -110.00016021728516, -104.98603820800781, -99.971923828125, -94.95780181884766, -89.94367980957031, -84.9295654296875, -79.91544342041016, -74.90131378173828, -69.88719177246094, -64.87307739257812, -59.85895538330078, -54.84483337402344, -49.830711364746094, -44.816593170166016, -39.80247497558594, -34.788352966308594, -29.774232864379883, -24.760112762451172, -19.74599266052246, -14.73187255859375, -9.717752456665039, -4.703632354736328, 0.31048583984375, 5.324607849121094, 10.338727951049805, 15.352848052978516, 20.366968154907227, 25.381088256835938, 30.39520835876465, 35.40932846069336, 40.42344665527344, 45.43756866455078, 50.451690673828125, 55.4658088684082, 60.47992706298828, 65.49404907226562, 70.50817108154297, 75.52229309082031, 80.53640747070312, 85.55052947998047]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 7.0, 10.0, 13.0, 16.0, 14.0, 10.0, 14.0, 28.0, 20.0, 18.0, 28.0, 31.0, 35.0, 41.0, 40.0, 43.0, 44.0, 36.0, 36.0, 44.0, 47.0, 36.0, 52.0, 43.0, 32.0, 44.0, 37.0, 30.0, 22.0, 20.0, 11.0, 16.0, 19.0, 20.0, 15.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.607772827148438, -20.85639190673828, -20.105012893676758, -19.3536319732666, -18.602252960205078, -17.850872039794922, -17.099491119384766, -16.348112106323242, -15.596731185913086, -14.845351219177246, -14.093971252441406, -13.34259033203125, -12.59121036529541, -11.83983039855957, -11.08845043182373, -10.33707046508789, -9.58569049835205, -8.834310531616211, -8.082930564880371, -7.331550121307373, -6.580169677734375, -5.828789710998535, -5.077409744262695, -4.326029300689697, -3.5746493339538574, -2.8232691287994385, -2.0718889236450195, -1.3205089569091797, -0.5691287517547607, 0.1822514533996582, 0.933631420135498, 1.685011863708496, 2.436391830444336, 3.187772035598755, 3.939152240753174, 4.690532207489014, 5.441912651062012, 6.193292617797852, 6.944672584533691, 7.6960530281066895, 8.447433471679688, 9.198813438415527, 9.950193405151367, 10.701574325561523, 11.452954292297363, 12.204334259033203, 12.955714225769043, 13.707094192504883, 14.458474159240723, 15.209854125976562, 15.961234092712402, 16.712614059448242, 17.4639949798584, 18.215373992919922, 18.966754913330078, 19.718135833740234, 20.469514846801758, 21.220895767211914, 21.972274780273438, 22.723655700683594, 23.475034713745117, 24.226415634155273, 24.977794647216797, 25.729175567626953, 26.48055648803711]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 13.0, 7.0, 9.0, 14.0, 18.0, 13.0, 22.0, 32.0, 20.0, 32.0, 36.0, 28.0, 30.0, 40.0, 41.0, 30.0, 49.0, 47.0, 36.0, 43.0, 48.0, 27.0, 44.0, 31.0, 36.0, 31.0, 16.0, 21.0, 24.0, 15.0, 21.0, 15.0, 9.0, 14.0, 12.0, 12.0, 6.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0], "bins": [-4.15625, -4.040740966796875, -3.92523193359375, -3.809722900390625, -3.6942138671875, -3.578704833984375, -3.46319580078125, -3.347686767578125, -3.232177734375, -3.116668701171875, -3.00115966796875, -2.885650634765625, -2.7701416015625, -2.654632568359375, -2.53912353515625, -2.423614501953125, -2.30810546875, -2.192596435546875, -2.07708740234375, -1.961578369140625, -1.8460693359375, -1.730560302734375, -1.61505126953125, -1.499542236328125, -1.384033203125, -1.268524169921875, -1.15301513671875, -1.037506103515625, -0.9219970703125, -0.806488037109375, -0.69097900390625, -0.575469970703125, -0.4599609375, -0.344451904296875, -0.22894287109375, -0.113433837890625, 0.0020751953125, 0.117584228515625, 0.23309326171875, 0.348602294921875, 0.464111328125, 0.579620361328125, 0.69512939453125, 0.810638427734375, 0.9261474609375, 1.041656494140625, 1.15716552734375, 1.272674560546875, 1.38818359375, 1.503692626953125, 1.61920166015625, 1.734710693359375, 1.8502197265625, 1.965728759765625, 2.08123779296875, 2.196746826171875, 2.312255859375, 2.427764892578125, 2.54327392578125, 2.658782958984375, 2.7742919921875, 2.889801025390625, 3.00531005859375, 3.120819091796875, 3.236328125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 25.0, 32.0, 52.0, 127.0, 186.0, 302.0, 517.0, 862.0, 1482.0, 2296.0, 3923.0, 6503.0, 10334.0, 16260.0, 25523.0, 39262.0, 59046.0, 84427.0, 111906.0, 135530.0, 140722.0, 120558.0, 94373.0, 67917.0, 45652.0, 29759.0, 19142.0, 12186.0, 7651.0, 4696.0, 2817.0, 1724.0, 1086.0, 675.0, 424.0, 221.0, 148.0, 87.0, 56.0, 22.0, 11.0, 12.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.31212615966796875, -0.3027191162109375, -0.29331207275390625, -0.283905029296875, -0.27449798583984375, -0.2650909423828125, -0.25568389892578125, -0.24627685546875, -0.23686981201171875, -0.2274627685546875, -0.21805572509765625, -0.208648681640625, -0.19924163818359375, -0.1898345947265625, -0.18042755126953125, -0.1710205078125, -0.16161346435546875, -0.1522064208984375, -0.14279937744140625, -0.133392333984375, -0.12398529052734375, -0.1145782470703125, -0.10517120361328125, -0.09576416015625, -0.08635711669921875, -0.0769500732421875, -0.06754302978515625, -0.058135986328125, -0.04872894287109375, -0.0393218994140625, -0.02991485595703125, -0.0205078125, -0.01110076904296875, -0.0016937255859375, 0.00771331787109375, 0.017120361328125, 0.02652740478515625, 0.0359344482421875, 0.04534149169921875, 0.05474853515625, 0.06415557861328125, 0.0735626220703125, 0.08296966552734375, 0.092376708984375, 0.10178375244140625, 0.1111907958984375, 0.12059783935546875, 0.1300048828125, 0.13941192626953125, 0.1488189697265625, 0.15822601318359375, 0.167633056640625, 0.17704010009765625, 0.1864471435546875, 0.19585418701171875, 0.20526123046875, 0.21466827392578125, 0.2240753173828125, 0.23348236083984375, 0.242889404296875, 0.25229644775390625, 0.2617034912109375, 0.27111053466796875, 0.280517578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 5.0, 6.0, 17.0, 8.0, 16.0, 16.0, 25.0, 14.0, 17.0, 28.0, 28.0, 22.0, 30.0, 31.0, 35.0, 48.0, 30.0, 47.0, 41.0, 1065.0, 32.0, 46.0, 40.0, 39.0, 29.0, 25.0, 38.0, 35.0, 30.0, 26.0, 15.0, 29.0, 17.0, 17.0, 13.0, 11.0, 13.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.162109375, -3.070709228515625, -2.97930908203125, -2.887908935546875, -2.7965087890625, -2.705108642578125, -2.61370849609375, -2.522308349609375, -2.430908203125, -2.339508056640625, -2.24810791015625, -2.156707763671875, -2.0653076171875, -1.973907470703125, -1.88250732421875, -1.791107177734375, -1.69970703125, -1.608306884765625, -1.51690673828125, -1.425506591796875, -1.3341064453125, -1.242706298828125, -1.15130615234375, -1.059906005859375, -0.968505859375, -0.877105712890625, -0.78570556640625, -0.694305419921875, -0.6029052734375, -0.511505126953125, -0.42010498046875, -0.328704833984375, -0.2373046875, -0.145904541015625, -0.05450439453125, 0.036895751953125, 0.1282958984375, 0.219696044921875, 0.31109619140625, 0.402496337890625, 0.493896484375, 0.585296630859375, 0.67669677734375, 0.768096923828125, 0.8594970703125, 0.950897216796875, 1.04229736328125, 1.133697509765625, 1.22509765625, 1.316497802734375, 1.40789794921875, 1.499298095703125, 1.5906982421875, 1.682098388671875, 1.77349853515625, 1.864898681640625, 1.956298828125, 2.047698974609375, 2.13909912109375, 2.230499267578125, 2.3218994140625, 2.413299560546875, 2.50469970703125, 2.596099853515625, 2.6875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 13.0, 18.0, 16.0, 27.0, 36.0, 76.0, 83.0, 142.0, 265.0, 421.0, 777.0, 1399.0, 2345.0, 4267.0, 7779.0, 13857.0, 24883.0, 43272.0, 72537.0, 112819.0, 175379.0, 1189644.0, 169496.0, 110262.0, 70196.0, 42245.0, 23856.0, 13678.0, 7738.0, 4168.0, 2352.0, 1336.0, 731.0, 413.0, 234.0, 134.0, 79.0, 72.0, 40.0, 17.0, 12.0, 6.0, 9.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2437744140625, -0.237091064453125, -0.23040771484375, -0.223724365234375, -0.217041015625, -0.210357666015625, -0.20367431640625, -0.196990966796875, -0.1903076171875, -0.183624267578125, -0.17694091796875, -0.170257568359375, -0.16357421875, -0.156890869140625, -0.15020751953125, -0.143524169921875, -0.1368408203125, -0.130157470703125, -0.12347412109375, -0.116790771484375, -0.110107421875, -0.103424072265625, -0.09674072265625, -0.090057373046875, -0.0833740234375, -0.076690673828125, -0.07000732421875, -0.063323974609375, -0.056640625, -0.049957275390625, -0.04327392578125, -0.036590576171875, -0.0299072265625, -0.023223876953125, -0.01654052734375, -0.009857177734375, -0.003173828125, 0.003509521484375, 0.01019287109375, 0.016876220703125, 0.0235595703125, 0.030242919921875, 0.03692626953125, 0.043609619140625, 0.05029296875, 0.056976318359375, 0.06365966796875, 0.070343017578125, 0.0770263671875, 0.083709716796875, 0.09039306640625, 0.097076416015625, 0.103759765625, 0.110443115234375, 0.11712646484375, 0.123809814453125, 0.1304931640625, 0.137176513671875, 0.14385986328125, 0.150543212890625, 0.1572265625, 0.163909912109375, 0.17059326171875, 0.177276611328125, 0.1839599609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 9.0, 13.0, 20.0, 11.0, 25.0, 21.0, 29.0, 37.0, 37.0, 51.0, 56.0, 65.0, 63.0, 67.0, 59.0, 58.0, 50.0, 49.0, 49.0, 37.0, 43.0, 29.0, 12.0, 12.0, 14.0, 15.0, 4.0, 11.0, 8.0, 7.0, 7.0, 4.0, 6.0, 7.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03179931640625, -0.03076934814453125, -0.0297393798828125, -0.02870941162109375, -0.027679443359375, -0.02664947509765625, -0.0256195068359375, -0.02458953857421875, -0.0235595703125, -0.02252960205078125, -0.0214996337890625, -0.02046966552734375, -0.019439697265625, -0.01840972900390625, -0.0173797607421875, -0.01634979248046875, -0.01531982421875, -0.01428985595703125, -0.0132598876953125, -0.01222991943359375, -0.011199951171875, -0.01016998291015625, -0.0091400146484375, -0.00811004638671875, -0.007080078125, -0.00605010986328125, -0.0050201416015625, -0.00399017333984375, -0.002960205078125, -0.00193023681640625, -0.0009002685546875, 0.00012969970703125, 0.00115966796875, 0.00218963623046875, 0.0032196044921875, 0.00424957275390625, 0.005279541015625, 0.00630950927734375, 0.0073394775390625, 0.00836944580078125, 0.0093994140625, 0.01042938232421875, 0.0114593505859375, 0.01248931884765625, 0.013519287109375, 0.01454925537109375, 0.0155792236328125, 0.01660919189453125, 0.01763916015625, 0.01866912841796875, 0.0196990966796875, 0.02072906494140625, 0.021759033203125, 0.02278900146484375, 0.0238189697265625, 0.02484893798828125, 0.02587890625, 0.02690887451171875, 0.0279388427734375, 0.02896881103515625, 0.029998779296875, 0.03102874755859375, 0.0320587158203125, 0.03308868408203125, 0.03411865234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 5.0, 11.0, 5.0, 9.0, 7.0, 12.0, 18.0, 15.0, 15.0, 46.0, 49.0, 64.0, 93.0, 142.0, 318.0, 686.0, 29365.0, 1015422.0, 1280.0, 385.0, 180.0, 123.0, 73.0, 47.0, 41.0, 28.0, 21.0, 15.0, 21.0, 14.0, 8.0, 3.0, 7.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7841796875, -0.7605514526367188, -0.7369232177734375, -0.7132949829101562, -0.689666748046875, -0.6660385131835938, -0.6424102783203125, -0.6187820434570312, -0.59515380859375, -0.5715255737304688, -0.5478973388671875, -0.5242691040039062, -0.500640869140625, -0.47701263427734375, -0.4533843994140625, -0.42975616455078125, -0.4061279296875, -0.38249969482421875, -0.3588714599609375, -0.33524322509765625, -0.311614990234375, -0.28798675537109375, -0.2643585205078125, -0.24073028564453125, -0.21710205078125, -0.19347381591796875, -0.1698455810546875, -0.14621734619140625, -0.122589111328125, -0.09896087646484375, -0.0753326416015625, -0.05170440673828125, -0.028076171875, -0.00444793701171875, 0.0191802978515625, 0.04280853271484375, 0.066436767578125, 0.09006500244140625, 0.1136932373046875, 0.13732147216796875, 0.16094970703125, 0.18457794189453125, 0.2082061767578125, 0.23183441162109375, 0.255462646484375, 0.27909088134765625, 0.3027191162109375, 0.32634735107421875, 0.3499755859375, 0.37360382080078125, 0.3972320556640625, 0.42086029052734375, 0.444488525390625, 0.46811676025390625, 0.4917449951171875, 0.5153732299804688, 0.53900146484375, 0.5626296997070312, 0.5862579345703125, 0.6098861694335938, 0.633514404296875, 0.6571426391601562, 0.6807708740234375, 0.7043991088867188, 0.72802734375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 14.0, 78.0, 508.0, 346.0, 46.0, 12.0, 8.0], "bins": [-0.3658084273338318, -0.35969600081443787, -0.35358357429504395, -0.34747111797332764, -0.3413586914539337, -0.3352462649345398, -0.3291338384151459, -0.32302141189575195, -0.31690898537635803, -0.3107965588569641, -0.3046841323375702, -0.29857170581817627, -0.29245924949645996, -0.28634682297706604, -0.2802343964576721, -0.2741219699382782, -0.2680095434188843, -0.26189711689949036, -0.25578469038009644, -0.24967224895954132, -0.2435598224401474, -0.23744738101959229, -0.23133495450019836, -0.22522252798080444, -0.21911007165908813, -0.2129976451396942, -0.2068852037191391, -0.20077277719974518, -0.19466035068035126, -0.18854790925979614, -0.18243548274040222, -0.1763230562210083, -0.17021061480045319, -0.16409818828105927, -0.15798574686050415, -0.15187332034111023, -0.1457608938217163, -0.1396484673023224, -0.13353602588176727, -0.12742359936237335, -0.12131116539239883, -0.11519873142242432, -0.1090863049030304, -0.10297387093305588, -0.09686143696308136, -0.09074901044368744, -0.08463657647371292, -0.0785241425037384, -0.07241171598434448, -0.06629928201436996, -0.060186855494976044, -0.054074421525001526, -0.047961991280317307, -0.04184956103563309, -0.03573712706565857, -0.02962469682097435, -0.02351226843893528, -0.01739983633160591, -0.011287406086921692, -0.005174973979592323, 0.0009374562650918961, 0.007049886509776115, 0.013162320479750633, 0.019274750724434853, 0.025387180969119072]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 7.0, 9.0, 8.0, 3.0, 15.0, 15.0, 14.0, 19.0, 19.0, 20.0, 29.0, 40.0, 32.0, 34.0, 37.0, 35.0, 50.0, 38.0, 39.0, 40.0, 45.0, 40.0, 49.0, 48.0, 35.0, 38.0, 34.0, 28.0, 32.0, 22.0, 33.0, 22.0, 14.0, 14.0, 10.0, 5.0, 10.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07566899061203003, -0.07314570248126984, -0.07062241435050964, -0.06809912621974945, -0.06557583808898926, -0.06305254995822906, -0.06052926182746887, -0.05800597369670868, -0.055482685565948486, -0.05295939743518829, -0.0504361093044281, -0.04791282117366791, -0.045389533042907715, -0.04286624491214752, -0.04034295678138733, -0.037819668650627136, -0.03529638051986694, -0.03277309238910675, -0.030249804258346558, -0.027726516127586365, -0.025203227996826172, -0.02267993986606598, -0.020156651735305786, -0.017633363604545593, -0.0151100754737854, -0.012586787343025208, -0.010063499212265015, -0.007540211081504822, -0.005016922950744629, -0.002493634819984436, 2.9653310775756836e-05, 0.0025529414415359497, 0.005076229572296143, 0.0075995177030563354, 0.010122805833816528, 0.012646093964576721, 0.015169382095336914, 0.017692670226097107, 0.0202159583568573, 0.022739246487617493, 0.025262534618377686, 0.02778582274913788, 0.03030911087989807, 0.032832399010658264, 0.03535568714141846, 0.03787897527217865, 0.04040226340293884, 0.042925551533699036, 0.04544883966445923, 0.04797212779521942, 0.050495415925979614, 0.05301870405673981, 0.0555419921875, 0.05806528031826019, 0.060588568449020386, 0.06311185657978058, 0.06563514471054077, 0.06815843284130096, 0.07068172097206116, 0.07320500910282135, 0.07572829723358154, 0.07825158536434174, 0.08077487349510193, 0.08329816162586212, 0.08582144975662231]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 9.0, 6.0, 6.0, 14.0, 11.0, 14.0, 21.0, 26.0, 28.0, 26.0, 29.0, 33.0, 37.0, 42.0, 34.0, 35.0, 43.0, 43.0, 36.0, 46.0, 33.0, 37.0, 41.0, 27.0, 43.0, 25.0, 29.0, 28.0, 21.0, 18.0, 29.0, 17.0, 19.0, 10.0, 16.0, 5.0, 8.0, 9.0, 8.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 5.0, 2.0, 3.0], "bins": [-4.0625, -3.94586181640625, -3.8292236328125, -3.71258544921875, -3.595947265625, -3.47930908203125, -3.3626708984375, -3.24603271484375, -3.12939453125, -3.01275634765625, -2.8961181640625, -2.77947998046875, -2.662841796875, -2.54620361328125, -2.4295654296875, -2.31292724609375, -2.1962890625, -2.07965087890625, -1.9630126953125, -1.84637451171875, -1.729736328125, -1.61309814453125, -1.4964599609375, -1.37982177734375, -1.26318359375, -1.14654541015625, -1.0299072265625, -0.91326904296875, -0.796630859375, -0.67999267578125, -0.5633544921875, -0.44671630859375, -0.330078125, -0.21343994140625, -0.0968017578125, 0.01983642578125, 0.136474609375, 0.25311279296875, 0.3697509765625, 0.48638916015625, 0.60302734375, 0.71966552734375, 0.8363037109375, 0.95294189453125, 1.069580078125, 1.18621826171875, 1.3028564453125, 1.41949462890625, 1.5361328125, 1.65277099609375, 1.7694091796875, 1.88604736328125, 2.002685546875, 2.11932373046875, 2.2359619140625, 2.35260009765625, 2.46923828125, 2.58587646484375, 2.7025146484375, 2.81915283203125, 2.935791015625, 3.05242919921875, 3.1690673828125, 3.28570556640625, 3.40234375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 10.0, 11.0, 27.0, 40.0, 45.0, 83.0, 145.0, 190.0, 293.0, 386.0, 687.0, 1170.0, 1863.0, 3027.0, 4988.0, 8395.0, 14099.0, 24688.0, 45365.0, 87057.0, 173492.0, 268314.0, 196184.0, 99250.0, 51311.0, 28171.0, 15735.0, 9258.0, 5482.0, 3399.0, 2073.0, 1215.0, 733.0, 450.0, 313.0, 205.0, 137.0, 72.0, 48.0, 40.0, 30.0, 9.0, 18.0, 10.0, 10.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302734375, -3.198211669921875, -3.09368896484375, -2.989166259765625, -2.8846435546875, -2.780120849609375, -2.67559814453125, -2.571075439453125, -2.466552734375, -2.362030029296875, -2.25750732421875, -2.152984619140625, -2.0484619140625, -1.943939208984375, -1.83941650390625, -1.734893798828125, -1.63037109375, -1.525848388671875, -1.42132568359375, -1.316802978515625, -1.2122802734375, -1.107757568359375, -1.00323486328125, -0.898712158203125, -0.794189453125, -0.689666748046875, -0.58514404296875, -0.480621337890625, -0.3760986328125, -0.271575927734375, -0.16705322265625, -0.062530517578125, 0.0419921875, 0.146514892578125, 0.25103759765625, 0.355560302734375, 0.4600830078125, 0.564605712890625, 0.66912841796875, 0.773651123046875, 0.878173828125, 0.982696533203125, 1.08721923828125, 1.191741943359375, 1.2962646484375, 1.400787353515625, 1.50531005859375, 1.609832763671875, 1.71435546875, 1.818878173828125, 1.92340087890625, 2.027923583984375, 2.1324462890625, 2.236968994140625, 2.34149169921875, 2.446014404296875, 2.550537109375, 2.655059814453125, 2.75958251953125, 2.864105224609375, 2.9686279296875, 3.073150634765625, 3.17767333984375, 3.282196044921875, 3.38671875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 5.0, 4.0, 8.0, 9.0, 11.0, 13.0, 15.0, 14.0, 17.0, 18.0, 34.0, 29.0, 38.0, 42.0, 49.0, 44.0, 54.0, 77.0, 229.0, 1397.0, 290.0, 145.0, 67.0, 65.0, 55.0, 38.0, 29.0, 28.0, 25.0, 23.0, 21.0, 31.0, 16.0, 17.0, 16.0, 6.0, 11.0, 7.0, 10.0, 4.0, 6.0, 11.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.203125, -10.850830078125, -10.49853515625, -10.146240234375, -9.7939453125, -9.441650390625, -9.08935546875, -8.737060546875, -8.384765625, -8.032470703125, -7.68017578125, -7.327880859375, -6.9755859375, -6.623291015625, -6.27099609375, -5.918701171875, -5.56640625, -5.214111328125, -4.86181640625, -4.509521484375, -4.1572265625, -3.804931640625, -3.45263671875, -3.100341796875, -2.748046875, -2.395751953125, -2.04345703125, -1.691162109375, -1.3388671875, -0.986572265625, -0.63427734375, -0.281982421875, 0.0703125, 0.422607421875, 0.77490234375, 1.127197265625, 1.4794921875, 1.831787109375, 2.18408203125, 2.536376953125, 2.888671875, 3.240966796875, 3.59326171875, 3.945556640625, 4.2978515625, 4.650146484375, 5.00244140625, 5.354736328125, 5.70703125, 6.059326171875, 6.41162109375, 6.763916015625, 7.1162109375, 7.468505859375, 7.82080078125, 8.173095703125, 8.525390625, 8.877685546875, 9.22998046875, 9.582275390625, 9.9345703125, 10.286865234375, 10.63916015625, 10.991455078125, 11.34375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 11.0, 12.0, 6.0, 19.0, 22.0, 27.0, 34.0, 42.0, 55.0, 59.0, 87.0, 113.0, 179.0, 226.0, 433.0, 1012.0, 7312.0, 154198.0, 2856623.0, 116824.0, 6098.0, 1005.0, 411.0, 256.0, 189.0, 104.0, 79.0, 46.0, 49.0, 35.0, 30.0, 19.0, 15.0, 20.0, 6.0, 7.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-19.125, -18.553466796875, -17.98193359375, -17.410400390625, -16.8388671875, -16.267333984375, -15.69580078125, -15.124267578125, -14.552734375, -13.981201171875, -13.40966796875, -12.838134765625, -12.2666015625, -11.695068359375, -11.12353515625, -10.552001953125, -9.98046875, -9.408935546875, -8.83740234375, -8.265869140625, -7.6943359375, -7.122802734375, -6.55126953125, -5.979736328125, -5.408203125, -4.836669921875, -4.26513671875, -3.693603515625, -3.1220703125, -2.550537109375, -1.97900390625, -1.407470703125, -0.8359375, -0.264404296875, 0.30712890625, 0.878662109375, 1.4501953125, 2.021728515625, 2.59326171875, 3.164794921875, 3.736328125, 4.307861328125, 4.87939453125, 5.450927734375, 6.0224609375, 6.593994140625, 7.16552734375, 7.737060546875, 8.30859375, 8.880126953125, 9.45166015625, 10.023193359375, 10.5947265625, 11.166259765625, 11.73779296875, 12.309326171875, 12.880859375, 13.452392578125, 14.02392578125, 14.595458984375, 15.1669921875, 15.738525390625, 16.31005859375, 16.881591796875, 17.453125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 40.0, 729.0, 246.0, 5.0], "bins": [-298.4379577636719, -293.59881591796875, -288.7596740722656, -283.9205322265625, -279.0813903808594, -274.2422790527344, -269.40313720703125, -264.5639953613281, -259.724853515625, -254.88571166992188, -250.04656982421875, -245.2074432373047, -240.36830139160156, -235.52915954589844, -230.6900177001953, -225.85089111328125, -221.01174926757812, -216.172607421875, -211.33346557617188, -206.4943389892578, -201.6551971435547, -196.81605529785156, -191.97691345214844, -187.13778686523438, -182.2986297607422, -177.45948791503906, -172.62034606933594, -167.78121948242188, -162.94207763671875, -158.10293579101562, -153.2637939453125, -148.42465209960938, -143.58551025390625, -138.74636840820312, -133.9072265625, -129.06809997558594, -124.22895812988281, -119.38981628417969, -114.55067443847656, -109.71154022216797, -104.87240600585938, -100.03326416015625, -95.19412994384766, -90.35498809814453, -85.51585388183594, -80.67671203613281, -75.83757019042969, -70.9984359741211, -66.1593017578125, -61.32016372680664, -56.48102569580078, -51.641883850097656, -46.80274963378906, -41.96360778808594, -37.12446975708008, -32.28533172607422, -27.446189880371094, -22.607051849365234, -17.767913818359375, -12.928773880004883, -8.089635848999023, -3.250497817993164, 1.5886421203613281, 6.4277801513671875, 11.266918182373047]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 4.0, 11.0, 10.0, 11.0, 16.0, 16.0, 15.0, 15.0, 26.0, 28.0, 19.0, 34.0, 30.0, 31.0, 42.0, 32.0, 29.0, 42.0, 41.0, 46.0, 30.0, 46.0, 53.0, 37.0, 37.0, 43.0, 42.0, 28.0, 32.0, 20.0, 23.0, 24.0, 20.0, 12.0, 12.0, 10.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-30.812227249145508, -29.86284637451172, -28.913463592529297, -27.964082717895508, -27.01470184326172, -26.065319061279297, -25.115938186645508, -24.16655731201172, -23.217174530029297, -22.267793655395508, -21.318410873413086, -20.369029998779297, -19.419649124145508, -18.47026824951172, -17.520885467529297, -16.571504592895508, -15.622123718261719, -14.672741889953613, -13.723361015319824, -12.773979187011719, -11.82459831237793, -10.875216484069824, -9.925834655761719, -8.97645378112793, -8.027071952819824, -7.077690601348877, -6.12830924987793, -5.178927421569824, -4.229546070098877, -3.2801647186279297, -2.330782890319824, -1.381401538848877, -0.4320201873779297, 0.5173612833023071, 1.466742753982544, 2.4161243438720703, 3.3655056953430176, 4.314887046813965, 5.26426887512207, 6.213650226593018, 7.163031578063965, 8.11241340637207, 9.06179428100586, 10.011176109313965, 10.96055793762207, 11.90993881225586, 12.859320640563965, 13.80870246887207, 14.75808334350586, 15.707465171813965, 16.65684700012207, 17.60622787475586, 18.55560874938965, 19.504989624023438, 20.45437240600586, 21.40375328063965, 22.353134155273438, 23.302515029907227, 24.25189781188965, 25.201278686523438, 26.150659561157227, 27.100040435791016, 28.049423217773438, 28.998804092407227, 29.94818687438965]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 10.0, 7.0, 17.0, 13.0, 14.0, 19.0, 14.0, 30.0, 25.0, 28.0, 32.0, 34.0, 52.0, 35.0, 31.0, 37.0, 42.0, 46.0, 36.0, 41.0, 41.0, 38.0, 30.0, 40.0, 40.0, 33.0, 30.0, 16.0, 27.0, 22.0, 16.0, 20.0, 9.0, 14.0, 7.0, 11.0, 9.0, 6.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.89453125, -3.7645263671875, -3.634521484375, -3.5045166015625, -3.37451171875, -3.2445068359375, -3.114501953125, -2.9844970703125, -2.8544921875, -2.7244873046875, -2.594482421875, -2.4644775390625, -2.33447265625, -2.2044677734375, -2.074462890625, -1.9444580078125, -1.814453125, -1.6844482421875, -1.554443359375, -1.4244384765625, -1.29443359375, -1.1644287109375, -1.034423828125, -0.9044189453125, -0.7744140625, -0.6444091796875, -0.514404296875, -0.3843994140625, -0.25439453125, -0.1243896484375, 0.005615234375, 0.1356201171875, 0.265625, 0.3956298828125, 0.525634765625, 0.6556396484375, 0.78564453125, 0.9156494140625, 1.045654296875, 1.1756591796875, 1.3056640625, 1.4356689453125, 1.565673828125, 1.6956787109375, 1.82568359375, 1.9556884765625, 2.085693359375, 2.2156982421875, 2.345703125, 2.4757080078125, 2.605712890625, 2.7357177734375, 2.86572265625, 2.9957275390625, 3.125732421875, 3.2557373046875, 3.3857421875, 3.5157470703125, 3.645751953125, 3.7757568359375, 3.90576171875, 4.0357666015625, 4.165771484375, 4.2957763671875, 4.42578125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 8.0, 9.0, 8.0, 15.0, 19.0, 15.0, 21.0, 20.0, 36.0, 64.0, 81.0, 111.0, 235.0, 823.0, 4180.0, 41441.0, 675977.0, 2947240.0, 489085.0, 30139.0, 3320.0, 728.0, 255.0, 121.0, 64.0, 51.0, 26.0, 31.0, 26.0, 18.0, 16.0, 15.0, 15.0, 14.0, 10.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-11.7890625, -11.44677734375, -11.1044921875, -10.76220703125, -10.419921875, -10.07763671875, -9.7353515625, -9.39306640625, -9.05078125, -8.70849609375, -8.3662109375, -8.02392578125, -7.681640625, -7.33935546875, -6.9970703125, -6.65478515625, -6.3125, -5.97021484375, -5.6279296875, -5.28564453125, -4.943359375, -4.60107421875, -4.2587890625, -3.91650390625, -3.57421875, -3.23193359375, -2.8896484375, -2.54736328125, -2.205078125, -1.86279296875, -1.5205078125, -1.17822265625, -0.8359375, -0.49365234375, -0.1513671875, 0.19091796875, 0.533203125, 0.87548828125, 1.2177734375, 1.56005859375, 1.90234375, 2.24462890625, 2.5869140625, 2.92919921875, 3.271484375, 3.61376953125, 3.9560546875, 4.29833984375, 4.640625, 4.98291015625, 5.3251953125, 5.66748046875, 6.009765625, 6.35205078125, 6.6943359375, 7.03662109375, 7.37890625, 7.72119140625, 8.0634765625, 8.40576171875, 8.748046875, 9.09033203125, 9.4326171875, 9.77490234375, 10.1171875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 13.0, 11.0, 14.0, 22.0, 26.0, 30.0, 57.0, 57.0, 88.0, 113.0, 186.0, 215.0, 292.0, 369.0, 446.0, 437.0, 373.0, 375.0, 242.0, 184.0, 143.0, 114.0, 80.0, 45.0, 29.0, 21.0, 20.0, 17.0, 12.0, 13.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.410888671875, -5.21240234375, -5.013916015625, -4.8154296875, -4.616943359375, -4.41845703125, -4.219970703125, -4.021484375, -3.822998046875, -3.62451171875, -3.426025390625, -3.2275390625, -3.029052734375, -2.83056640625, -2.632080078125, -2.43359375, -2.235107421875, -2.03662109375, -1.838134765625, -1.6396484375, -1.441162109375, -1.24267578125, -1.044189453125, -0.845703125, -0.647216796875, -0.44873046875, -0.250244140625, -0.0517578125, 0.146728515625, 0.34521484375, 0.543701171875, 0.7421875, 0.940673828125, 1.13916015625, 1.337646484375, 1.5361328125, 1.734619140625, 1.93310546875, 2.131591796875, 2.330078125, 2.528564453125, 2.72705078125, 2.925537109375, 3.1240234375, 3.322509765625, 3.52099609375, 3.719482421875, 3.91796875, 4.116455078125, 4.31494140625, 4.513427734375, 4.7119140625, 4.910400390625, 5.10888671875, 5.307373046875, 5.505859375, 5.704345703125, 5.90283203125, 6.101318359375, 6.2998046875, 6.498291015625, 6.69677734375, 6.895263671875, 7.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 10.0, 15.0, 18.0, 24.0, 30.0, 28.0, 70.0, 113.0, 176.0, 253.0, 463.0, 980.0, 5877.0, 133223.0, 3453209.0, 580705.0, 15881.0, 1698.0, 546.0, 306.0, 202.0, 129.0, 92.0, 56.0, 43.0, 27.0, 22.0, 17.0, 17.0, 13.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.609375, -22.94775390625, -22.2861328125, -21.62451171875, -20.962890625, -20.30126953125, -19.6396484375, -18.97802734375, -18.31640625, -17.65478515625, -16.9931640625, -16.33154296875, -15.669921875, -15.00830078125, -14.3466796875, -13.68505859375, -13.0234375, -12.36181640625, -11.7001953125, -11.03857421875, -10.376953125, -9.71533203125, -9.0537109375, -8.39208984375, -7.73046875, -7.06884765625, -6.4072265625, -5.74560546875, -5.083984375, -4.42236328125, -3.7607421875, -3.09912109375, -2.4375, -1.77587890625, -1.1142578125, -0.45263671875, 0.208984375, 0.87060546875, 1.5322265625, 2.19384765625, 2.85546875, 3.51708984375, 4.1787109375, 4.84033203125, 5.501953125, 6.16357421875, 6.8251953125, 7.48681640625, 8.1484375, 8.81005859375, 9.4716796875, 10.13330078125, 10.794921875, 11.45654296875, 12.1181640625, 12.77978515625, 13.44140625, 14.10302734375, 14.7646484375, 15.42626953125, 16.087890625, 16.74951171875, 17.4111328125, 18.07275390625, 18.734375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 19.0, 63.0, 145.0, 193.0, 231.0, 165.0, 108.0, 59.0, 16.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.100749015808105, -11.34965991973877, -9.598569869995117, -7.847480773925781, -6.096391677856445, -4.345302581787109, -2.594212532043457, -0.8431234359741211, 0.9079656600952148, 2.65905499458313, 4.410144329071045, 6.161233901977539, 7.912322998046875, 9.663412094116211, 11.414502143859863, 13.1655912399292, 14.916680335998535, 16.667770385742188, 18.418859481811523, 20.16994857788086, 21.921037673950195, 23.67212677001953, 25.4232177734375, 27.174304962158203, 28.925395965576172, 30.676485061645508, 32.427574157714844, 34.17866516113281, 35.929752349853516, 37.680843353271484, 39.43193054199219, 41.183021545410156, 42.934112548828125, 44.685203552246094, 46.4362907409668, 48.187381744384766, 49.93846893310547, 51.68955993652344, 53.440650939941406, 55.19173812866211, 56.94282531738281, 58.69391632080078, 60.445003509521484, 62.19609451293945, 63.947181701660156, 65.69827270507812, 67.4493637084961, 69.20045471191406, 70.9515380859375, 72.70262908935547, 74.45372009277344, 76.20480346679688, 77.95589447021484, 79.70698547363281, 81.45807647705078, 83.20916748046875, 84.96025848388672, 86.71134948730469, 88.46244049072266, 90.2135238647461, 91.96461486816406, 93.71570587158203, 95.466796875, 97.21788024902344, 98.9689712524414]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 6.0, 8.0, 15.0, 12.0, 9.0, 14.0, 13.0, 17.0, 17.0, 22.0, 27.0, 26.0, 23.0, 33.0, 30.0, 38.0, 36.0, 31.0, 40.0, 26.0, 37.0, 32.0, 30.0, 30.0, 48.0, 29.0, 36.0, 36.0, 39.0, 28.0, 39.0, 28.0, 23.0, 18.0, 14.0, 22.0, 14.0, 10.0, 7.0, 7.0, 2.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.264514923095703, -19.64227867126465, -19.020042419433594, -18.39780616760254, -17.775569915771484, -17.15333366394043, -16.531097412109375, -15.90886116027832, -15.286624908447266, -14.664388656616211, -14.042152404785156, -13.419916152954102, -12.797679901123047, -12.175443649291992, -11.553207397460938, -10.930971145629883, -10.308734893798828, -9.686498641967773, -9.064262390136719, -8.442026138305664, -7.819789886474609, -7.197553634643555, -6.5753173828125, -5.953081130981445, -5.330844879150391, -4.708608627319336, -4.086372375488281, -3.4641361236572266, -2.841899871826172, -2.219663619995117, -1.5974273681640625, -0.9751911163330078, -0.3529529571533203, 0.2692832946777344, 0.8915195465087891, 1.5137557983398438, 2.1359920501708984, 2.758228302001953, 3.380464553833008, 4.0027008056640625, 4.624937057495117, 5.247173309326172, 5.869409561157227, 6.491645812988281, 7.113882064819336, 7.736118316650391, 8.358354568481445, 8.9805908203125, 9.602827072143555, 10.22506332397461, 10.847299575805664, 11.469535827636719, 12.091772079467773, 12.714008331298828, 13.336244583129883, 13.958480834960938, 14.580717086791992, 15.202953338623047, 15.825189590454102, 16.447425842285156, 17.06966209411621, 17.691898345947266, 18.31413459777832, 18.936370849609375, 19.55860710144043]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 8.0, 10.0, 17.0, 8.0, 13.0, 16.0, 12.0, 22.0, 18.0, 23.0, 33.0, 35.0, 33.0, 39.0, 33.0, 43.0, 37.0, 38.0, 43.0, 44.0, 45.0, 42.0, 28.0, 30.0, 43.0, 26.0, 30.0, 23.0, 25.0, 29.0, 27.0, 21.0, 17.0, 16.0, 10.0, 11.0, 8.0, 7.0, 11.0, 2.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.1328125, -4.009063720703125, -3.88531494140625, -3.761566162109375, -3.6378173828125, -3.514068603515625, -3.39031982421875, -3.266571044921875, -3.142822265625, -3.019073486328125, -2.89532470703125, -2.771575927734375, -2.6478271484375, -2.524078369140625, -2.40032958984375, -2.276580810546875, -2.15283203125, -2.029083251953125, -1.90533447265625, -1.781585693359375, -1.6578369140625, -1.534088134765625, -1.41033935546875, -1.286590576171875, -1.162841796875, -1.039093017578125, -0.91534423828125, -0.791595458984375, -0.6678466796875, -0.544097900390625, -0.42034912109375, -0.296600341796875, -0.1728515625, -0.049102783203125, 0.07464599609375, 0.198394775390625, 0.3221435546875, 0.445892333984375, 0.56964111328125, 0.693389892578125, 0.817138671875, 0.940887451171875, 1.06463623046875, 1.188385009765625, 1.3121337890625, 1.435882568359375, 1.55963134765625, 1.683380126953125, 1.80712890625, 1.930877685546875, 2.05462646484375, 2.178375244140625, 2.3021240234375, 2.425872802734375, 2.54962158203125, 2.673370361328125, 2.797119140625, 2.920867919921875, 3.04461669921875, 3.168365478515625, 3.2921142578125, 3.415863037109375, 3.53961181640625, 3.663360595703125, 3.787109375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 2.0, 8.0, 8.0, 14.0, 15.0, 39.0, 49.0, 79.0, 126.0, 193.0, 276.0, 391.0, 666.0, 953.0, 1580.0, 2420.0, 3803.0, 6086.0, 9449.0, 14949.0, 22661.0, 34527.0, 50983.0, 72710.0, 97351.0, 120591.0, 134093.0, 126195.0, 103987.0, 79032.0, 55951.0, 37958.0, 25385.0, 16675.0, 10472.0, 6684.0, 4443.0, 2777.0, 1802.0, 1106.0, 746.0, 484.0, 298.0, 185.0, 126.0, 69.0, 73.0, 32.0, 27.0, 11.0, 10.0, 2.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25634765625, -0.24797821044921875, -0.2396087646484375, -0.23123931884765625, -0.222869873046875, -0.21450042724609375, -0.2061309814453125, -0.19776153564453125, -0.18939208984375, -0.18102264404296875, -0.1726531982421875, -0.16428375244140625, -0.155914306640625, -0.14754486083984375, -0.1391754150390625, -0.13080596923828125, -0.1224365234375, -0.11406707763671875, -0.1056976318359375, -0.09732818603515625, -0.088958740234375, -0.08058929443359375, -0.0722198486328125, -0.06385040283203125, -0.05548095703125, -0.04711151123046875, -0.0387420654296875, -0.03037261962890625, -0.022003173828125, -0.01363372802734375, -0.0052642822265625, 0.00310516357421875, 0.011474609375, 0.01984405517578125, 0.0282135009765625, 0.03658294677734375, 0.044952392578125, 0.05332183837890625, 0.0616912841796875, 0.07006072998046875, 0.07843017578125, 0.08679962158203125, 0.0951690673828125, 0.10353851318359375, 0.111907958984375, 0.12027740478515625, 0.1286468505859375, 0.13701629638671875, 0.1453857421875, 0.15375518798828125, 0.1621246337890625, 0.17049407958984375, 0.178863525390625, 0.18723297119140625, 0.1956024169921875, 0.20397186279296875, 0.21234130859375, 0.22071075439453125, 0.2290802001953125, 0.23744964599609375, 0.245819091796875, 0.25418853759765625, 0.2625579833984375, 0.27092742919921875, 0.279296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 6.0, 9.0, 17.0, 13.0, 15.0, 13.0, 18.0, 27.0, 27.0, 31.0, 38.0, 33.0, 38.0, 40.0, 42.0, 47.0, 42.0, 49.0, 1060.0, 38.0, 40.0, 31.0, 35.0, 31.0, 38.0, 27.0, 31.0, 20.0, 24.0, 20.0, 15.0, 19.0, 10.0, 15.0, 18.0, 10.0, 7.0, 7.0, 7.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.568359375, -3.466522216796875, -3.36468505859375, -3.262847900390625, -3.1610107421875, -3.059173583984375, -2.95733642578125, -2.855499267578125, -2.753662109375, -2.651824951171875, -2.54998779296875, -2.448150634765625, -2.3463134765625, -2.244476318359375, -2.14263916015625, -2.040802001953125, -1.93896484375, -1.837127685546875, -1.73529052734375, -1.633453369140625, -1.5316162109375, -1.429779052734375, -1.32794189453125, -1.226104736328125, -1.124267578125, -1.022430419921875, -0.92059326171875, -0.818756103515625, -0.7169189453125, -0.615081787109375, -0.51324462890625, -0.411407470703125, -0.3095703125, -0.207733154296875, -0.10589599609375, -0.004058837890625, 0.0977783203125, 0.199615478515625, 0.30145263671875, 0.403289794921875, 0.505126953125, 0.606964111328125, 0.70880126953125, 0.810638427734375, 0.9124755859375, 1.014312744140625, 1.11614990234375, 1.217987060546875, 1.31982421875, 1.421661376953125, 1.52349853515625, 1.625335693359375, 1.7271728515625, 1.829010009765625, 1.93084716796875, 2.032684326171875, 2.134521484375, 2.236358642578125, 2.33819580078125, 2.440032958984375, 2.5418701171875, 2.643707275390625, 2.74554443359375, 2.847381591796875, 2.94921875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 17.0, 18.0, 36.0, 49.0, 80.0, 143.0, 255.0, 436.0, 732.0, 1333.0, 2424.0, 4486.0, 8295.0, 15152.0, 27790.0, 49037.0, 83263.0, 129424.0, 308293.0, 1080566.0, 150191.0, 98793.0, 59894.0, 34502.0, 18981.0, 10402.0, 5613.0, 2985.0, 1692.0, 908.0, 518.0, 296.0, 187.0, 103.0, 67.0, 49.0, 32.0, 22.0, 11.0, 11.0, 11.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.205078125, -0.19805145263671875, -0.1910247802734375, -0.18399810791015625, -0.176971435546875, -0.16994476318359375, -0.1629180908203125, -0.15589141845703125, -0.14886474609375, -0.14183807373046875, -0.1348114013671875, -0.12778472900390625, -0.120758056640625, -0.11373138427734375, -0.1067047119140625, -0.09967803955078125, -0.0926513671875, -0.08562469482421875, -0.0785980224609375, -0.07157135009765625, -0.064544677734375, -0.05751800537109375, -0.0504913330078125, -0.04346466064453125, -0.03643798828125, -0.02941131591796875, -0.0223846435546875, -0.01535797119140625, -0.008331298828125, -0.00130462646484375, 0.0057220458984375, 0.01274871826171875, 0.019775390625, 0.02680206298828125, 0.0338287353515625, 0.04085540771484375, 0.047882080078125, 0.05490875244140625, 0.0619354248046875, 0.06896209716796875, 0.07598876953125, 0.08301544189453125, 0.0900421142578125, 0.09706878662109375, 0.104095458984375, 0.11112213134765625, 0.1181488037109375, 0.12517547607421875, 0.1322021484375, 0.13922882080078125, 0.1462554931640625, 0.15328216552734375, 0.160308837890625, 0.16733551025390625, 0.1743621826171875, 0.18138885498046875, 0.18841552734375, 0.19544219970703125, 0.2024688720703125, 0.20949554443359375, 0.216522216796875, 0.22354888916015625, 0.2305755615234375, 0.23760223388671875, 0.24462890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 11.0, 11.0, 19.0, 19.0, 33.0, 30.0, 63.0, 69.0, 77.0, 97.0, 103.0, 101.0, 81.0, 67.0, 47.0, 44.0, 22.0, 17.0, 19.0, 17.0, 11.0, 2.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0533447265625, -0.05170297622680664, -0.05006122589111328, -0.04841947555541992, -0.04677772521972656, -0.0451359748840332, -0.043494224548339844, -0.041852474212646484, -0.040210723876953125, -0.038568973541259766, -0.036927223205566406, -0.03528547286987305, -0.03364372253417969, -0.03200197219848633, -0.03036022186279297, -0.02871847152709961, -0.02707672119140625, -0.02543497085571289, -0.02379322052001953, -0.022151470184326172, -0.020509719848632812, -0.018867969512939453, -0.017226219177246094, -0.015584468841552734, -0.013942718505859375, -0.012300968170166016, -0.010659217834472656, -0.009017467498779297, -0.0073757171630859375, -0.005733966827392578, -0.004092216491699219, -0.0024504661560058594, -0.0008087158203125, 0.0008330345153808594, 0.0024747848510742188, 0.004116535186767578, 0.0057582855224609375, 0.007400035858154297, 0.009041786193847656, 0.010683536529541016, 0.012325286865234375, 0.013967037200927734, 0.015608787536621094, 0.017250537872314453, 0.018892288208007812, 0.020534038543701172, 0.02217578887939453, 0.02381753921508789, 0.02545928955078125, 0.02710103988647461, 0.02874279022216797, 0.030384540557861328, 0.03202629089355469, 0.03366804122924805, 0.035309791564941406, 0.036951541900634766, 0.038593292236328125, 0.040235042572021484, 0.041876792907714844, 0.0435185432434082, 0.04516029357910156, 0.04680204391479492, 0.04844379425048828, 0.05008554458618164, 0.051727294921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 3.0, 11.0, 20.0, 22.0, 30.0, 42.0, 86.0, 144.0, 363.0, 1693.0, 1044352.0, 1104.0, 310.0, 143.0, 71.0, 44.0, 29.0, 23.0, 14.0, 10.0, 3.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.337890625, -1.2953033447265625, -1.252716064453125, -1.2101287841796875, -1.16754150390625, -1.1249542236328125, -1.082366943359375, -1.0397796630859375, -0.9971923828125, -0.9546051025390625, -0.912017822265625, -0.8694305419921875, -0.82684326171875, -0.7842559814453125, -0.741668701171875, -0.6990814208984375, -0.656494140625, -0.6139068603515625, -0.571319580078125, -0.5287322998046875, -0.48614501953125, -0.4435577392578125, -0.400970458984375, -0.3583831787109375, -0.3157958984375, -0.2732086181640625, -0.230621337890625, -0.1880340576171875, -0.14544677734375, -0.1028594970703125, -0.060272216796875, -0.0176849365234375, 0.02490234375, 0.0674896240234375, 0.110076904296875, 0.1526641845703125, 0.19525146484375, 0.2378387451171875, 0.280426025390625, 0.3230133056640625, 0.3656005859375, 0.4081878662109375, 0.450775146484375, 0.4933624267578125, 0.53594970703125, 0.5785369873046875, 0.621124267578125, 0.6637115478515625, 0.706298828125, 0.7488861083984375, 0.791473388671875, 0.8340606689453125, 0.87664794921875, 0.9192352294921875, 0.961822509765625, 1.0044097900390625, 1.0469970703125, 1.0895843505859375, 1.132171630859375, 1.1747589111328125, 1.21734619140625, 1.2599334716796875, 1.302520751953125, 1.3451080322265625, 1.3876953125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 34.0, 148.0, 709.0, 101.0, 16.0, 4.0, 0.0, 2.0], "bins": [-0.4821374714374542, -0.47389090061187744, -0.46564435958862305, -0.45739778876304626, -0.4491512179374695, -0.4409046471118927, -0.4326581060886383, -0.4244115352630615, -0.41616496443748474, -0.40791839361190796, -0.39967185258865356, -0.3914252817630768, -0.3831787109375, -0.3749321401119232, -0.3666855990886688, -0.35843902826309204, -0.35019248723983765, -0.34194591641426086, -0.33369937539100647, -0.3254528045654297, -0.3172062337398529, -0.3089596629142761, -0.30071312189102173, -0.29246655106544495, -0.28421998023986816, -0.2759734094142914, -0.267726868391037, -0.2594802975654602, -0.2512337267398834, -0.24298717081546783, -0.23474061489105225, -0.22649404406547546, -0.21824747323989868, -0.2100009173154831, -0.2017543464899063, -0.19350779056549072, -0.18526121973991394, -0.17701466381549835, -0.16876810789108276, -0.16052153706550598, -0.1522749811410904, -0.1440284252166748, -0.13578185439109802, -0.12753529846668243, -0.11928872764110565, -0.11104217171669006, -0.10279560834169388, -0.09454904496669769, -0.08630248159170151, -0.07805591821670532, -0.06980935484170914, -0.06156279519200325, -0.053316231817007065, -0.04506966844201088, -0.03682310879230499, -0.028576545417308807, -0.020329982042312622, -0.012083419598639011, -0.0038368571549654007, 0.004409704357385635, 0.01265626773238182, 0.020902831107378006, 0.029149390757083893, 0.03739595413208008, 0.04564251750707626]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 10.0, 15.0, 9.0, 18.0, 12.0, 15.0, 18.0, 27.0, 24.0, 25.0, 27.0, 42.0, 34.0, 44.0, 31.0, 43.0, 39.0, 41.0, 51.0, 25.0, 42.0, 48.0, 45.0, 41.0, 32.0, 33.0, 37.0, 18.0, 26.0, 20.0, 11.0, 7.0, 19.0, 20.0, 11.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10975223779678345, -0.10658009350299835, -0.10340795665979385, -0.10023581981658936, -0.09706367552280426, -0.09389153122901917, -0.09071939438581467, -0.08754725754261017, -0.08437511324882507, -0.08120296895503998, -0.07803083211183548, -0.07485869526863098, -0.07168655097484589, -0.06851440668106079, -0.06534226983785629, -0.062170129269361496, -0.0589979887008667, -0.0558258481323719, -0.052653707563877106, -0.04948156699538231, -0.04630942642688751, -0.043137285858392715, -0.03996514528989792, -0.03679300472140312, -0.033620864152908325, -0.03044872358441353, -0.02727658301591873, -0.024104442447423935, -0.020932301878929138, -0.01776016131043434, -0.014588020741939545, -0.011415880173444748, -0.008243739604949951, -0.005071599036455154, -0.0018994584679603577, 0.001272682100534439, 0.004444822669029236, 0.007616963237524033, 0.01078910380601883, 0.013961244374513626, 0.017133384943008423, 0.02030552551150322, 0.023477666079998016, 0.026649806648492813, 0.02982194721698761, 0.03299408778548241, 0.0361662283539772, 0.039338368922472, 0.0425105094909668, 0.045682650059461594, 0.04885479062795639, 0.05202693119645119, 0.055199071764945984, 0.05837121233344078, 0.06154335290193558, 0.06471548974514008, 0.06788763403892517, 0.07105977833271027, 0.07423191517591476, 0.07740405201911926, 0.08057619631290436, 0.08374834060668945, 0.08692047744989395, 0.09009261429309845, 0.09326475858688354]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 4.0, 15.0, 20.0, 16.0, 19.0, 20.0, 31.0, 22.0, 32.0, 29.0, 33.0, 35.0, 47.0, 41.0, 40.0, 34.0, 49.0, 39.0, 50.0, 41.0, 35.0, 34.0, 19.0, 29.0, 26.0, 25.0, 31.0, 23.0, 22.0, 19.0, 16.0, 16.0, 13.0, 5.0, 6.0, 7.0, 6.0, 5.0, 3.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.96875, -3.84381103515625, -3.7188720703125, -3.59393310546875, -3.468994140625, -3.34405517578125, -3.2191162109375, -3.09417724609375, -2.96923828125, -2.84429931640625, -2.7193603515625, -2.59442138671875, -2.469482421875, -2.34454345703125, -2.2196044921875, -2.09466552734375, -1.9697265625, -1.84478759765625, -1.7198486328125, -1.59490966796875, -1.469970703125, -1.34503173828125, -1.2200927734375, -1.09515380859375, -0.97021484375, -0.84527587890625, -0.7203369140625, -0.59539794921875, -0.470458984375, -0.34552001953125, -0.2205810546875, -0.09564208984375, 0.029296875, 0.15423583984375, 0.2791748046875, 0.40411376953125, 0.529052734375, 0.65399169921875, 0.7789306640625, 0.90386962890625, 1.02880859375, 1.15374755859375, 1.2786865234375, 1.40362548828125, 1.528564453125, 1.65350341796875, 1.7784423828125, 1.90338134765625, 2.0283203125, 2.15325927734375, 2.2781982421875, 2.40313720703125, 2.528076171875, 2.65301513671875, 2.7779541015625, 2.90289306640625, 3.02783203125, 3.15277099609375, 3.2777099609375, 3.40264892578125, 3.527587890625, 3.65252685546875, 3.7774658203125, 3.90240478515625, 4.02734375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 15.0, 20.0, 30.0, 36.0, 28.0, 58.0, 75.0, 95.0, 149.0, 317.0, 668.0, 1754.0, 4739.0, 13143.0, 38577.0, 166025.0, 523944.0, 225323.0, 48093.0, 15915.0, 5707.0, 2079.0, 808.0, 349.0, 191.0, 97.0, 84.0, 52.0, 40.0, 31.0, 19.0, 14.0, 20.0, 13.0, 10.0, 10.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.4493408203125, -6.238525390625, -6.0277099609375, -5.81689453125, -5.6060791015625, -5.395263671875, -5.1844482421875, -4.9736328125, -4.7628173828125, -4.552001953125, -4.3411865234375, -4.13037109375, -3.9195556640625, -3.708740234375, -3.4979248046875, -3.287109375, -3.0762939453125, -2.865478515625, -2.6546630859375, -2.44384765625, -2.2330322265625, -2.022216796875, -1.8114013671875, -1.6005859375, -1.3897705078125, -1.178955078125, -0.9681396484375, -0.75732421875, -0.5465087890625, -0.335693359375, -0.1248779296875, 0.0859375, 0.2967529296875, 0.507568359375, 0.7183837890625, 0.92919921875, 1.1400146484375, 1.350830078125, 1.5616455078125, 1.7724609375, 1.9832763671875, 2.194091796875, 2.4049072265625, 2.61572265625, 2.8265380859375, 3.037353515625, 3.2481689453125, 3.458984375, 3.6697998046875, 3.880615234375, 4.0914306640625, 4.30224609375, 4.5130615234375, 4.723876953125, 4.9346923828125, 5.1455078125, 5.3563232421875, 5.567138671875, 5.7779541015625, 5.98876953125, 6.1995849609375, 6.410400390625, 6.6212158203125, 6.83203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 5.0, 6.0, 4.0, 18.0, 9.0, 13.0, 23.0, 18.0, 20.0, 20.0, 32.0, 35.0, 42.0, 44.0, 40.0, 72.0, 110.0, 233.0, 1520.0, 261.0, 113.0, 55.0, 46.0, 37.0, 32.0, 35.0, 37.0, 30.0, 36.0, 25.0, 11.0, 10.0, 4.0, 8.0, 8.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.271728515625, -12.86376953125, -12.455810546875, -12.0478515625, -11.639892578125, -11.23193359375, -10.823974609375, -10.416015625, -10.008056640625, -9.60009765625, -9.192138671875, -8.7841796875, -8.376220703125, -7.96826171875, -7.560302734375, -7.15234375, -6.744384765625, -6.33642578125, -5.928466796875, -5.5205078125, -5.112548828125, -4.70458984375, -4.296630859375, -3.888671875, -3.480712890625, -3.07275390625, -2.664794921875, -2.2568359375, -1.848876953125, -1.44091796875, -1.032958984375, -0.625, -0.217041015625, 0.19091796875, 0.598876953125, 1.0068359375, 1.414794921875, 1.82275390625, 2.230712890625, 2.638671875, 3.046630859375, 3.45458984375, 3.862548828125, 4.2705078125, 4.678466796875, 5.08642578125, 5.494384765625, 5.90234375, 6.310302734375, 6.71826171875, 7.126220703125, 7.5341796875, 7.942138671875, 8.35009765625, 8.758056640625, 9.166015625, 9.573974609375, 9.98193359375, 10.389892578125, 10.7978515625, 11.205810546875, 11.61376953125, 12.021728515625, 12.4296875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 9.0, 5.0, 7.0, 14.0, 17.0, 28.0, 35.0, 55.0, 66.0, 93.0, 89.0, 152.0, 246.0, 534.0, 1968.0, 34343.0, 2918083.0, 183182.0, 4966.0, 781.0, 315.0, 198.0, 133.0, 88.0, 51.0, 46.0, 25.0, 36.0, 28.0, 19.0, 15.0, 17.0, 7.0, 6.0, 7.0, 4.0, 3.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.46875, -20.74560546875, -20.0224609375, -19.29931640625, -18.576171875, -17.85302734375, -17.1298828125, -16.40673828125, -15.68359375, -14.96044921875, -14.2373046875, -13.51416015625, -12.791015625, -12.06787109375, -11.3447265625, -10.62158203125, -9.8984375, -9.17529296875, -8.4521484375, -7.72900390625, -7.005859375, -6.28271484375, -5.5595703125, -4.83642578125, -4.11328125, -3.39013671875, -2.6669921875, -1.94384765625, -1.220703125, -0.49755859375, 0.2255859375, 0.94873046875, 1.671875, 2.39501953125, 3.1181640625, 3.84130859375, 4.564453125, 5.28759765625, 6.0107421875, 6.73388671875, 7.45703125, 8.18017578125, 8.9033203125, 9.62646484375, 10.349609375, 11.07275390625, 11.7958984375, 12.51904296875, 13.2421875, 13.96533203125, 14.6884765625, 15.41162109375, 16.134765625, 16.85791015625, 17.5810546875, 18.30419921875, 19.02734375, 19.75048828125, 20.4736328125, 21.19677734375, 21.919921875, 22.64306640625, 23.3662109375, 24.08935546875, 24.8125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 161.0, 755.0, 101.0], "bins": [-240.7195587158203, -236.86416625976562, -233.00877380371094, -229.15338134765625, -225.29798889160156, -221.44259643554688, -217.5872039794922, -213.7318115234375, -209.8764190673828, -206.02102661132812, -202.16563415527344, -198.31024169921875, -194.45484924316406, -190.59945678710938, -186.7440643310547, -182.888671875, -179.03326416015625, -175.17787170410156, -171.32247924804688, -167.4670867919922, -163.6116943359375, -159.7563018798828, -155.90090942382812, -152.04551696777344, -148.19012451171875, -144.33473205566406, -140.47933959960938, -136.6239471435547, -132.7685546875, -128.9131622314453, -125.05776977539062, -121.2023696899414, -117.34696960449219, -113.4915771484375, -109.63618469238281, -105.78079223632812, -101.92539978027344, -98.07000732421875, -94.21461486816406, -90.35921478271484, -86.50382995605469, -82.6484375, -78.79304504394531, -74.93765258789062, -71.08226013183594, -67.22686767578125, -63.3714714050293, -59.516075134277344, -55.660682678222656, -51.80529022216797, -47.94989776611328, -44.094505310058594, -40.23910903930664, -36.38371658325195, -32.528324127197266, -28.672929763793945, -24.817535400390625, -20.962142944335938, -17.106748580932617, -13.25135612487793, -9.395962715148926, -5.540569305419922, -1.6851768493652344, 2.170217514038086, 6.025609970092773]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 3.0, 3.0, 5.0, 4.0, 12.0, 8.0, 9.0, 9.0, 14.0, 19.0, 10.0, 23.0, 30.0, 31.0, 29.0, 43.0, 49.0, 38.0, 39.0, 36.0, 42.0, 46.0, 37.0, 38.0, 43.0, 31.0, 44.0, 27.0, 34.0, 32.0, 16.0, 23.0, 20.0, 36.0, 25.0, 15.0, 16.0, 10.0, 17.0, 7.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.577312469482422, -25.673234939575195, -24.769155502319336, -23.86507797241211, -22.961000442504883, -22.056922912597656, -21.152843475341797, -20.24876594543457, -19.344688415527344, -18.440610885620117, -17.536531448364258, -16.63245391845703, -15.728376388549805, -14.824297904968262, -13.920219421386719, -13.016141891479492, -12.112062454223633, -11.20798397064209, -10.303906440734863, -9.39982795715332, -8.495750427246094, -7.591671943664551, -6.687593460083008, -5.783515453338623, -4.879437446594238, -3.9753594398498535, -3.0712811946868896, -2.167202949523926, -1.263124942779541, -0.35904693603515625, 0.5450315475463867, 1.4491095542907715, 2.3531856536865234, 3.257263660430908, 4.161341667175293, 5.065420150756836, 5.969498157501221, 6.8735761642456055, 7.777654647827148, 8.681732177734375, 9.585810661315918, 10.489889144897461, 11.393966674804688, 12.29804515838623, 13.202123641967773, 14.106201171875, 15.010279655456543, 15.914358139038086, 16.818435668945312, 17.72251319885254, 18.6265926361084, 19.530670166015625, 20.43474769592285, 21.338825225830078, 22.242904663085938, 23.146982192993164, 24.05105972290039, 24.955137252807617, 25.859216690063477, 26.763294219970703, 27.66737174987793, 28.571449279785156, 29.475528717041016, 30.379606246948242, 31.2836856842041]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 16.0, 13.0, 10.0, 13.0, 13.0, 16.0, 23.0, 24.0, 30.0, 31.0, 40.0, 38.0, 50.0, 42.0, 45.0, 31.0, 37.0, 35.0, 40.0, 46.0, 35.0, 26.0, 25.0, 47.0, 20.0, 27.0, 34.0, 22.0, 24.0, 18.0, 23.0, 15.0, 10.0, 9.0, 14.0, 9.0, 6.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.09765625, -3.97052001953125, -3.8433837890625, -3.71624755859375, -3.589111328125, -3.46197509765625, -3.3348388671875, -3.20770263671875, -3.08056640625, -2.95343017578125, -2.8262939453125, -2.69915771484375, -2.572021484375, -2.44488525390625, -2.3177490234375, -2.19061279296875, -2.0634765625, -1.93634033203125, -1.8092041015625, -1.68206787109375, -1.554931640625, -1.42779541015625, -1.3006591796875, -1.17352294921875, -1.04638671875, -0.91925048828125, -0.7921142578125, -0.66497802734375, -0.537841796875, -0.41070556640625, -0.2835693359375, -0.15643310546875, -0.029296875, 0.09783935546875, 0.2249755859375, 0.35211181640625, 0.479248046875, 0.60638427734375, 0.7335205078125, 0.86065673828125, 0.98779296875, 1.11492919921875, 1.2420654296875, 1.36920166015625, 1.496337890625, 1.62347412109375, 1.7506103515625, 1.87774658203125, 2.0048828125, 2.13201904296875, 2.2591552734375, 2.38629150390625, 2.513427734375, 2.64056396484375, 2.7677001953125, 2.89483642578125, 3.02197265625, 3.14910888671875, 3.2762451171875, 3.40338134765625, 3.530517578125, 3.65765380859375, 3.7847900390625, 3.91192626953125, 4.0390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 9.0, 7.0, 24.0, 19.0, 33.0, 45.0, 58.0, 100.0, 115.0, 233.0, 407.0, 920.0, 2397.0, 9641.0, 53475.0, 376655.0, 1917838.0, 1533273.0, 251451.0, 36432.0, 7160.0, 2124.0, 795.0, 397.0, 178.0, 128.0, 103.0, 58.0, 43.0, 34.0, 25.0, 13.0, 15.0, 15.0, 6.0, 10.0, 6.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.671875, -8.42340087890625, -8.1749267578125, -7.92645263671875, -7.677978515625, -7.42950439453125, -7.1810302734375, -6.93255615234375, -6.68408203125, -6.43560791015625, -6.1871337890625, -5.93865966796875, -5.690185546875, -5.44171142578125, -5.1932373046875, -4.94476318359375, -4.6962890625, -4.44781494140625, -4.1993408203125, -3.95086669921875, -3.702392578125, -3.45391845703125, -3.2054443359375, -2.95697021484375, -2.70849609375, -2.46002197265625, -2.2115478515625, -1.96307373046875, -1.714599609375, -1.46612548828125, -1.2176513671875, -0.96917724609375, -0.720703125, -0.47222900390625, -0.2237548828125, 0.02471923828125, 0.273193359375, 0.52166748046875, 0.7701416015625, 1.01861572265625, 1.26708984375, 1.51556396484375, 1.7640380859375, 2.01251220703125, 2.260986328125, 2.50946044921875, 2.7579345703125, 3.00640869140625, 3.2548828125, 3.50335693359375, 3.7518310546875, 4.00030517578125, 4.248779296875, 4.49725341796875, 4.7457275390625, 4.99420166015625, 5.24267578125, 5.49114990234375, 5.7396240234375, 5.98809814453125, 6.236572265625, 6.48504638671875, 6.7335205078125, 6.98199462890625, 7.23046875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 9.0, 26.0, 21.0, 35.0, 54.0, 57.0, 78.0, 136.0, 142.0, 171.0, 231.0, 288.0, 372.0, 412.0, 391.0, 355.0, 298.0, 251.0, 164.0, 138.0, 114.0, 72.0, 63.0, 40.0, 34.0, 26.0, 12.0, 18.0, 11.0, 9.0, 3.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4375, -4.25927734375, -4.0810546875, -3.90283203125, -3.724609375, -3.54638671875, -3.3681640625, -3.18994140625, -3.01171875, -2.83349609375, -2.6552734375, -2.47705078125, -2.298828125, -2.12060546875, -1.9423828125, -1.76416015625, -1.5859375, -1.40771484375, -1.2294921875, -1.05126953125, -0.873046875, -0.69482421875, -0.5166015625, -0.33837890625, -0.16015625, 0.01806640625, 0.1962890625, 0.37451171875, 0.552734375, 0.73095703125, 0.9091796875, 1.08740234375, 1.265625, 1.44384765625, 1.6220703125, 1.80029296875, 1.978515625, 2.15673828125, 2.3349609375, 2.51318359375, 2.69140625, 2.86962890625, 3.0478515625, 3.22607421875, 3.404296875, 3.58251953125, 3.7607421875, 3.93896484375, 4.1171875, 4.29541015625, 4.4736328125, 4.65185546875, 4.830078125, 5.00830078125, 5.1865234375, 5.36474609375, 5.54296875, 5.72119140625, 5.8994140625, 6.07763671875, 6.255859375, 6.43408203125, 6.6123046875, 6.79052734375, 6.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 13.0, 14.0, 25.0, 19.0, 37.0, 47.0, 66.0, 121.0, 162.0, 283.0, 412.0, 891.0, 2650.0, 14674.0, 177628.0, 2621237.0, 1291922.0, 72737.0, 7805.0, 1732.0, 731.0, 382.0, 203.0, 155.0, 98.0, 58.0, 49.0, 38.0, 21.0, 14.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0], "bins": [-17.796875, -17.338623046875, -16.88037109375, -16.422119140625, -15.9638671875, -15.505615234375, -15.04736328125, -14.589111328125, -14.130859375, -13.672607421875, -13.21435546875, -12.756103515625, -12.2978515625, -11.839599609375, -11.38134765625, -10.923095703125, -10.46484375, -10.006591796875, -9.54833984375, -9.090087890625, -8.6318359375, -8.173583984375, -7.71533203125, -7.257080078125, -6.798828125, -6.340576171875, -5.88232421875, -5.424072265625, -4.9658203125, -4.507568359375, -4.04931640625, -3.591064453125, -3.1328125, -2.674560546875, -2.21630859375, -1.758056640625, -1.2998046875, -0.841552734375, -0.38330078125, 0.074951171875, 0.533203125, 0.991455078125, 1.44970703125, 1.907958984375, 2.3662109375, 2.824462890625, 3.28271484375, 3.740966796875, 4.19921875, 4.657470703125, 5.11572265625, 5.573974609375, 6.0322265625, 6.490478515625, 6.94873046875, 7.406982421875, 7.865234375, 8.323486328125, 8.78173828125, 9.239990234375, 9.6982421875, 10.156494140625, 10.61474609375, 11.072998046875, 11.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 19.0, 26.0, 43.0, 59.0, 88.0, 103.0, 110.0, 122.0, 105.0, 105.0, 69.0, 63.0, 38.0, 32.0, 9.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.646228790283203, -21.677724838256836, -20.7092227935791, -19.740718841552734, -18.772216796875, -17.803712844848633, -16.8352108001709, -15.866706848144531, -14.898204803466797, -13.929701805114746, -12.961198806762695, -11.992695808410645, -11.024192810058594, -10.055688858032227, -9.087186813354492, -8.118682861328125, -7.150179862976074, -6.181676864624023, -5.213173866271973, -4.244670867919922, -3.276167631149292, -2.307664394378662, -1.3391613960266113, -0.37065839767456055, 0.5978446006774902, 1.566347599029541, 2.534850597381592, 3.5033538341522217, 4.471857070922852, 5.440360069274902, 6.408863067626953, 7.377366065979004, 8.345869064331055, 9.314372062683105, 10.282875061035156, 11.251378059387207, 12.219881057739258, 13.188385009765625, 14.15688705444336, 15.125391006469727, 16.09389305114746, 17.062397003173828, 18.030899047851562, 18.99940299987793, 19.967905044555664, 20.93640899658203, 21.904911041259766, 22.873414993286133, 23.8419189453125, 24.810422897338867, 25.7789249420166, 26.74742889404297, 27.715930938720703, 28.68443489074707, 29.652936935424805, 30.621440887451172, 31.589942932128906, 32.55844497680664, 33.52695083618164, 34.495452880859375, 35.46395492553711, 36.432456970214844, 37.400962829589844, 38.36946487426758, 39.33796691894531]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 15.0, 8.0, 16.0, 21.0, 14.0, 15.0, 35.0, 29.0, 21.0, 37.0, 44.0, 37.0, 30.0, 36.0, 48.0, 47.0, 45.0, 45.0, 38.0, 44.0, 32.0, 46.0, 45.0, 33.0, 25.0, 29.0, 26.0, 27.0, 18.0, 13.0, 12.0, 12.0, 7.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.33858871459961, -20.663816452026367, -19.989044189453125, -19.314273834228516, -18.639501571655273, -17.96472930908203, -17.289958953857422, -16.61518669128418, -15.940414428710938, -15.265642166137695, -14.59087085723877, -13.916099548339844, -13.241327285766602, -12.56655502319336, -11.891783714294434, -11.217012405395508, -10.542240142822266, -9.867467880249023, -9.192696571350098, -8.517925262451172, -7.84315299987793, -7.168381214141846, -6.493609428405762, -5.818837642669678, -5.144065856933594, -4.46929407119751, -3.794522285461426, -3.119750499725342, -2.444978713989258, -1.7702069282531738, -1.0954351425170898, -0.42066335678100586, 0.2541065216064453, 0.9288783073425293, 1.6036500930786133, 2.2784218788146973, 2.9531936645507812, 3.6279654502868652, 4.302737236022949, 4.977509021759033, 5.652280807495117, 6.327052593231201, 7.001824378967285, 7.676596164703369, 8.351367950439453, 9.026140213012695, 9.700911521911621, 10.375682830810547, 11.050455093383789, 11.725227355957031, 12.399998664855957, 13.074769973754883, 13.749542236328125, 14.424314498901367, 15.099085807800293, 15.773857116699219, 16.44862937927246, 17.123401641845703, 17.798171997070312, 18.472944259643555, 19.147716522216797, 19.82248878479004, 20.49726104736328, 21.17203140258789, 21.846803665161133]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 9.0, 12.0, 9.0, 20.0, 7.0, 15.0, 18.0, 25.0, 28.0, 28.0, 31.0, 29.0, 48.0, 40.0, 39.0, 49.0, 39.0, 37.0, 45.0, 45.0, 48.0, 34.0, 26.0, 30.0, 44.0, 30.0, 22.0, 25.0, 25.0, 23.0, 19.0, 20.0, 12.0, 7.0, 10.0, 18.0, 7.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2265625, -4.09564208984375, -3.9647216796875, -3.83380126953125, -3.702880859375, -3.57196044921875, -3.4410400390625, -3.31011962890625, -3.17919921875, -3.04827880859375, -2.9173583984375, -2.78643798828125, -2.655517578125, -2.52459716796875, -2.3936767578125, -2.26275634765625, -2.1318359375, -2.00091552734375, -1.8699951171875, -1.73907470703125, -1.608154296875, -1.47723388671875, -1.3463134765625, -1.21539306640625, -1.08447265625, -0.95355224609375, -0.8226318359375, -0.69171142578125, -0.560791015625, -0.42987060546875, -0.2989501953125, -0.16802978515625, -0.037109375, 0.09381103515625, 0.2247314453125, 0.35565185546875, 0.486572265625, 0.61749267578125, 0.7484130859375, 0.87933349609375, 1.01025390625, 1.14117431640625, 1.2720947265625, 1.40301513671875, 1.533935546875, 1.66485595703125, 1.7957763671875, 1.92669677734375, 2.0576171875, 2.18853759765625, 2.3194580078125, 2.45037841796875, 2.581298828125, 2.71221923828125, 2.8431396484375, 2.97406005859375, 3.10498046875, 3.23590087890625, 3.3668212890625, 3.49774169921875, 3.628662109375, 3.75958251953125, 3.8905029296875, 4.02142333984375, 4.15234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 7.0, 13.0, 17.0, 35.0, 63.0, 103.0, 159.0, 237.0, 438.0, 759.0, 1138.0, 1986.0, 3125.0, 5260.0, 8260.0, 13336.0, 21062.0, 32900.0, 48547.0, 69617.0, 94612.0, 119413.0, 136580.0, 130123.0, 107579.0, 82851.0, 58452.0, 40285.0, 26628.0, 16995.0, 10559.0, 6853.0, 4112.0, 2479.0, 1592.0, 998.0, 551.0, 338.0, 206.0, 105.0, 62.0, 45.0, 27.0, 16.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29735374450683594, -0.2887992858886719, -0.2802448272705078, -0.27169036865234375, -0.2631359100341797, -0.2545814514160156, -0.24602699279785156, -0.2374725341796875, -0.22891807556152344, -0.22036361694335938, -0.2118091583251953, -0.20325469970703125, -0.1947002410888672, -0.18614578247070312, -0.17759132385253906, -0.169036865234375, -0.16048240661621094, -0.15192794799804688, -0.1433734893798828, -0.13481903076171875, -0.1262645721435547, -0.11771011352539062, -0.10915565490722656, -0.1006011962890625, -0.09204673767089844, -0.08349227905273438, -0.07493782043457031, -0.06638336181640625, -0.05782890319824219, -0.049274444580078125, -0.04071998596191406, -0.03216552734375, -0.023611068725585938, -0.015056610107421875, -0.0065021514892578125, 0.00205230712890625, 0.010606765747070312, 0.019161224365234375, 0.027715682983398438, 0.0362701416015625, 0.04482460021972656, 0.053379058837890625, 0.06193351745605469, 0.07048797607421875, 0.07904243469238281, 0.08759689331054688, 0.09615135192871094, 0.104705810546875, 0.11326026916503906, 0.12181472778320312, 0.1303691864013672, 0.13892364501953125, 0.1474781036376953, 0.15603256225585938, 0.16458702087402344, 0.1731414794921875, 0.18169593811035156, 0.19025039672851562, 0.1988048553466797, 0.20735931396484375, 0.2159137725830078, 0.22446823120117188, 0.23302268981933594, 0.2415771484375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 20.0, 10.0, 19.0, 18.0, 24.0, 25.0, 31.0, 27.0, 33.0, 32.0, 43.0, 41.0, 42.0, 44.0, 43.0, 1070.0, 40.0, 49.0, 33.0, 36.0, 33.0, 30.0, 36.0, 30.0, 19.0, 26.0, 23.0, 18.0, 18.0, 15.0, 11.0, 11.0, 7.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.533203125, -3.43292236328125, -3.3326416015625, -3.23236083984375, -3.132080078125, -3.03179931640625, -2.9315185546875, -2.83123779296875, -2.73095703125, -2.63067626953125, -2.5303955078125, -2.43011474609375, -2.329833984375, -2.22955322265625, -2.1292724609375, -2.02899169921875, -1.9287109375, -1.82843017578125, -1.7281494140625, -1.62786865234375, -1.527587890625, -1.42730712890625, -1.3270263671875, -1.22674560546875, -1.12646484375, -1.02618408203125, -0.9259033203125, -0.82562255859375, -0.725341796875, -0.62506103515625, -0.5247802734375, -0.42449951171875, -0.32421875, -0.22393798828125, -0.1236572265625, -0.02337646484375, 0.076904296875, 0.17718505859375, 0.2774658203125, 0.37774658203125, 0.47802734375, 0.57830810546875, 0.6785888671875, 0.77886962890625, 0.879150390625, 0.97943115234375, 1.0797119140625, 1.17999267578125, 1.2802734375, 1.38055419921875, 1.4808349609375, 1.58111572265625, 1.681396484375, 1.78167724609375, 1.8819580078125, 1.98223876953125, 2.08251953125, 2.18280029296875, 2.2830810546875, 2.38336181640625, 2.483642578125, 2.58392333984375, 2.6842041015625, 2.78448486328125, 2.884765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 12.0, 16.0, 25.0, 29.0, 69.0, 95.0, 177.0, 248.0, 412.0, 643.0, 998.0, 1489.0, 2383.0, 3914.0, 6016.0, 9481.0, 14960.0, 22820.0, 34873.0, 51548.0, 73537.0, 101677.0, 156938.0, 1075112.0, 191326.0, 107942.0, 77958.0, 55326.0, 37592.0, 25208.0, 16090.0, 10191.0, 6604.0, 4121.0, 2671.0, 1725.0, 974.0, 676.0, 434.0, 307.0, 172.0, 133.0, 69.0, 39.0, 32.0, 18.0, 15.0, 12.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14861106872558594, -0.14341354370117188, -0.1382160186767578, -0.13301849365234375, -0.1278209686279297, -0.12262344360351562, -0.11742591857910156, -0.1122283935546875, -0.10703086853027344, -0.10183334350585938, -0.09663581848144531, -0.09143829345703125, -0.08624076843261719, -0.08104324340820312, -0.07584571838378906, -0.070648193359375, -0.06545066833496094, -0.060253143310546875, -0.05505561828613281, -0.04985809326171875, -0.04466056823730469, -0.039463043212890625, -0.03426551818847656, -0.0290679931640625, -0.023870468139648438, -0.018672943115234375, -0.013475418090820312, -0.00827789306640625, -0.0030803680419921875, 0.002117156982421875, 0.0073146820068359375, 0.01251220703125, 0.017709732055664062, 0.022907257080078125, 0.028104782104492188, 0.03330230712890625, 0.03849983215332031, 0.043697357177734375, 0.04889488220214844, 0.0540924072265625, 0.05928993225097656, 0.06448745727539062, 0.06968498229980469, 0.07488250732421875, 0.08008003234863281, 0.08527755737304688, 0.09047508239746094, 0.095672607421875, 0.10087013244628906, 0.10606765747070312, 0.11126518249511719, 0.11646270751953125, 0.12166023254394531, 0.12685775756835938, 0.13205528259277344, 0.1372528076171875, 0.14245033264160156, 0.14764785766601562, 0.1528453826904297, 0.15804290771484375, 0.1632404327392578, 0.16843795776367188, 0.17363548278808594, 0.1788330078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 3.0, 8.0, 6.0, 10.0, 13.0, 13.0, 16.0, 23.0, 27.0, 36.0, 46.0, 47.0, 52.0, 53.0, 49.0, 71.0, 67.0, 60.0, 54.0, 43.0, 56.0, 49.0, 33.0, 30.0, 26.0, 26.0, 15.0, 13.0, 5.0, 5.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03466796875, -0.03354787826538086, -0.03242778778076172, -0.03130769729614258, -0.030187606811523438, -0.029067516326904297, -0.027947425842285156, -0.026827335357666016, -0.025707244873046875, -0.024587154388427734, -0.023467063903808594, -0.022346973419189453, -0.021226882934570312, -0.020106792449951172, -0.01898670196533203, -0.01786661148071289, -0.01674652099609375, -0.01562643051147461, -0.014506340026855469, -0.013386249542236328, -0.012266159057617188, -0.011146068572998047, -0.010025978088378906, -0.008905887603759766, -0.007785797119140625, -0.006665706634521484, -0.005545616149902344, -0.004425525665283203, -0.0033054351806640625, -0.002185344696044922, -0.0010652542114257812, 5.4836273193359375e-05, 0.0011749267578125, 0.0022950172424316406, 0.0034151077270507812, 0.004535198211669922, 0.0056552886962890625, 0.006775379180908203, 0.007895469665527344, 0.009015560150146484, 0.010135650634765625, 0.011255741119384766, 0.012375831604003906, 0.013495922088623047, 0.014616012573242188, 0.015736103057861328, 0.01685619354248047, 0.01797628402709961, 0.01909637451171875, 0.02021646499633789, 0.02133655548095703, 0.022456645965576172, 0.023576736450195312, 0.024696826934814453, 0.025816917419433594, 0.026937007904052734, 0.028057098388671875, 0.029177188873291016, 0.030297279357910156, 0.0314173698425293, 0.03253746032714844, 0.03365755081176758, 0.03477764129638672, 0.03589773178100586, 0.037017822265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 10.0, 8.0, 25.0, 23.0, 46.0, 46.0, 64.0, 134.0, 155.0, 294.0, 773.0, 10846.0, 1032730.0, 2207.0, 479.0, 238.0, 134.0, 80.0, 52.0, 47.0, 32.0, 20.0, 15.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.849609375, -0.82330322265625, -0.7969970703125, -0.77069091796875, -0.744384765625, -0.71807861328125, -0.6917724609375, -0.66546630859375, -0.63916015625, -0.61285400390625, -0.5865478515625, -0.56024169921875, -0.533935546875, -0.50762939453125, -0.4813232421875, -0.45501708984375, -0.4287109375, -0.40240478515625, -0.3760986328125, -0.34979248046875, -0.323486328125, -0.29718017578125, -0.2708740234375, -0.24456787109375, -0.21826171875, -0.19195556640625, -0.1656494140625, -0.13934326171875, -0.113037109375, -0.08673095703125, -0.0604248046875, -0.03411865234375, -0.0078125, 0.01849365234375, 0.0447998046875, 0.07110595703125, 0.097412109375, 0.12371826171875, 0.1500244140625, 0.17633056640625, 0.20263671875, 0.22894287109375, 0.2552490234375, 0.28155517578125, 0.307861328125, 0.33416748046875, 0.3604736328125, 0.38677978515625, 0.4130859375, 0.43939208984375, 0.4656982421875, 0.49200439453125, 0.518310546875, 0.54461669921875, 0.5709228515625, 0.59722900390625, 0.62353515625, 0.64984130859375, 0.6761474609375, 0.70245361328125, 0.728759765625, 0.75506591796875, 0.7813720703125, 0.80767822265625, 0.833984375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 13.0, 86.0, 840.0, 69.0, 4.0], "bins": [-0.8456180095672607, -0.8318808674812317, -0.8181437849998474, -0.8044066429138184, -0.7906695604324341, -0.776932418346405, -0.763195276260376, -0.7494581937789917, -0.7357210516929626, -0.7219839096069336, -0.7082468271255493, -0.6945096850395203, -0.680772602558136, -0.6670354604721069, -0.6532983183860779, -0.6395612359046936, -0.6258240938186646, -0.6120869517326355, -0.5983498692512512, -0.5846127271652222, -0.5708756446838379, -0.5571385025978088, -0.5434013605117798, -0.5296642780303955, -0.5159271359443665, -0.5021899938583374, -0.4884529113769531, -0.4747157692909241, -0.4609786570072174, -0.44724154472351074, -0.4335044324398041, -0.4197673201560974, -0.40603023767471313, -0.39229312539100647, -0.3785560131072998, -0.36481887102127075, -0.3510817587375641, -0.3373446464538574, -0.32360753417015076, -0.3098704218864441, -0.29613327980041504, -0.2823961675167084, -0.2686590552330017, -0.25492191314697266, -0.241184800863266, -0.22744768857955933, -0.21371057629585266, -0.1999734491109848, -0.18623632192611694, -0.17249920964241028, -0.15876208245754242, -0.14502497017383575, -0.1312878429889679, -0.11755073070526123, -0.10381361097097397, -0.0900764912366867, -0.07633937150239944, -0.06260225176811218, -0.04886513203382492, -0.03512801602482796, -0.021390896290540695, -0.007653780281543732, 0.00608333945274353, 0.019820459187030792, 0.033557578921318054]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 8.0, 9.0, 7.0, 9.0, 18.0, 10.0, 19.0, 14.0, 23.0, 17.0, 36.0, 37.0, 25.0, 43.0, 32.0, 46.0, 44.0, 48.0, 48.0, 35.0, 53.0, 30.0, 40.0, 38.0, 38.0, 38.0, 29.0, 29.0, 25.0, 21.0, 20.0, 11.0, 12.0, 18.0, 11.0, 12.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09909456968307495, -0.09594019502401352, -0.09278582036495209, -0.08963144570589066, -0.08647707104682922, -0.0833226889371872, -0.08016831427812576, -0.07701393961906433, -0.0738595649600029, -0.07070519030094147, -0.06755081564188004, -0.0643964409828186, -0.06124206259846687, -0.05808768793940544, -0.05493330955505371, -0.05177893489599228, -0.04862456023693085, -0.045470185577869415, -0.04231581091880798, -0.03916143253445625, -0.03600705787539482, -0.03285268321633339, -0.029698306694626808, -0.026543930172920227, -0.023389555513858795, -0.020235180854797363, -0.017080804333090782, -0.013926428742706776, -0.01077205315232277, -0.007617678493261337, -0.004463301971554756, -0.001308925449848175, 0.0018454492092132568, 0.004999824799597263, 0.00815420038998127, 0.011308575980365276, 0.014462951570749283, 0.017617326229810715, 0.020771702751517296, 0.023926079273223877, 0.02708045393228531, 0.03023482859134674, 0.03338920325040817, 0.0365435816347599, 0.039697956293821335, 0.04285233095288277, 0.0460067093372345, 0.04916108399629593, 0.05231545865535736, 0.05546983331441879, 0.058624207973480225, 0.061778586357831955, 0.06493295729160309, 0.06808733940124512, 0.07124171406030655, 0.07439608871936798, 0.07755046337842941, 0.08070483803749084, 0.08385921269655228, 0.08701358735561371, 0.09016796946525574, 0.09332233667373657, 0.0964767187833786, 0.09963109344244003, 0.10278546810150146]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 6.0, 7.0, 10.0, 16.0, 16.0, 21.0, 20.0, 28.0, 20.0, 25.0, 33.0, 46.0, 35.0, 48.0, 55.0, 37.0, 44.0, 43.0, 34.0, 42.0, 41.0, 34.0, 50.0, 29.0, 30.0, 22.0, 33.0, 31.0, 14.0, 16.0, 18.0, 19.0, 13.0, 9.0, 8.0, 8.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.55078125, -4.416259765625, -4.28173828125, -4.147216796875, -4.0126953125, -3.878173828125, -3.74365234375, -3.609130859375, -3.474609375, -3.340087890625, -3.20556640625, -3.071044921875, -2.9365234375, -2.802001953125, -2.66748046875, -2.532958984375, -2.3984375, -2.263916015625, -2.12939453125, -1.994873046875, -1.8603515625, -1.725830078125, -1.59130859375, -1.456787109375, -1.322265625, -1.187744140625, -1.05322265625, -0.918701171875, -0.7841796875, -0.649658203125, -0.51513671875, -0.380615234375, -0.24609375, -0.111572265625, 0.02294921875, 0.157470703125, 0.2919921875, 0.426513671875, 0.56103515625, 0.695556640625, 0.830078125, 0.964599609375, 1.09912109375, 1.233642578125, 1.3681640625, 1.502685546875, 1.63720703125, 1.771728515625, 1.90625, 2.040771484375, 2.17529296875, 2.309814453125, 2.4443359375, 2.578857421875, 2.71337890625, 2.847900390625, 2.982421875, 3.116943359375, 3.25146484375, 3.385986328125, 3.5205078125, 3.655029296875, 3.78955078125, 3.924072265625, 4.05859375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 9.0, 6.0, 9.0, 19.0, 18.0, 18.0, 30.0, 44.0, 61.0, 93.0, 105.0, 159.0, 257.0, 411.0, 819.0, 1796.0, 4009.0, 10497.0, 28659.0, 120561.0, 630496.0, 191023.0, 36921.0, 13010.0, 5096.0, 2155.0, 936.0, 441.0, 279.0, 157.0, 116.0, 77.0, 74.0, 40.0, 31.0, 30.0, 28.0, 17.0, 15.0, 12.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.41387939453125, -8.1558837890625, -7.89788818359375, -7.639892578125, -7.38189697265625, -7.1239013671875, -6.86590576171875, -6.60791015625, -6.34991455078125, -6.0919189453125, -5.83392333984375, -5.575927734375, -5.31793212890625, -5.0599365234375, -4.80194091796875, -4.5439453125, -4.28594970703125, -4.0279541015625, -3.76995849609375, -3.511962890625, -3.25396728515625, -2.9959716796875, -2.73797607421875, -2.47998046875, -2.22198486328125, -1.9639892578125, -1.70599365234375, -1.447998046875, -1.19000244140625, -0.9320068359375, -0.67401123046875, -0.416015625, -0.15802001953125, 0.0999755859375, 0.35797119140625, 0.615966796875, 0.87396240234375, 1.1319580078125, 1.38995361328125, 1.64794921875, 1.90594482421875, 2.1639404296875, 2.42193603515625, 2.679931640625, 2.93792724609375, 3.1959228515625, 3.45391845703125, 3.7119140625, 3.96990966796875, 4.2279052734375, 4.48590087890625, 4.743896484375, 5.00189208984375, 5.2598876953125, 5.51788330078125, 5.77587890625, 6.03387451171875, 6.2918701171875, 6.54986572265625, 6.807861328125, 7.06585693359375, 7.3238525390625, 7.58184814453125, 7.83984375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 9.0, 9.0, 13.0, 11.0, 23.0, 18.0, 21.0, 37.0, 41.0, 28.0, 38.0, 30.0, 34.0, 44.0, 70.0, 159.0, 390.0, 1425.0, 171.0, 69.0, 45.0, 58.0, 33.0, 43.0, 35.0, 14.0, 24.0, 23.0, 15.0, 20.0, 13.0, 12.0, 13.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-11.90625, -11.546142578125, -11.18603515625, -10.825927734375, -10.4658203125, -10.105712890625, -9.74560546875, -9.385498046875, -9.025390625, -8.665283203125, -8.30517578125, -7.945068359375, -7.5849609375, -7.224853515625, -6.86474609375, -6.504638671875, -6.14453125, -5.784423828125, -5.42431640625, -5.064208984375, -4.7041015625, -4.343994140625, -3.98388671875, -3.623779296875, -3.263671875, -2.903564453125, -2.54345703125, -2.183349609375, -1.8232421875, -1.463134765625, -1.10302734375, -0.742919921875, -0.3828125, -0.022705078125, 0.33740234375, 0.697509765625, 1.0576171875, 1.417724609375, 1.77783203125, 2.137939453125, 2.498046875, 2.858154296875, 3.21826171875, 3.578369140625, 3.9384765625, 4.298583984375, 4.65869140625, 5.018798828125, 5.37890625, 5.739013671875, 6.09912109375, 6.459228515625, 6.8193359375, 7.179443359375, 7.53955078125, 7.899658203125, 8.259765625, 8.619873046875, 8.97998046875, 9.340087890625, 9.7001953125, 10.060302734375, 10.42041015625, 10.780517578125, 11.140625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 16.0, 18.0, 16.0, 25.0, 34.0, 35.0, 67.0, 61.0, 118.0, 168.0, 289.0, 653.0, 3362.0, 45376.0, 2954966.0, 132537.0, 6041.0, 851.0, 355.0, 157.0, 139.0, 89.0, 76.0, 42.0, 40.0, 32.0, 27.0, 18.0, 16.0, 9.0, 15.0, 10.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.252197265625, -17.56689453125, -16.881591796875, -16.1962890625, -15.510986328125, -14.82568359375, -14.140380859375, -13.455078125, -12.769775390625, -12.08447265625, -11.399169921875, -10.7138671875, -10.028564453125, -9.34326171875, -8.657958984375, -7.97265625, -7.287353515625, -6.60205078125, -5.916748046875, -5.2314453125, -4.546142578125, -3.86083984375, -3.175537109375, -2.490234375, -1.804931640625, -1.11962890625, -0.434326171875, 0.2509765625, 0.936279296875, 1.62158203125, 2.306884765625, 2.9921875, 3.677490234375, 4.36279296875, 5.048095703125, 5.7333984375, 6.418701171875, 7.10400390625, 7.789306640625, 8.474609375, 9.159912109375, 9.84521484375, 10.530517578125, 11.2158203125, 11.901123046875, 12.58642578125, 13.271728515625, 13.95703125, 14.642333984375, 15.32763671875, 16.012939453125, 16.6982421875, 17.383544921875, 18.06884765625, 18.754150390625, 19.439453125, 20.124755859375, 20.81005859375, 21.495361328125, 22.1806640625, 22.865966796875, 23.55126953125, 24.236572265625, 24.921875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 9.0, 81.0, 200.0, 333.0, 249.0, 110.0, 30.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.555974006652832, -7.284080982208252, -6.012187957763672, -4.74029541015625, -3.46840238571167, -2.19650936126709, -0.924616813659668, 0.3472766876220703, 1.6191692352294922, 2.8910622596740723, 4.162955284118652, 5.434847831726074, 6.706740856170654, 7.978633880615234, 9.250526428222656, 10.522419929504395, 11.794312477111816, 13.066205024719238, 14.338098526000977, 15.609991073608398, 16.88188362121582, 18.153778076171875, 19.425670623779297, 20.69756317138672, 21.96945571899414, 23.241348266601562, 24.513240814208984, 25.785133361816406, 27.05702781677246, 28.328920364379883, 29.600812911987305, 30.87270736694336, 32.144596099853516, 33.41648864746094, 34.68838119506836, 35.96027374267578, 37.2321662902832, 38.504058837890625, 39.77595520019531, 41.047847747802734, 42.319740295410156, 43.59163284301758, 44.863525390625, 46.13541793823242, 47.407310485839844, 48.67920684814453, 49.95109558105469, 51.222991943359375, 52.49488067626953, 53.76677322387695, 55.038665771484375, 56.3105583190918, 57.58245086669922, 58.854347229003906, 60.12623596191406, 61.39813232421875, 62.67002487182617, 63.941917419433594, 65.21381378173828, 66.48570251464844, 67.75759887695312, 69.02948760986328, 70.30138397216797, 71.57327270507812, 72.84516906738281]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 1.0, 7.0, 6.0, 9.0, 16.0, 16.0, 13.0, 24.0, 17.0, 21.0, 38.0, 20.0, 46.0, 32.0, 33.0, 29.0, 34.0, 38.0, 44.0, 35.0, 39.0, 39.0, 46.0, 59.0, 48.0, 31.0, 33.0, 32.0, 29.0, 31.0, 19.0, 16.0, 22.0, 18.0, 13.0, 5.0, 7.0, 8.0, 1.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.792509078979492, -26.926511764526367, -26.06051254272461, -25.194515228271484, -24.328516006469727, -23.4625186920166, -22.596519470214844, -21.73052215576172, -20.864524841308594, -19.99852752685547, -19.13252830505371, -18.266530990600586, -17.400531768798828, -16.534534454345703, -15.668536186218262, -14.80253791809082, -13.936538696289062, -13.070540428161621, -12.20454216003418, -11.338544845581055, -10.472545623779297, -9.606548309326172, -8.74055004119873, -7.874551773071289, -7.008553504943848, -6.142555236816406, -5.276556968688965, -4.410559177398682, -3.5445609092712402, -2.678562641143799, -1.8125648498535156, -0.9465665817260742, -0.08056640625, 0.7854317426681519, 1.6514298915863037, 2.517427921295166, 3.3834261894226074, 4.249424457550049, 5.115422248840332, 5.981420516967773, 6.847418785095215, 7.713417053222656, 8.579415321350098, 9.445413589477539, 10.311410903930664, 11.177410125732422, 12.043407440185547, 12.909405708312988, 13.77540397644043, 14.641402244567871, 15.507400512695312, 16.373397827148438, 17.239397048950195, 18.10539436340332, 18.971393585205078, 19.837390899658203, 20.703388214111328, 21.569385528564453, 22.43538475036621, 23.301382064819336, 24.167381286621094, 25.03337860107422, 25.899375915527344, 26.7653751373291, 27.63137435913086]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 8.0, 11.0, 9.0, 17.0, 17.0, 13.0, 16.0, 15.0, 24.0, 31.0, 30.0, 42.0, 36.0, 38.0, 51.0, 42.0, 48.0, 48.0, 61.0, 42.0, 48.0, 41.0, 42.0, 28.0, 28.0, 26.0, 25.0, 29.0, 24.0, 22.0, 25.0, 16.0, 8.0, 9.0, 7.0, 15.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.59381103515625, -4.4454345703125, -4.29705810546875, -4.148681640625, -4.00030517578125, -3.8519287109375, -3.70355224609375, -3.55517578125, -3.40679931640625, -3.2584228515625, -3.11004638671875, -2.961669921875, -2.81329345703125, -2.6649169921875, -2.51654052734375, -2.3681640625, -2.21978759765625, -2.0714111328125, -1.92303466796875, -1.774658203125, -1.62628173828125, -1.4779052734375, -1.32952880859375, -1.18115234375, -1.03277587890625, -0.8843994140625, -0.73602294921875, -0.587646484375, -0.43927001953125, -0.2908935546875, -0.14251708984375, 0.005859375, 0.15423583984375, 0.3026123046875, 0.45098876953125, 0.599365234375, 0.74774169921875, 0.8961181640625, 1.04449462890625, 1.19287109375, 1.34124755859375, 1.4896240234375, 1.63800048828125, 1.786376953125, 1.93475341796875, 2.0831298828125, 2.23150634765625, 2.3798828125, 2.52825927734375, 2.6766357421875, 2.82501220703125, 2.973388671875, 3.12176513671875, 3.2701416015625, 3.41851806640625, 3.56689453125, 3.71527099609375, 3.8636474609375, 4.01202392578125, 4.160400390625, 4.30877685546875, 4.4571533203125, 4.60552978515625, 4.75390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 11.0, 8.0, 16.0, 17.0, 17.0, 26.0, 41.0, 71.0, 91.0, 140.0, 255.0, 559.0, 1470.0, 5208.0, 27734.0, 213102.0, 1525073.0, 2029175.0, 338399.0, 41996.0, 7307.0, 2021.0, 683.0, 316.0, 198.0, 100.0, 65.0, 48.0, 30.0, 26.0, 18.0, 18.0, 12.0, 9.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.83251953125, -7.5634765625, -7.29443359375, -7.025390625, -6.75634765625, -6.4873046875, -6.21826171875, -5.94921875, -5.68017578125, -5.4111328125, -5.14208984375, -4.873046875, -4.60400390625, -4.3349609375, -4.06591796875, -3.796875, -3.52783203125, -3.2587890625, -2.98974609375, -2.720703125, -2.45166015625, -2.1826171875, -1.91357421875, -1.64453125, -1.37548828125, -1.1064453125, -0.83740234375, -0.568359375, -0.29931640625, -0.0302734375, 0.23876953125, 0.5078125, 0.77685546875, 1.0458984375, 1.31494140625, 1.583984375, 1.85302734375, 2.1220703125, 2.39111328125, 2.66015625, 2.92919921875, 3.1982421875, 3.46728515625, 3.736328125, 4.00537109375, 4.2744140625, 4.54345703125, 4.8125, 5.08154296875, 5.3505859375, 5.61962890625, 5.888671875, 6.15771484375, 6.4267578125, 6.69580078125, 6.96484375, 7.23388671875, 7.5029296875, 7.77197265625, 8.041015625, 8.31005859375, 8.5791015625, 8.84814453125, 9.1171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 11.0, 10.0, 19.0, 33.0, 44.0, 44.0, 94.0, 101.0, 141.0, 188.0, 242.0, 324.0, 360.0, 434.0, 409.0, 359.0, 289.0, 245.0, 174.0, 142.0, 88.0, 86.0, 71.0, 36.0, 33.0, 27.0, 12.0, 11.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.54443359375, -4.3623046875, -4.18017578125, -3.998046875, -3.81591796875, -3.6337890625, -3.45166015625, -3.26953125, -3.08740234375, -2.9052734375, -2.72314453125, -2.541015625, -2.35888671875, -2.1767578125, -1.99462890625, -1.8125, -1.63037109375, -1.4482421875, -1.26611328125, -1.083984375, -0.90185546875, -0.7197265625, -0.53759765625, -0.35546875, -0.17333984375, 0.0087890625, 0.19091796875, 0.373046875, 0.55517578125, 0.7373046875, 0.91943359375, 1.1015625, 1.28369140625, 1.4658203125, 1.64794921875, 1.830078125, 2.01220703125, 2.1943359375, 2.37646484375, 2.55859375, 2.74072265625, 2.9228515625, 3.10498046875, 3.287109375, 3.46923828125, 3.6513671875, 3.83349609375, 4.015625, 4.19775390625, 4.3798828125, 4.56201171875, 4.744140625, 4.92626953125, 5.1083984375, 5.29052734375, 5.47265625, 5.65478515625, 5.8369140625, 6.01904296875, 6.201171875, 6.38330078125, 6.5654296875, 6.74755859375, 6.9296875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 12.0, 6.0, 8.0, 17.0, 15.0, 34.0, 42.0, 78.0, 101.0, 172.0, 262.0, 440.0, 877.0, 2993.0, 23802.0, 476047.0, 3338901.0, 328032.0, 18111.0, 2444.0, 810.0, 408.0, 222.0, 148.0, 90.0, 71.0, 49.0, 24.0, 20.0, 14.0, 8.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-20.078125, -19.569091796875, -19.06005859375, -18.551025390625, -18.0419921875, -17.532958984375, -17.02392578125, -16.514892578125, -16.005859375, -15.496826171875, -14.98779296875, -14.478759765625, -13.9697265625, -13.460693359375, -12.95166015625, -12.442626953125, -11.93359375, -11.424560546875, -10.91552734375, -10.406494140625, -9.8974609375, -9.388427734375, -8.87939453125, -8.370361328125, -7.861328125, -7.352294921875, -6.84326171875, -6.334228515625, -5.8251953125, -5.316162109375, -4.80712890625, -4.298095703125, -3.7890625, -3.280029296875, -2.77099609375, -2.261962890625, -1.7529296875, -1.243896484375, -0.73486328125, -0.225830078125, 0.283203125, 0.792236328125, 1.30126953125, 1.810302734375, 2.3193359375, 2.828369140625, 3.33740234375, 3.846435546875, 4.35546875, 4.864501953125, 5.37353515625, 5.882568359375, 6.3916015625, 6.900634765625, 7.40966796875, 7.918701171875, 8.427734375, 8.936767578125, 9.44580078125, 9.954833984375, 10.4638671875, 10.972900390625, 11.48193359375, 11.990966796875, 12.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 15.0, 35.0, 69.0, 86.0, 140.0, 159.0, 156.0, 141.0, 93.0, 48.0, 30.0, 19.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.67111587524414, -9.483283042907715, -8.295450210571289, -7.10761833190918, -5.919785499572754, -4.731952667236328, -3.5441203117370605, -2.356287956237793, -1.1684551239013672, 0.019377470016479492, 1.2072100639343262, 2.395042657852173, 3.5828752517700195, 4.770708084106445, 5.958540439605713, 7.1463727951049805, 8.334205627441406, 9.522038459777832, 10.709871292114258, 11.897703170776367, 13.085536003112793, 14.273368835449219, 15.461200714111328, 16.649032592773438, 17.83686637878418, 19.02469825744629, 20.21253204345703, 21.40036392211914, 22.58819580078125, 23.776029586791992, 24.9638614654541, 26.151695251464844, 27.339523315429688, 28.527355194091797, 29.71518898010254, 30.90302085876465, 32.09085464477539, 33.2786865234375, 34.46651840209961, 35.65435028076172, 36.842185974121094, 38.0300178527832, 39.21784973144531, 40.40568542480469, 41.5935173034668, 42.781349182128906, 43.969181060791016, 45.157012939453125, 46.344844818115234, 47.532676696777344, 48.72050857543945, 49.90834426879883, 51.09617614746094, 52.28400802612305, 53.471839904785156, 54.659671783447266, 55.847503662109375, 57.035335540771484, 58.223167419433594, 59.41100311279297, 60.59883499145508, 61.78666687011719, 62.9744987487793, 64.1623306274414, 65.35016632080078]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 2.0, 6.0, 2.0, 7.0, 13.0, 14.0, 17.0, 17.0, 22.0, 30.0, 28.0, 20.0, 36.0, 40.0, 36.0, 41.0, 35.0, 38.0, 44.0, 39.0, 37.0, 37.0, 39.0, 32.0, 31.0, 34.0, 31.0, 40.0, 36.0, 25.0, 27.0, 25.0, 13.0, 15.0, 10.0, 13.0, 10.0, 11.0, 7.0, 8.0, 6.0, 7.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.68697166442871, -19.07669448852539, -18.46641731262207, -17.85614013671875, -17.24586296081543, -16.63558578491211, -16.02530860900879, -15.415030479431152, -14.804753303527832, -14.194476127624512, -13.584198951721191, -12.973921775817871, -12.363643646240234, -11.753366470336914, -11.143089294433594, -10.532812118530273, -9.922534942626953, -9.312257766723633, -8.701980590820312, -8.091703414916992, -7.481425762176514, -6.871148586273193, -6.260870933532715, -5.6505937576293945, -5.040316581726074, -4.430039405822754, -3.8197619915008545, -3.209484577178955, -2.5992074012756348, -1.9889302253723145, -1.378652811050415, -0.7683753967285156, -0.1580963134765625, 0.45218098163604736, 1.0624582767486572, 1.672735571861267, 2.283012866973877, 2.8932900428771973, 3.5035674571990967, 4.113844871520996, 4.724122047424316, 5.334399223327637, 5.944676399230957, 6.5549540519714355, 7.165231227874756, 7.775508403778076, 8.385786056518555, 8.996063232421875, 9.606340408325195, 10.216617584228516, 10.826894760131836, 11.437171936035156, 12.047449111938477, 12.657726287841797, 13.268004417419434, 13.878281593322754, 14.488558769226074, 15.098835945129395, 15.709113121032715, 16.31939125061035, 16.929668426513672, 17.539945602416992, 18.150222778320312, 18.760499954223633, 19.370777130126953]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 7.0, 13.0, 16.0, 17.0, 18.0, 25.0, 30.0, 24.0, 22.0, 28.0, 27.0, 36.0, 46.0, 44.0, 44.0, 29.0, 46.0, 45.0, 49.0, 47.0, 41.0, 37.0, 40.0, 21.0, 33.0, 32.0, 16.0, 23.0, 22.0, 16.0, 16.0, 8.0, 14.0, 16.0, 6.0, 9.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.97662353515625, -3.8399658203125, -3.70330810546875, -3.566650390625, -3.42999267578125, -3.2933349609375, -3.15667724609375, -3.02001953125, -2.88336181640625, -2.7467041015625, -2.61004638671875, -2.473388671875, -2.33673095703125, -2.2000732421875, -2.06341552734375, -1.9267578125, -1.79010009765625, -1.6534423828125, -1.51678466796875, -1.380126953125, -1.24346923828125, -1.1068115234375, -0.97015380859375, -0.83349609375, -0.69683837890625, -0.5601806640625, -0.42352294921875, -0.286865234375, -0.15020751953125, -0.0135498046875, 0.12310791015625, 0.259765625, 0.39642333984375, 0.5330810546875, 0.66973876953125, 0.806396484375, 0.94305419921875, 1.0797119140625, 1.21636962890625, 1.35302734375, 1.48968505859375, 1.6263427734375, 1.76300048828125, 1.899658203125, 2.03631591796875, 2.1729736328125, 2.30963134765625, 2.4462890625, 2.58294677734375, 2.7196044921875, 2.85626220703125, 2.992919921875, 3.12957763671875, 3.2662353515625, 3.40289306640625, 3.53955078125, 3.67620849609375, 3.8128662109375, 3.94952392578125, 4.086181640625, 4.22283935546875, 4.3594970703125, 4.49615478515625, 4.6328125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 8.0, 12.0, 11.0, 36.0, 44.0, 66.0, 105.0, 177.0, 266.0, 459.0, 730.0, 1158.0, 1857.0, 2860.0, 4322.0, 6795.0, 10522.0, 16155.0, 24350.0, 36406.0, 52285.0, 72919.0, 95924.0, 118611.0, 129486.0, 121565.0, 100520.0, 77757.0, 56811.0, 39419.0, 26693.0, 17735.0, 11641.0, 7458.0, 4835.0, 3231.0, 2008.0, 1245.0, 754.0, 476.0, 310.0, 210.0, 120.0, 73.0, 50.0, 28.0, 21.0, 15.0, 17.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24967002868652344, -0.24177169799804688, -0.2338733673095703, -0.22597503662109375, -0.2180767059326172, -0.21017837524414062, -0.20228004455566406, -0.1943817138671875, -0.18648338317871094, -0.17858505249023438, -0.1706867218017578, -0.16278839111328125, -0.1548900604248047, -0.14699172973632812, -0.13909339904785156, -0.131195068359375, -0.12329673767089844, -0.11539840698242188, -0.10750007629394531, -0.09960174560546875, -0.09170341491699219, -0.08380508422851562, -0.07590675354003906, -0.0680084228515625, -0.06011009216308594, -0.052211761474609375, -0.04431343078613281, -0.03641510009765625, -0.028516769409179688, -0.020618438720703125, -0.012720108032226562, -0.00482177734375, 0.0030765533447265625, 0.010974884033203125, 0.018873214721679688, 0.02677154541015625, 0.03466987609863281, 0.042568206787109375, 0.05046653747558594, 0.0583648681640625, 0.06626319885253906, 0.07416152954101562, 0.08205986022949219, 0.08995819091796875, 0.09785652160644531, 0.10575485229492188, 0.11365318298339844, 0.121551513671875, 0.12944984436035156, 0.13734817504882812, 0.1452465057373047, 0.15314483642578125, 0.1610431671142578, 0.16894149780273438, 0.17683982849121094, 0.1847381591796875, 0.19263648986816406, 0.20053482055664062, 0.2084331512451172, 0.21633148193359375, 0.2242298126220703, 0.23212814331054688, 0.24002647399902344, 0.2479248046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 15.0, 10.0, 13.0, 22.0, 18.0, 27.0, 17.0, 23.0, 31.0, 34.0, 39.0, 37.0, 41.0, 43.0, 42.0, 48.0, 1064.0, 42.0, 42.0, 39.0, 43.0, 38.0, 31.0, 34.0, 25.0, 22.0, 25.0, 17.0, 24.0, 21.0, 15.0, 9.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.806640625, -2.714080810546875, -2.62152099609375, -2.528961181640625, -2.4364013671875, -2.343841552734375, -2.25128173828125, -2.158721923828125, -2.066162109375, -1.973602294921875, -1.88104248046875, -1.788482666015625, -1.6959228515625, -1.603363037109375, -1.51080322265625, -1.418243408203125, -1.32568359375, -1.233123779296875, -1.14056396484375, -1.048004150390625, -0.9554443359375, -0.862884521484375, -0.77032470703125, -0.677764892578125, -0.585205078125, -0.492645263671875, -0.40008544921875, -0.307525634765625, -0.2149658203125, -0.122406005859375, -0.02984619140625, 0.062713623046875, 0.1552734375, 0.247833251953125, 0.34039306640625, 0.432952880859375, 0.5255126953125, 0.618072509765625, 0.71063232421875, 0.803192138671875, 0.895751953125, 0.988311767578125, 1.08087158203125, 1.173431396484375, 1.2659912109375, 1.358551025390625, 1.45111083984375, 1.543670654296875, 1.63623046875, 1.728790283203125, 1.82135009765625, 1.913909912109375, 2.0064697265625, 2.099029541015625, 2.19158935546875, 2.284149169921875, 2.376708984375, 2.469268798828125, 2.56182861328125, 2.654388427734375, 2.7469482421875, 2.839508056640625, 2.93206787109375, 3.024627685546875, 3.1171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 9.0, 16.0, 32.0, 46.0, 83.0, 108.0, 190.0, 271.0, 402.0, 657.0, 965.0, 1592.0, 2444.0, 3640.0, 5668.0, 8900.0, 13524.0, 20541.0, 30229.0, 44036.0, 61924.0, 83802.0, 107663.0, 299296.0, 986645.0, 117011.0, 90004.0, 68127.0, 48706.0, 33847.0, 23270.0, 14935.0, 10017.0, 6595.0, 4170.0, 2781.0, 1745.0, 1159.0, 701.0, 478.0, 315.0, 206.0, 137.0, 96.0, 56.0, 32.0, 23.0, 15.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.14599609375, -0.14115333557128906, -0.13631057739257812, -0.1314678192138672, -0.12662506103515625, -0.12178230285644531, -0.11693954467773438, -0.11209678649902344, -0.1072540283203125, -0.10241127014160156, -0.09756851196289062, -0.09272575378417969, -0.08788299560546875, -0.08304023742675781, -0.07819747924804688, -0.07335472106933594, -0.068511962890625, -0.06366920471191406, -0.058826446533203125, -0.05398368835449219, -0.04914093017578125, -0.04429817199707031, -0.039455413818359375, -0.03461265563964844, -0.0297698974609375, -0.024927139282226562, -0.020084381103515625, -0.015241622924804688, -0.01039886474609375, -0.0055561065673828125, -0.000713348388671875, 0.0041294097900390625, 0.00897216796875, 0.013814926147460938, 0.018657684326171875, 0.023500442504882812, 0.02834320068359375, 0.03318595886230469, 0.038028717041015625, 0.04287147521972656, 0.0477142333984375, 0.05255699157714844, 0.057399749755859375, 0.06224250793457031, 0.06708526611328125, 0.07192802429199219, 0.07677078247070312, 0.08161354064941406, 0.086456298828125, 0.09129905700683594, 0.09614181518554688, 0.10098457336425781, 0.10582733154296875, 0.11067008972167969, 0.11551284790039062, 0.12035560607910156, 0.1251983642578125, 0.13004112243652344, 0.13488388061523438, 0.1397266387939453, 0.14456939697265625, 0.1494121551513672, 0.15425491333007812, 0.15909767150878906, 0.1639404296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 13.0, 10.0, 6.0, 14.0, 16.0, 22.0, 22.0, 39.0, 34.0, 42.0, 53.0, 58.0, 69.0, 56.0, 43.0, 58.0, 69.0, 62.0, 45.0, 39.0, 33.0, 34.0, 30.0, 24.0, 17.0, 12.0, 11.0, 12.0, 5.0, 9.0, 3.0, 5.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.020477294921875, -0.01980876922607422, -0.019140243530273438, -0.018471717834472656, -0.017803192138671875, -0.017134666442871094, -0.016466140747070312, -0.01579761505126953, -0.01512908935546875, -0.014460563659667969, -0.013792037963867188, -0.013123512268066406, -0.012454986572265625, -0.011786460876464844, -0.011117935180664062, -0.010449409484863281, -0.0097808837890625, -0.009112358093261719, -0.008443832397460938, -0.007775306701660156, -0.007106781005859375, -0.006438255310058594, -0.0057697296142578125, -0.005101203918457031, -0.00443267822265625, -0.0037641525268554688, -0.0030956268310546875, -0.0024271011352539062, -0.001758575439453125, -0.0010900497436523438, -0.0004215240478515625, 0.00024700164794921875, 0.00091552734375, 0.0015840530395507812, 0.0022525787353515625, 0.0029211044311523438, 0.003589630126953125, 0.004258155822753906, 0.0049266815185546875, 0.005595207214355469, 0.00626373291015625, 0.006932258605957031, 0.0076007843017578125, 0.008269309997558594, 0.008937835693359375, 0.009606361389160156, 0.010274887084960938, 0.010943412780761719, 0.0116119384765625, 0.012280464172363281, 0.012948989868164062, 0.013617515563964844, 0.014286041259765625, 0.014954566955566406, 0.015623092651367188, 0.01629161834716797, 0.01696014404296875, 0.01762866973876953, 0.018297195434570312, 0.018965721130371094, 0.019634246826171875, 0.020302772521972656, 0.020971298217773438, 0.02163982391357422, 0.022308349609375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 10.0, 7.0, 8.0, 13.0, 14.0, 12.0, 26.0, 26.0, 47.0, 52.0, 66.0, 104.0, 175.0, 271.0, 609.0, 7328.0, 1036314.0, 2152.0, 509.0, 259.0, 150.0, 91.0, 67.0, 51.0, 36.0, 33.0, 20.0, 9.0, 12.0, 13.0, 10.0, 10.0, 8.0, 2.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.496826171875, -0.48194122314453125, -0.4670562744140625, -0.45217132568359375, -0.437286376953125, -0.42240142822265625, -0.4075164794921875, -0.39263153076171875, -0.37774658203125, -0.36286163330078125, -0.3479766845703125, -0.33309173583984375, -0.318206787109375, -0.30332183837890625, -0.2884368896484375, -0.27355194091796875, -0.2586669921875, -0.24378204345703125, -0.2288970947265625, -0.21401214599609375, -0.199127197265625, -0.18424224853515625, -0.1693572998046875, -0.15447235107421875, -0.13958740234375, -0.12470245361328125, -0.1098175048828125, -0.09493255615234375, -0.080047607421875, -0.06516265869140625, -0.0502777099609375, -0.03539276123046875, -0.0205078125, -0.00562286376953125, 0.0092620849609375, 0.02414703369140625, 0.039031982421875, 0.05391693115234375, 0.0688018798828125, 0.08368682861328125, 0.09857177734375, 0.11345672607421875, 0.1283416748046875, 0.14322662353515625, 0.158111572265625, 0.17299652099609375, 0.1878814697265625, 0.20276641845703125, 0.2176513671875, 0.23253631591796875, 0.2474212646484375, 0.26230621337890625, 0.277191162109375, 0.29207611083984375, 0.3069610595703125, 0.32184600830078125, 0.33673095703125, 0.35161590576171875, 0.3665008544921875, 0.38138580322265625, 0.396270751953125, 0.41115570068359375, 0.4260406494140625, 0.44092559814453125, 0.455810546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 49.0, 846.0, 106.0, 7.0, 3.0], "bins": [-0.6190749406814575, -0.6088619828224182, -0.5986490249633789, -0.5884360671043396, -0.5782230496406555, -0.5680100917816162, -0.5577971339225769, -0.5475841760635376, -0.5373712182044983, -0.527158260345459, -0.5169453024864197, -0.5067323446273804, -0.4965193569660187, -0.486306369304657, -0.4760934114456177, -0.46588045358657837, -0.4556674659252167, -0.44545450806617737, -0.4352415204048157, -0.42502856254577637, -0.41481560468673706, -0.40460264682769775, -0.39438965916633606, -0.38417670130729675, -0.37396371364593506, -0.36375075578689575, -0.35353776812553406, -0.34332481026649475, -0.33311185240745544, -0.32289886474609375, -0.31268590688705444, -0.30247294902801514, -0.29225999116897583, -0.2820470333099365, -0.27183404564857483, -0.2616210877895355, -0.2514081299304962, -0.24119515717029572, -0.23098218441009521, -0.2207692265510559, -0.2105562686920166, -0.2003432959318161, -0.1901303380727768, -0.1799173653125763, -0.169704407453537, -0.1594914346933365, -0.149278461933136, -0.13906550407409668, -0.12885251641273499, -0.11863955110311508, -0.10842658579349518, -0.09821361303329468, -0.08800064772367477, -0.07778768241405487, -0.06757470965385437, -0.05736174434423447, -0.04714878648519516, -0.036935821175575256, -0.026722852140665054, -0.0165098849684, -0.006296917796134949, 0.003916047513484955, 0.014129016548395157, 0.02434198558330536, 0.03455495089292526]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 7.0, 3.0, 18.0, 11.0, 17.0, 18.0, 15.0, 20.0, 22.0, 32.0, 22.0, 26.0, 17.0, 35.0, 40.0, 38.0, 44.0, 34.0, 42.0, 50.0, 36.0, 37.0, 42.0, 30.0, 37.0, 41.0, 28.0, 31.0, 24.0, 20.0, 24.0, 12.0, 17.0, 16.0, 14.0, 9.0, 14.0, 8.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05212104320526123, -0.05041785538196564, -0.048714667558670044, -0.04701147601008415, -0.04530828818678856, -0.043605100363492966, -0.041901908814907074, -0.04019872099161148, -0.03849553316831589, -0.036792345345020294, -0.0350891575217247, -0.03338596597313881, -0.031682778149843216, -0.029979590326547623, -0.02827640064060688, -0.026573210954666138, -0.024870023131370544, -0.02316683530807495, -0.02146364562213421, -0.019760455936193466, -0.018057268112897873, -0.01635408028960228, -0.014650890603661537, -0.01294770184904337, -0.011244513094425201, -0.009541324339807034, -0.007838135585188866, -0.006134946830570698, -0.00443175807595253, -0.002728569321334362, -0.0010253805667161942, 0.0006778081879019737, 0.0023809969425201416, 0.0040841856971383095, 0.005787374451756477, 0.007490563206374645, 0.009193751960992813, 0.010896940715610981, 0.012600129470229149, 0.014303318224847317, 0.016006506979465485, 0.017709694802761078, 0.01941288448870182, 0.021116074174642563, 0.022819261997938156, 0.02452244982123375, 0.026225639507174492, 0.027928829193115234, 0.029632017016410828, 0.03133520483970642, 0.033038392663002014, 0.034741584211587906, 0.0364447720348835, 0.03814795985817909, 0.039851151406764984, 0.04155433923006058, 0.04325752705335617, 0.044960714876651764, 0.04666390269994736, 0.04836709424853325, 0.05007028207182884, 0.051773469895124435, 0.05347666144371033, 0.05517984926700592, 0.056883037090301514]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 6.0, 10.0, 7.0, 11.0, 16.0, 13.0, 20.0, 25.0, 23.0, 22.0, 38.0, 27.0, 33.0, 39.0, 36.0, 30.0, 42.0, 40.0, 37.0, 40.0, 46.0, 46.0, 30.0, 48.0, 36.0, 29.0, 45.0, 31.0, 21.0, 26.0, 19.0, 22.0, 18.0, 11.0, 16.0, 8.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.85546875, -4.718841552734375, -4.58221435546875, -4.445587158203125, -4.3089599609375, -4.172332763671875, -4.03570556640625, -3.899078369140625, -3.762451171875, -3.625823974609375, -3.48919677734375, -3.352569580078125, -3.2159423828125, -3.079315185546875, -2.94268798828125, -2.806060791015625, -2.66943359375, -2.532806396484375, -2.39617919921875, -2.259552001953125, -2.1229248046875, -1.986297607421875, -1.84967041015625, -1.713043212890625, -1.576416015625, -1.439788818359375, -1.30316162109375, -1.166534423828125, -1.0299072265625, -0.893280029296875, -0.75665283203125, -0.620025634765625, -0.4833984375, -0.346771240234375, -0.21014404296875, -0.073516845703125, 0.0631103515625, 0.199737548828125, 0.33636474609375, 0.472991943359375, 0.609619140625, 0.746246337890625, 0.88287353515625, 1.019500732421875, 1.1561279296875, 1.292755126953125, 1.42938232421875, 1.566009521484375, 1.70263671875, 1.839263916015625, 1.97589111328125, 2.112518310546875, 2.2491455078125, 2.385772705078125, 2.52239990234375, 2.659027099609375, 2.795654296875, 2.932281494140625, 3.06890869140625, 3.205535888671875, 3.3421630859375, 3.478790283203125, 3.61541748046875, 3.752044677734375, 3.888671875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 16.0, 23.0, 26.0, 46.0, 68.0, 101.0, 144.0, 209.0, 352.0, 547.0, 830.0, 1337.0, 2224.0, 3697.0, 6461.0, 11870.0, 21805.0, 42365.0, 86154.0, 183714.0, 294270.0, 199179.0, 93518.0, 46003.0, 23767.0, 12766.0, 6972.0, 3904.0, 2393.0, 1375.0, 832.0, 540.0, 325.0, 239.0, 129.0, 100.0, 85.0, 46.0, 24.0, 26.0, 19.0, 16.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-4.62890625, -4.490966796875, -4.35302734375, -4.215087890625, -4.0771484375, -3.939208984375, -3.80126953125, -3.663330078125, -3.525390625, -3.387451171875, -3.24951171875, -3.111572265625, -2.9736328125, -2.835693359375, -2.69775390625, -2.559814453125, -2.421875, -2.283935546875, -2.14599609375, -2.008056640625, -1.8701171875, -1.732177734375, -1.59423828125, -1.456298828125, -1.318359375, -1.180419921875, -1.04248046875, -0.904541015625, -0.7666015625, -0.628662109375, -0.49072265625, -0.352783203125, -0.21484375, -0.076904296875, 0.06103515625, 0.198974609375, 0.3369140625, 0.474853515625, 0.61279296875, 0.750732421875, 0.888671875, 1.026611328125, 1.16455078125, 1.302490234375, 1.4404296875, 1.578369140625, 1.71630859375, 1.854248046875, 1.9921875, 2.130126953125, 2.26806640625, 2.406005859375, 2.5439453125, 2.681884765625, 2.81982421875, 2.957763671875, 3.095703125, 3.233642578125, 3.37158203125, 3.509521484375, 3.6474609375, 3.785400390625, 3.92333984375, 4.061279296875, 4.19921875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 17.0, 22.0, 16.0, 24.0, 38.0, 37.0, 30.0, 38.0, 69.0, 79.0, 147.0, 312.0, 1437.0, 200.0, 85.0, 78.0, 44.0, 48.0, 52.0, 33.0, 30.0, 33.0, 24.0, 19.0, 14.0, 15.0, 11.0, 5.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.6241455078125, -10.248291015625, -9.8724365234375, -9.49658203125, -9.1207275390625, -8.744873046875, -8.3690185546875, -7.9931640625, -7.6173095703125, -7.241455078125, -6.8656005859375, -6.48974609375, -6.1138916015625, -5.738037109375, -5.3621826171875, -4.986328125, -4.6104736328125, -4.234619140625, -3.8587646484375, -3.48291015625, -3.1070556640625, -2.731201171875, -2.3553466796875, -1.9794921875, -1.6036376953125, -1.227783203125, -0.8519287109375, -0.47607421875, -0.1002197265625, 0.275634765625, 0.6514892578125, 1.02734375, 1.4031982421875, 1.779052734375, 2.1549072265625, 2.53076171875, 2.9066162109375, 3.282470703125, 3.6583251953125, 4.0341796875, 4.4100341796875, 4.785888671875, 5.1617431640625, 5.53759765625, 5.9134521484375, 6.289306640625, 6.6651611328125, 7.041015625, 7.4168701171875, 7.792724609375, 8.1685791015625, 8.54443359375, 8.9202880859375, 9.296142578125, 9.6719970703125, 10.0478515625, 10.4237060546875, 10.799560546875, 11.1754150390625, 11.55126953125, 11.9271240234375, 12.302978515625, 12.6788330078125, 13.0546875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 6.0, 18.0, 12.0, 26.0, 30.0, 38.0, 62.0, 95.0, 141.0, 192.0, 324.0, 536.0, 1421.0, 8718.0, 101479.0, 2569599.0, 435031.0, 23252.0, 2940.0, 694.0, 351.0, 231.0, 146.0, 97.0, 70.0, 52.0, 40.0, 28.0, 16.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.8203125, -12.3404541015625, -11.860595703125, -11.3807373046875, -10.90087890625, -10.4210205078125, -9.941162109375, -9.4613037109375, -8.9814453125, -8.5015869140625, -8.021728515625, -7.5418701171875, -7.06201171875, -6.5821533203125, -6.102294921875, -5.6224365234375, -5.142578125, -4.6627197265625, -4.182861328125, -3.7030029296875, -3.22314453125, -2.7432861328125, -2.263427734375, -1.7835693359375, -1.3037109375, -0.8238525390625, -0.343994140625, 0.1358642578125, 0.61572265625, 1.0955810546875, 1.575439453125, 2.0552978515625, 2.53515625, 3.0150146484375, 3.494873046875, 3.9747314453125, 4.45458984375, 4.9344482421875, 5.414306640625, 5.8941650390625, 6.3740234375, 6.8538818359375, 7.333740234375, 7.8135986328125, 8.29345703125, 8.7733154296875, 9.253173828125, 9.7330322265625, 10.212890625, 10.6927490234375, 11.172607421875, 11.6524658203125, 12.13232421875, 12.6121826171875, 13.092041015625, 13.5718994140625, 14.0517578125, 14.5316162109375, 15.011474609375, 15.4913330078125, 15.97119140625, 16.4510498046875, 16.930908203125, 17.4107666015625, 17.890625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 12.0, 35.0, 86.0, 159.0, 226.0, 214.0, 137.0, 75.0, 46.0, 14.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.617773056030273, -25.552270889282227, -24.486770629882812, -23.421268463134766, -22.35576629638672, -21.290264129638672, -20.224761962890625, -19.15926170349121, -18.093759536743164, -17.028257369995117, -15.962756156921387, -14.897254943847656, -13.83175277709961, -12.766250610351562, -11.700749397277832, -10.635248184204102, -9.569746017456055, -8.504243850708008, -7.438742637634277, -6.373240947723389, -5.3077392578125, -4.242237567901611, -3.1767358779907227, -2.111234188079834, -1.0457324981689453, 0.01976919174194336, 1.085270881652832, 2.1507725715637207, 3.2162742614746094, 4.281775951385498, 5.347277641296387, 6.412779331207275, 7.478279113769531, 8.543781280517578, 9.609282493591309, 10.674783706665039, 11.740285873413086, 12.805788040161133, 13.871289253234863, 14.936790466308594, 16.00229263305664, 17.067794799804688, 18.133296966552734, 19.19879722595215, 20.264299392700195, 21.329801559448242, 22.395301818847656, 23.460803985595703, 24.52630615234375, 25.591808319091797, 26.657310485839844, 27.722810745239258, 28.788312911987305, 29.85381507873535, 30.919315338134766, 31.984817504882812, 33.05031967163086, 34.115821838378906, 35.18132400512695, 36.246826171875, 37.31232452392578, 38.37782669067383, 39.443328857421875, 40.50883102416992, 41.57433319091797]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 12.0, 12.0, 17.0, 23.0, 21.0, 27.0, 24.0, 33.0, 42.0, 32.0, 32.0, 37.0, 33.0, 38.0, 44.0, 40.0, 47.0, 62.0, 38.0, 41.0, 41.0, 40.0, 32.0, 29.0, 28.0, 28.0, 24.0, 20.0, 18.0, 11.0, 11.0, 7.0, 6.0, 8.0, 8.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.093063354492188, -26.272998809814453, -25.45293617248535, -24.632871627807617, -23.812808990478516, -22.99274444580078, -22.172679901123047, -21.352615356445312, -20.53255271911621, -19.712488174438477, -18.892425537109375, -18.07236099243164, -17.252296447753906, -16.432233810424805, -15.61216926574707, -14.792105674743652, -13.972042083740234, -13.151978492736816, -12.331914901733398, -11.511850357055664, -10.691786766052246, -9.871723175048828, -9.051658630371094, -8.231595039367676, -7.411531448364258, -6.59146785736084, -5.771403789520264, -4.9513397216796875, -4.1312761306762695, -3.3112125396728516, -2.4911484718322754, -1.6710844039916992, -0.8510208129882812, -0.03095698356628418, 0.7891068458557129, 1.60917067527771, 2.429234504699707, 3.249298095703125, 4.069362163543701, 4.889426231384277, 5.709489822387695, 6.529553413391113, 7.3496174812316895, 8.169681549072266, 8.989745140075684, 9.809808731079102, 10.629873275756836, 11.449936866760254, 12.270000457763672, 13.09006404876709, 13.910127639770508, 14.730192184448242, 15.55025577545166, 16.370319366455078, 17.190383911132812, 18.010448455810547, 18.83051109313965, 19.650575637817383, 20.470638275146484, 21.29070281982422, 22.110767364501953, 22.930830001831055, 23.75089454650879, 24.57095718383789, 25.391021728515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 10.0, 8.0, 13.0, 12.0, 15.0, 20.0, 17.0, 22.0, 32.0, 41.0, 39.0, 31.0, 35.0, 38.0, 47.0, 48.0, 30.0, 44.0, 42.0, 49.0, 33.0, 37.0, 40.0, 39.0, 35.0, 26.0, 33.0, 23.0, 21.0, 25.0, 14.0, 15.0, 10.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.921875, -4.780029296875, -4.63818359375, -4.496337890625, -4.3544921875, -4.212646484375, -4.07080078125, -3.928955078125, -3.787109375, -3.645263671875, -3.50341796875, -3.361572265625, -3.2197265625, -3.077880859375, -2.93603515625, -2.794189453125, -2.65234375, -2.510498046875, -2.36865234375, -2.226806640625, -2.0849609375, -1.943115234375, -1.80126953125, -1.659423828125, -1.517578125, -1.375732421875, -1.23388671875, -1.092041015625, -0.9501953125, -0.808349609375, -0.66650390625, -0.524658203125, -0.3828125, -0.240966796875, -0.09912109375, 0.042724609375, 0.1845703125, 0.326416015625, 0.46826171875, 0.610107421875, 0.751953125, 0.893798828125, 1.03564453125, 1.177490234375, 1.3193359375, 1.461181640625, 1.60302734375, 1.744873046875, 1.88671875, 2.028564453125, 2.17041015625, 2.312255859375, 2.4541015625, 2.595947265625, 2.73779296875, 2.879638671875, 3.021484375, 3.163330078125, 3.30517578125, 3.447021484375, 3.5888671875, 3.730712890625, 3.87255859375, 4.014404296875, 4.15625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 16.0, 17.0, 15.0, 22.0, 21.0, 37.0, 44.0, 65.0, 66.0, 73.0, 160.0, 260.0, 808.0, 7470.0, 1531569.0, 2640324.0, 11469.0, 945.0, 330.0, 135.0, 98.0, 62.0, 49.0, 44.0, 37.0, 30.0, 19.0, 13.0, 13.0, 13.0, 12.0, 4.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.7021484375, -22.857421875, -22.0126953125, -21.16796875, -20.3232421875, -19.478515625, -18.6337890625, -17.7890625, -16.9443359375, -16.099609375, -15.2548828125, -14.41015625, -13.5654296875, -12.720703125, -11.8759765625, -11.03125, -10.1865234375, -9.341796875, -8.4970703125, -7.65234375, -6.8076171875, -5.962890625, -5.1181640625, -4.2734375, -3.4287109375, -2.583984375, -1.7392578125, -0.89453125, -0.0498046875, 0.794921875, 1.6396484375, 2.484375, 3.3291015625, 4.173828125, 5.0185546875, 5.86328125, 6.7080078125, 7.552734375, 8.3974609375, 9.2421875, 10.0869140625, 10.931640625, 11.7763671875, 12.62109375, 13.4658203125, 14.310546875, 15.1552734375, 16.0, 16.8447265625, 17.689453125, 18.5341796875, 19.37890625, 20.2236328125, 21.068359375, 21.9130859375, 22.7578125, 23.6025390625, 24.447265625, 25.2919921875, 26.13671875, 26.9814453125, 27.826171875, 28.6708984375, 29.515625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 5.0, 14.0, 14.0, 20.0, 29.0, 34.0, 60.0, 95.0, 98.0, 143.0, 184.0, 229.0, 330.0, 428.0, 460.0, 420.0, 363.0, 289.0, 235.0, 160.0, 134.0, 84.0, 53.0, 40.0, 37.0, 32.0, 16.0, 8.0, 7.0, 10.0, 7.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.16754150390625, -4.9874267578125, -4.80731201171875, -4.627197265625, -4.44708251953125, -4.2669677734375, -4.08685302734375, -3.90673828125, -3.72662353515625, -3.5465087890625, -3.36639404296875, -3.186279296875, -3.00616455078125, -2.8260498046875, -2.64593505859375, -2.4658203125, -2.28570556640625, -2.1055908203125, -1.92547607421875, -1.745361328125, -1.56524658203125, -1.3851318359375, -1.20501708984375, -1.02490234375, -0.84478759765625, -0.6646728515625, -0.48455810546875, -0.304443359375, -0.12432861328125, 0.0557861328125, 0.23590087890625, 0.416015625, 0.59613037109375, 0.7762451171875, 0.95635986328125, 1.136474609375, 1.31658935546875, 1.4967041015625, 1.67681884765625, 1.85693359375, 2.03704833984375, 2.2171630859375, 2.39727783203125, 2.577392578125, 2.75750732421875, 2.9376220703125, 3.11773681640625, 3.2978515625, 3.47796630859375, 3.6580810546875, 3.83819580078125, 4.018310546875, 4.19842529296875, 4.3785400390625, 4.55865478515625, 4.73876953125, 4.91888427734375, 5.0989990234375, 5.27911376953125, 5.459228515625, 5.63934326171875, 5.8194580078125, 5.99957275390625, 6.1796875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 6.0, 1.0, 2.0, 0.0, 5.0, 14.0, 14.0, 15.0, 10.0, 23.0, 28.0, 36.0, 40.0, 72.0, 130.0, 271.0, 821.0, 4083.0, 54890.0, 2166716.0, 1912594.0, 49293.0, 3836.0, 764.0, 244.0, 101.0, 82.0, 42.0, 37.0, 18.0, 18.0, 12.0, 10.0, 6.0, 6.0, 8.0, 7.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.175048828125, -17.56884765625, -16.962646484375, -16.3564453125, -15.750244140625, -15.14404296875, -14.537841796875, -13.931640625, -13.325439453125, -12.71923828125, -12.113037109375, -11.5068359375, -10.900634765625, -10.29443359375, -9.688232421875, -9.08203125, -8.475830078125, -7.86962890625, -7.263427734375, -6.6572265625, -6.051025390625, -5.44482421875, -4.838623046875, -4.232421875, -3.626220703125, -3.02001953125, -2.413818359375, -1.8076171875, -1.201416015625, -0.59521484375, 0.010986328125, 0.6171875, 1.223388671875, 1.82958984375, 2.435791015625, 3.0419921875, 3.648193359375, 4.25439453125, 4.860595703125, 5.466796875, 6.072998046875, 6.67919921875, 7.285400390625, 7.8916015625, 8.497802734375, 9.10400390625, 9.710205078125, 10.31640625, 10.922607421875, 11.52880859375, 12.135009765625, 12.7412109375, 13.347412109375, 13.95361328125, 14.559814453125, 15.166015625, 15.772216796875, 16.37841796875, 16.984619140625, 17.5908203125, 18.197021484375, 18.80322265625, 19.409423828125, 20.015625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 19.0, 81.0, 222.0, 343.0, 237.0, 93.0, 20.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.66642761230469, -117.24757385253906, -114.82872009277344, -112.40987396240234, -109.99102020263672, -107.5721664428711, -105.15331268310547, -102.73445892333984, -100.31561279296875, -97.89675903320312, -95.4779052734375, -93.0590591430664, -90.64020538330078, -88.22135162353516, -85.80249786376953, -83.3836441040039, -80.96479034423828, -78.54593658447266, -76.12708282470703, -73.70823669433594, -71.28938293457031, -68.87052917480469, -66.45167541503906, -64.03282165527344, -61.61397171020508, -59.19511795043945, -56.776268005371094, -54.35741424560547, -51.938560485839844, -49.519710540771484, -47.10085678100586, -44.6820068359375, -42.263160705566406, -39.84430694580078, -37.42545700073242, -35.0066032409668, -32.58775329589844, -30.168899536132812, -27.750045776367188, -25.331193923950195, -22.912342071533203, -20.49349021911621, -18.07463836669922, -15.655784606933594, -13.236932754516602, -10.81808090209961, -8.3992280960083, -5.980375289916992, -3.5615234375, -1.1426711082458496, 1.2761812210083008, 3.695033550262451, 6.113885879516602, 8.532737731933594, 10.951590538024902, 13.370443344116211, 15.789295196533203, 18.208147048950195, 20.626998901367188, 23.045852661132812, 25.464704513549805, 27.883556365966797, 30.302410125732422, 32.72126007080078, 35.140113830566406]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 7.0, 8.0, 9.0, 13.0, 7.0, 11.0, 18.0, 18.0, 22.0, 22.0, 33.0, 35.0, 43.0, 28.0, 31.0, 30.0, 45.0, 31.0, 41.0, 43.0, 38.0, 35.0, 42.0, 49.0, 42.0, 40.0, 33.0, 32.0, 27.0, 20.0, 20.0, 23.0, 9.0, 15.0, 10.0, 15.0, 12.0, 9.0, 17.0, 2.0, 3.0, 2.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.02873992919922, -19.442766189575195, -18.856794357299805, -18.27082061767578, -17.684846878051758, -17.098873138427734, -16.512901306152344, -15.92692756652832, -15.340954780578613, -14.754981994628906, -14.169008255004883, -13.583035469055176, -12.997062683105469, -12.411088943481445, -11.825116157531738, -11.239143371582031, -10.653169631958008, -10.0671968460083, -9.481223106384277, -8.89525032043457, -8.309276580810547, -7.72330379486084, -7.137331008911133, -6.551357746124268, -5.965384483337402, -5.379411220550537, -4.793437957763672, -4.207465171813965, -3.6214919090270996, -3.0355186462402344, -2.4495456218719482, -1.863572597503662, -1.277597427368164, -0.6916242837905884, -0.1056511402130127, 0.480322003364563, 1.0662951469421387, 1.652268409729004, 2.23824143409729, 2.824214458465576, 3.4101877212524414, 3.9961609840393066, 4.582134246826172, 5.168107032775879, 5.754080295562744, 6.340053558349609, 6.926026344299316, 7.511999607086182, 8.097972869873047, 8.683945655822754, 9.269919395446777, 9.855892181396484, 10.441865921020508, 11.027838706970215, 11.613811492919922, 12.199785232543945, 12.785758018493652, 13.37173080444336, 13.957704544067383, 14.54367733001709, 15.129650115966797, 15.71562385559082, 16.301597595214844, 16.887569427490234, 17.473543167114258]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 12.0, 13.0, 8.0, 11.0, 17.0, 18.0, 16.0, 14.0, 24.0, 29.0, 36.0, 31.0, 29.0, 33.0, 37.0, 40.0, 38.0, 43.0, 49.0, 32.0, 50.0, 47.0, 52.0, 33.0, 36.0, 17.0, 27.0, 22.0, 31.0, 21.0, 20.0, 12.0, 12.0, 19.0, 15.0, 9.0, 14.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.3046875, -4.16973876953125, -4.0347900390625, -3.89984130859375, -3.764892578125, -3.62994384765625, -3.4949951171875, -3.36004638671875, -3.22509765625, -3.09014892578125, -2.9552001953125, -2.82025146484375, -2.685302734375, -2.55035400390625, -2.4154052734375, -2.28045654296875, -2.1455078125, -2.01055908203125, -1.8756103515625, -1.74066162109375, -1.605712890625, -1.47076416015625, -1.3358154296875, -1.20086669921875, -1.06591796875, -0.93096923828125, -0.7960205078125, -0.66107177734375, -0.526123046875, -0.39117431640625, -0.2562255859375, -0.12127685546875, 0.013671875, 0.14862060546875, 0.2835693359375, 0.41851806640625, 0.553466796875, 0.68841552734375, 0.8233642578125, 0.95831298828125, 1.09326171875, 1.22821044921875, 1.3631591796875, 1.49810791015625, 1.633056640625, 1.76800537109375, 1.9029541015625, 2.03790283203125, 2.1728515625, 2.30780029296875, 2.4427490234375, 2.57769775390625, 2.712646484375, 2.84759521484375, 2.9825439453125, 3.11749267578125, 3.25244140625, 3.38739013671875, 3.5223388671875, 3.65728759765625, 3.792236328125, 3.92718505859375, 4.0621337890625, 4.19708251953125, 4.33203125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 15.0, 15.0, 26.0, 42.0, 64.0, 99.0, 151.0, 243.0, 345.0, 549.0, 791.0, 1247.0, 1871.0, 2936.0, 4738.0, 7129.0, 10904.0, 16663.0, 24289.0, 35691.0, 51087.0, 69612.0, 90927.0, 110398.0, 122153.0, 118619.0, 102642.0, 81303.0, 61076.0, 43265.0, 29876.0, 20445.0, 13698.0, 9149.0, 5842.0, 3763.0, 2427.0, 1570.0, 1047.0, 660.0, 404.0, 259.0, 170.0, 112.0, 80.0, 60.0, 26.0, 32.0, 11.0, 10.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.269775390625, -0.26154327392578125, -0.2533111572265625, -0.24507904052734375, -0.236846923828125, -0.22861480712890625, -0.2203826904296875, -0.21215057373046875, -0.20391845703125, -0.19568634033203125, -0.1874542236328125, -0.17922210693359375, -0.170989990234375, -0.16275787353515625, -0.1545257568359375, -0.14629364013671875, -0.1380615234375, -0.12982940673828125, -0.1215972900390625, -0.11336517333984375, -0.105133056640625, -0.09690093994140625, -0.0886688232421875, -0.08043670654296875, -0.07220458984375, -0.06397247314453125, -0.0557403564453125, -0.04750823974609375, -0.039276123046875, -0.03104400634765625, -0.0228118896484375, -0.01457977294921875, -0.00634765625, 0.00188446044921875, 0.0101165771484375, 0.01834869384765625, 0.026580810546875, 0.03481292724609375, 0.0430450439453125, 0.05127716064453125, 0.05950927734375, 0.06774139404296875, 0.0759735107421875, 0.08420562744140625, 0.092437744140625, 0.10066986083984375, 0.1089019775390625, 0.11713409423828125, 0.1253662109375, 0.13359832763671875, 0.1418304443359375, 0.15006256103515625, 0.158294677734375, 0.16652679443359375, 0.1747589111328125, 0.18299102783203125, 0.19122314453125, 0.19945526123046875, 0.2076873779296875, 0.21591949462890625, 0.224151611328125, 0.23238372802734375, 0.2406158447265625, 0.24884796142578125, 0.257080078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 6.0, 4.0, 7.0, 12.0, 6.0, 9.0, 11.0, 17.0, 23.0, 21.0, 27.0, 26.0, 45.0, 34.0, 39.0, 37.0, 45.0, 37.0, 43.0, 43.0, 1077.0, 40.0, 42.0, 47.0, 40.0, 40.0, 32.0, 30.0, 35.0, 26.0, 24.0, 18.0, 19.0, 16.0, 12.0, 10.0, 6.0, 5.0, 6.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.159759521484375, -3.05584716796875, -2.951934814453125, -2.8480224609375, -2.744110107421875, -2.64019775390625, -2.536285400390625, -2.432373046875, -2.328460693359375, -2.22454833984375, -2.120635986328125, -2.0167236328125, -1.912811279296875, -1.80889892578125, -1.704986572265625, -1.60107421875, -1.497161865234375, -1.39324951171875, -1.289337158203125, -1.1854248046875, -1.081512451171875, -0.97760009765625, -0.873687744140625, -0.769775390625, -0.665863037109375, -0.56195068359375, -0.458038330078125, -0.3541259765625, -0.250213623046875, -0.14630126953125, -0.042388916015625, 0.0615234375, 0.165435791015625, 0.26934814453125, 0.373260498046875, 0.4771728515625, 0.581085205078125, 0.68499755859375, 0.788909912109375, 0.892822265625, 0.996734619140625, 1.10064697265625, 1.204559326171875, 1.3084716796875, 1.412384033203125, 1.51629638671875, 1.620208740234375, 1.72412109375, 1.828033447265625, 1.93194580078125, 2.035858154296875, 2.1397705078125, 2.243682861328125, 2.34759521484375, 2.451507568359375, 2.555419921875, 2.659332275390625, 2.76324462890625, 2.867156982421875, 2.9710693359375, 3.074981689453125, 3.17889404296875, 3.282806396484375, 3.38671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 18.0, 9.0, 28.0, 37.0, 59.0, 103.0, 212.0, 366.0, 575.0, 1066.0, 1685.0, 2879.0, 5094.0, 8700.0, 14570.0, 24689.0, 39536.0, 61447.0, 90854.0, 125348.0, 680790.0, 661744.0, 124880.0, 91416.0, 61409.0, 39581.0, 24501.0, 14534.0, 8611.0, 5192.0, 2965.0, 1748.0, 1030.0, 601.0, 351.0, 194.0, 117.0, 85.0, 43.0, 23.0, 8.0, 10.0, 9.0, 10.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.2242431640625, -0.21801376342773438, -0.21178436279296875, -0.20555496215820312, -0.1993255615234375, -0.19309616088867188, -0.18686676025390625, -0.18063735961914062, -0.174407958984375, -0.16817855834960938, -0.16194915771484375, -0.15571975708007812, -0.1494903564453125, -0.14326095581054688, -0.13703155517578125, -0.13080215454101562, -0.12457275390625, -0.11834335327148438, -0.11211395263671875, -0.10588455200195312, -0.0996551513671875, -0.09342575073242188, -0.08719635009765625, -0.08096694946289062, -0.074737548828125, -0.06850814819335938, -0.06227874755859375, -0.056049346923828125, -0.0498199462890625, -0.043590545654296875, -0.03736114501953125, -0.031131744384765625, -0.02490234375, -0.018672943115234375, -0.01244354248046875, -0.006214141845703125, 1.52587890625e-05, 0.006244659423828125, 0.01247406005859375, 0.018703460693359375, 0.024932861328125, 0.031162261962890625, 0.03739166259765625, 0.043621063232421875, 0.0498504638671875, 0.056079864501953125, 0.06230926513671875, 0.06853866577148438, 0.07476806640625, 0.08099746704101562, 0.08722686767578125, 0.09345626831054688, 0.0996856689453125, 0.10591506958007812, 0.11214447021484375, 0.11837387084960938, 0.124603271484375, 0.13083267211914062, 0.13706207275390625, 0.14329147338867188, 0.1495208740234375, 0.15575027465820312, 0.16197967529296875, 0.16820907592773438, 0.1744384765625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 11.0, 9.0, 16.0, 20.0, 18.0, 21.0, 38.0, 51.0, 60.0, 68.0, 84.0, 108.0, 104.0, 72.0, 58.0, 60.0, 41.0, 32.0, 22.0, 21.0, 15.0, 9.0, 8.0, 12.0, 4.0, 5.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.03349637985229492, -0.032202720642089844, -0.030909061431884766, -0.029615402221679688, -0.02832174301147461, -0.02702808380126953, -0.025734424591064453, -0.024440765380859375, -0.023147106170654297, -0.02185344696044922, -0.02055978775024414, -0.019266128540039062, -0.017972469329833984, -0.016678810119628906, -0.015385150909423828, -0.01409149169921875, -0.012797832489013672, -0.011504173278808594, -0.010210514068603516, -0.008916854858398438, -0.007623195648193359, -0.006329536437988281, -0.005035877227783203, -0.003742218017578125, -0.002448558807373047, -0.0011548995971679688, 0.00013875961303710938, 0.0014324188232421875, 0.0027260780334472656, 0.004019737243652344, 0.005313396453857422, 0.0066070556640625, 0.007900714874267578, 0.009194374084472656, 0.010488033294677734, 0.011781692504882812, 0.01307535171508789, 0.014369010925292969, 0.015662670135498047, 0.016956329345703125, 0.018249988555908203, 0.01954364776611328, 0.02083730697631836, 0.022130966186523438, 0.023424625396728516, 0.024718284606933594, 0.026011943817138672, 0.02730560302734375, 0.028599262237548828, 0.029892921447753906, 0.031186580657958984, 0.03248023986816406, 0.03377389907836914, 0.03506755828857422, 0.0363612174987793, 0.037654876708984375, 0.03894853591918945, 0.04024219512939453, 0.04153585433959961, 0.04282951354980469, 0.044123172760009766, 0.045416831970214844, 0.04671049118041992, 0.048004150390625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 3.0, 6.0, 8.0, 12.0, 9.0, 6.0, 25.0, 25.0, 34.0, 47.0, 86.0, 144.0, 242.0, 668.0, 9209.0, 1035554.0, 1497.0, 427.0, 207.0, 108.0, 70.0, 35.0, 32.0, 30.0, 19.0, 8.0, 12.0, 3.0, 7.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0419921875, -1.0140380859375, -0.986083984375, -0.9581298828125, -0.93017578125, -0.9022216796875, -0.874267578125, -0.8463134765625, -0.818359375, -0.7904052734375, -0.762451171875, -0.7344970703125, -0.70654296875, -0.6785888671875, -0.650634765625, -0.6226806640625, -0.5947265625, -0.5667724609375, -0.538818359375, -0.5108642578125, -0.48291015625, -0.4549560546875, -0.427001953125, -0.3990478515625, -0.37109375, -0.3431396484375, -0.315185546875, -0.2872314453125, -0.25927734375, -0.2313232421875, -0.203369140625, -0.1754150390625, -0.1474609375, -0.1195068359375, -0.091552734375, -0.0635986328125, -0.03564453125, -0.0076904296875, 0.020263671875, 0.0482177734375, 0.076171875, 0.1041259765625, 0.132080078125, 0.1600341796875, 0.18798828125, 0.2159423828125, 0.243896484375, 0.2718505859375, 0.2998046875, 0.3277587890625, 0.355712890625, 0.3836669921875, 0.41162109375, 0.4395751953125, 0.467529296875, 0.4954833984375, 0.5234375, 0.5513916015625, 0.579345703125, 0.6072998046875, 0.63525390625, 0.6632080078125, 0.691162109375, 0.7191162109375, 0.7470703125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 67.0, 737.0, 182.0, 16.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5472573637962341, -0.5355329513549805, -0.5238085985183716, -0.5120841860771179, -0.500359833240509, -0.48863542079925537, -0.4769110381603241, -0.4651866555213928, -0.45346227288246155, -0.4417378902435303, -0.430013507604599, -0.4182891249656677, -0.40656471252441406, -0.3948403298854828, -0.3831159472465515, -0.37139156460762024, -0.35966718196868896, -0.3479427993297577, -0.3362184166908264, -0.32449403405189514, -0.31276965141296387, -0.3010452389717102, -0.28932085633277893, -0.27759647369384766, -0.2658720910549164, -0.2541477084159851, -0.24242332577705383, -0.23069892823696136, -0.2189745455980301, -0.20725016295909882, -0.19552576541900635, -0.18380138278007507, -0.1720769703388214, -0.16035258769989014, -0.14862820506095886, -0.1369038075208664, -0.12517942488193512, -0.11345504224300385, -0.10173065215349197, -0.0900062620639801, -0.07828187942504883, -0.06655749678611755, -0.05483310669660568, -0.04310872033238411, -0.03138433396816254, -0.019659947603940964, -0.007935561239719391, 0.0037888288497924805, 0.015513211488723755, 0.027237597852945328, 0.0389619842171669, 0.050686370581388474, 0.062410756945610046, 0.07413513958454132, 0.08585952967405319, 0.09758391976356506, 0.10930830240249634, 0.12103268504142761, 0.1327570676803589, 0.14448146522045135, 0.15620584785938263, 0.1679302304983139, 0.17965462803840637, 0.19137901067733765, 0.20310339331626892]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 6.0, 10.0, 7.0, 4.0, 8.0, 9.0, 9.0, 22.0, 22.0, 17.0, 20.0, 19.0, 24.0, 27.0, 21.0, 31.0, 26.0, 32.0, 24.0, 36.0, 39.0, 27.0, 32.0, 29.0, 35.0, 35.0, 30.0, 33.0, 27.0, 36.0, 27.0, 30.0, 21.0, 21.0, 25.0, 26.0, 22.0, 11.0, 21.0, 15.0, 15.0, 10.0, 6.0, 9.0, 8.0, 8.0, 4.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07363152503967285, -0.07130121439695358, -0.06897090375423431, -0.06664058566093445, -0.06431027501821518, -0.06197996437549591, -0.05964965000748634, -0.057319335639476776, -0.05498902499675751, -0.05265871435403824, -0.05032839998602867, -0.047998085618019104, -0.045667774975299835, -0.043337464332580566, -0.041007149964571, -0.03867683559656143, -0.03634652495384216, -0.034016214311122894, -0.03168589994311333, -0.02935558743774891, -0.02702527493238449, -0.024694962427020073, -0.022364649921655655, -0.020034337416291237, -0.01770402491092682, -0.0153737124055624, -0.013043399900197983, -0.010713087394833565, -0.008382774889469147, -0.006052462384104729, -0.0037221498787403107, -0.0013918373733758926, 0.0009384751319885254, 0.0032687876373529434, 0.0055991001427173615, 0.00792941264808178, 0.010259725153446198, 0.012590037658810616, 0.014920350164175034, 0.01725066266953945, 0.01958097517490387, 0.021911287680268288, 0.024241600185632706, 0.026571912690997124, 0.028902225196361542, 0.03123253770172596, 0.03356285020709038, 0.035893164575099945, 0.038223475217819214, 0.04055378586053848, 0.04288410022854805, 0.04521441459655762, 0.047544725239276886, 0.049875035881996155, 0.05220535025000572, 0.05453566461801529, 0.05686597526073456, 0.05919628590345383, 0.061526600271463394, 0.06385691463947296, 0.06618722528219223, 0.0685175359249115, 0.07084785401821136, 0.07317816466093063, 0.0755084753036499]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 10.0, 11.0, 16.0, 14.0, 18.0, 19.0, 28.0, 30.0, 28.0, 29.0, 33.0, 27.0, 32.0, 32.0, 45.0, 41.0, 48.0, 39.0, 48.0, 54.0, 48.0, 36.0, 26.0, 36.0, 33.0, 29.0, 28.0, 22.0, 16.0, 19.0, 13.0, 13.0, 11.0, 10.0, 5.0, 6.0, 11.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.578125, -4.44036865234375, -4.3026123046875, -4.16485595703125, -4.027099609375, -3.88934326171875, -3.7515869140625, -3.61383056640625, -3.47607421875, -3.33831787109375, -3.2005615234375, -3.06280517578125, -2.925048828125, -2.78729248046875, -2.6495361328125, -2.51177978515625, -2.3740234375, -2.23626708984375, -2.0985107421875, -1.96075439453125, -1.822998046875, -1.68524169921875, -1.5474853515625, -1.40972900390625, -1.27197265625, -1.13421630859375, -0.9964599609375, -0.85870361328125, -0.720947265625, -0.58319091796875, -0.4454345703125, -0.30767822265625, -0.169921875, -0.03216552734375, 0.1055908203125, 0.24334716796875, 0.381103515625, 0.51885986328125, 0.6566162109375, 0.79437255859375, 0.93212890625, 1.06988525390625, 1.2076416015625, 1.34539794921875, 1.483154296875, 1.62091064453125, 1.7586669921875, 1.89642333984375, 2.0341796875, 2.17193603515625, 2.3096923828125, 2.44744873046875, 2.585205078125, 2.72296142578125, 2.8607177734375, 2.99847412109375, 3.13623046875, 3.27398681640625, 3.4117431640625, 3.54949951171875, 3.687255859375, 3.82501220703125, 3.9627685546875, 4.10052490234375, 4.23828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 0.0, 5.0, 3.0, 8.0, 8.0, 11.0, 14.0, 30.0, 20.0, 33.0, 52.0, 62.0, 104.0, 140.0, 272.0, 389.0, 669.0, 1180.0, 2145.0, 4178.0, 8134.0, 15512.0, 31426.0, 64192.0, 143748.0, 296393.0, 256337.0, 115918.0, 53331.0, 26248.0, 13143.0, 6813.0, 3487.0, 1865.0, 1074.0, 572.0, 354.0, 228.0, 131.0, 106.0, 52.0, 49.0, 33.0, 21.0, 14.0, 12.0, 9.0, 15.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.62109375, -5.45513916015625, -5.2891845703125, -5.12322998046875, -4.957275390625, -4.79132080078125, -4.6253662109375, -4.45941162109375, -4.29345703125, -4.12750244140625, -3.9615478515625, -3.79559326171875, -3.629638671875, -3.46368408203125, -3.2977294921875, -3.13177490234375, -2.9658203125, -2.79986572265625, -2.6339111328125, -2.46795654296875, -2.302001953125, -2.13604736328125, -1.9700927734375, -1.80413818359375, -1.63818359375, -1.47222900390625, -1.3062744140625, -1.14031982421875, -0.974365234375, -0.80841064453125, -0.6424560546875, -0.47650146484375, -0.310546875, -0.14459228515625, 0.0213623046875, 0.18731689453125, 0.353271484375, 0.51922607421875, 0.6851806640625, 0.85113525390625, 1.01708984375, 1.18304443359375, 1.3489990234375, 1.51495361328125, 1.680908203125, 1.84686279296875, 2.0128173828125, 2.17877197265625, 2.3447265625, 2.51068115234375, 2.6766357421875, 2.84259033203125, 3.008544921875, 3.17449951171875, 3.3404541015625, 3.50640869140625, 3.67236328125, 3.83831787109375, 4.0042724609375, 4.17022705078125, 4.336181640625, 4.50213623046875, 4.6680908203125, 4.83404541015625, 5.0]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 7.0, 15.0, 9.0, 19.0, 13.0, 27.0, 21.0, 20.0, 28.0, 32.0, 54.0, 49.0, 65.0, 85.0, 140.0, 239.0, 1421.0, 192.0, 133.0, 83.0, 66.0, 55.0, 40.0, 31.0, 31.0, 21.0, 24.0, 21.0, 12.0, 14.0, 15.0, 8.0, 11.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.0703125, -11.6971435546875, -11.323974609375, -10.9508056640625, -10.57763671875, -10.2044677734375, -9.831298828125, -9.4581298828125, -9.0849609375, -8.7117919921875, -8.338623046875, -7.9654541015625, -7.59228515625, -7.2191162109375, -6.845947265625, -6.4727783203125, -6.099609375, -5.7264404296875, -5.353271484375, -4.9801025390625, -4.60693359375, -4.2337646484375, -3.860595703125, -3.4874267578125, -3.1142578125, -2.7410888671875, -2.367919921875, -1.9947509765625, -1.62158203125, -1.2484130859375, -0.875244140625, -0.5020751953125, -0.12890625, 0.2442626953125, 0.617431640625, 0.9906005859375, 1.36376953125, 1.7369384765625, 2.110107421875, 2.4832763671875, 2.8564453125, 3.2296142578125, 3.602783203125, 3.9759521484375, 4.34912109375, 4.7222900390625, 5.095458984375, 5.4686279296875, 5.841796875, 6.2149658203125, 6.588134765625, 6.9613037109375, 7.33447265625, 7.7076416015625, 8.080810546875, 8.4539794921875, 8.8271484375, 9.2003173828125, 9.573486328125, 9.9466552734375, 10.31982421875, 10.6929931640625, 11.066162109375, 11.4393310546875, 11.8125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 12.0, 12.0, 16.0, 21.0, 37.0, 38.0, 57.0, 75.0, 103.0, 149.0, 238.0, 304.0, 495.0, 927.0, 3357.0, 33993.0, 1040373.0, 2007627.0, 50548.0, 4526.0, 1053.0, 563.0, 354.0, 245.0, 164.0, 105.0, 81.0, 62.0, 50.0, 28.0, 20.0, 20.0, 5.0, 4.0, 8.0, 4.0, 4.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.7421875, -15.21875, -14.6953125, -14.171875, -13.6484375, -13.125, -12.6015625, -12.078125, -11.5546875, -11.03125, -10.5078125, -9.984375, -9.4609375, -8.9375, -8.4140625, -7.890625, -7.3671875, -6.84375, -6.3203125, -5.796875, -5.2734375, -4.75, -4.2265625, -3.703125, -3.1796875, -2.65625, -2.1328125, -1.609375, -1.0859375, -0.5625, -0.0390625, 0.484375, 1.0078125, 1.53125, 2.0546875, 2.578125, 3.1015625, 3.625, 4.1484375, 4.671875, 5.1953125, 5.71875, 6.2421875, 6.765625, 7.2890625, 7.8125, 8.3359375, 8.859375, 9.3828125, 9.90625, 10.4296875, 10.953125, 11.4765625, 12.0, 12.5234375, 13.046875, 13.5703125, 14.09375, 14.6171875, 15.140625, 15.6640625, 16.1875, 16.7109375, 17.234375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 23.0, 197.0, 461.0, 279.0, 46.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.618183135986328, -15.837410926818848, -13.056638717651367, -10.275867462158203, -7.495095252990723, -4.714323043823242, -1.9335517883300781, 0.8472213745117188, 3.627992630004883, 6.408764839172363, 9.189537048339844, 11.970308303833008, 14.751080513000488, 17.53185272216797, 20.312623977661133, 23.09339714050293, 25.874168395996094, 28.654939651489258, 31.435712814331055, 34.21648406982422, 36.997257232666016, 39.77803039550781, 42.558799743652344, 45.33957290649414, 48.12034606933594, 50.901119232177734, 53.681888580322266, 56.46266174316406, 59.24343490600586, 62.024208068847656, 64.80497741699219, 67.58575439453125, 70.36652374267578, 73.14729309082031, 75.92807006835938, 78.7088394165039, 81.48960876464844, 84.2703857421875, 87.05115509033203, 89.83192443847656, 92.61270141601562, 95.39347076416016, 98.17424774169922, 100.95501708984375, 103.73578643798828, 106.51656341552734, 109.29733276367188, 112.07810974121094, 114.85887145996094, 117.63964080810547, 120.42041778564453, 123.20118713378906, 125.9819564819336, 128.76272583007812, 131.5435028076172, 134.32427978515625, 137.1050567626953, 139.88583374023438, 142.66659545898438, 145.44737243652344, 148.2281494140625, 151.0089111328125, 153.78968811035156, 156.57046508789062, 159.35122680664062]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 6.0, 8.0, 9.0, 9.0, 16.0, 16.0, 18.0, 27.0, 12.0, 26.0, 31.0, 39.0, 34.0, 30.0, 40.0, 41.0, 46.0, 47.0, 40.0, 43.0, 50.0, 47.0, 49.0, 37.0, 48.0, 36.0, 38.0, 27.0, 21.0, 22.0, 18.0, 10.0, 13.0, 8.0, 7.0, 13.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.131559371948242, -29.266071319580078, -28.400583267211914, -27.53509521484375, -26.669607162475586, -25.804119110107422, -24.938629150390625, -24.073143005371094, -23.207653045654297, -22.342164993286133, -21.47667694091797, -20.611188888549805, -19.74570083618164, -18.880212783813477, -18.014724731445312, -17.149234771728516, -16.283748626708984, -15.41826057434082, -14.552772521972656, -13.687284469604492, -12.821796417236328, -11.956308364868164, -11.090819358825684, -10.22533130645752, -9.359843254089355, -8.494355201721191, -7.628867149353027, -6.763378620147705, -5.897890567779541, -5.032402515411377, -4.166913986206055, -3.3014259338378906, -2.4359397888183594, -1.5704516172409058, -0.7049634456634521, 0.16052484512329102, 1.026012897491455, 1.8915009498596191, 2.7569894790649414, 3.6224775314331055, 4.4879655838012695, 5.353453636169434, 6.218941688537598, 7.08443021774292, 7.949918270111084, 8.815406799316406, 9.68089485168457, 10.546382904052734, 11.411870956420898, 12.277359008789062, 13.142847061157227, 14.00833511352539, 14.873823165893555, 15.739311218261719, 16.604801177978516, 17.470287322998047, 18.335777282714844, 19.201265335083008, 20.066753387451172, 20.932241439819336, 21.7977294921875, 22.663217544555664, 23.528705596923828, 24.394195556640625, 25.259681701660156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 2.0, 9.0, 8.0, 11.0, 12.0, 18.0, 15.0, 23.0, 18.0, 23.0, 16.0, 23.0, 24.0, 36.0, 28.0, 39.0, 41.0, 39.0, 35.0, 36.0, 36.0, 59.0, 37.0, 29.0, 32.0, 32.0, 42.0, 27.0, 28.0, 27.0, 22.0, 18.0, 21.0, 23.0, 16.0, 9.0, 8.0, 15.0, 9.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.33203125, -4.20147705078125, -4.0709228515625, -3.94036865234375, -3.809814453125, -3.67926025390625, -3.5487060546875, -3.41815185546875, -3.28759765625, -3.15704345703125, -3.0264892578125, -2.89593505859375, -2.765380859375, -2.63482666015625, -2.5042724609375, -2.37371826171875, -2.2431640625, -2.11260986328125, -1.9820556640625, -1.85150146484375, -1.720947265625, -1.59039306640625, -1.4598388671875, -1.32928466796875, -1.19873046875, -1.06817626953125, -0.9376220703125, -0.80706787109375, -0.676513671875, -0.54595947265625, -0.4154052734375, -0.28485107421875, -0.154296875, -0.02374267578125, 0.1068115234375, 0.23736572265625, 0.367919921875, 0.49847412109375, 0.6290283203125, 0.75958251953125, 0.89013671875, 1.02069091796875, 1.1512451171875, 1.28179931640625, 1.412353515625, 1.54290771484375, 1.6734619140625, 1.80401611328125, 1.9345703125, 2.06512451171875, 2.1956787109375, 2.32623291015625, 2.456787109375, 2.58734130859375, 2.7178955078125, 2.84844970703125, 2.97900390625, 3.10955810546875, 3.2401123046875, 3.37066650390625, 3.501220703125, 3.63177490234375, 3.7623291015625, 3.89288330078125, 4.0234375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 10.0, 13.0, 13.0, 17.0, 20.0, 29.0, 43.0, 47.0, 48.0, 70.0, 101.0, 136.0, 202.0, 316.0, 411.0, 975.0, 35557.0, 4142691.0, 11304.0, 847.0, 430.0, 277.0, 168.0, 127.0, 109.0, 51.0, 64.0, 42.0, 33.0, 27.0, 13.0, 15.0, 15.0, 12.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.4375, -49.89794921875, -48.3583984375, -46.81884765625, -45.279296875, -43.73974609375, -42.2001953125, -40.66064453125, -39.12109375, -37.58154296875, -36.0419921875, -34.50244140625, -32.962890625, -31.42333984375, -29.8837890625, -28.34423828125, -26.8046875, -25.26513671875, -23.7255859375, -22.18603515625, -20.646484375, -19.10693359375, -17.5673828125, -16.02783203125, -14.48828125, -12.94873046875, -11.4091796875, -9.86962890625, -8.330078125, -6.79052734375, -5.2509765625, -3.71142578125, -2.171875, -0.63232421875, 0.9072265625, 2.44677734375, 3.986328125, 5.52587890625, 7.0654296875, 8.60498046875, 10.14453125, 11.68408203125, 13.2236328125, 14.76318359375, 16.302734375, 17.84228515625, 19.3818359375, 20.92138671875, 22.4609375, 24.00048828125, 25.5400390625, 27.07958984375, 28.619140625, 30.15869140625, 31.6982421875, 33.23779296875, 34.77734375, 36.31689453125, 37.8564453125, 39.39599609375, 40.935546875, 42.47509765625, 44.0146484375, 45.55419921875, 47.09375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 8.0, 8.0, 7.0, 8.0, 14.0, 14.0, 28.0, 30.0, 62.0, 79.0, 103.0, 132.0, 212.0, 280.0, 372.0, 566.0, 599.0, 428.0, 342.0, 256.0, 162.0, 113.0, 78.0, 38.0, 29.0, 25.0, 23.0, 21.0, 8.0, 6.0, 7.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.4619140625, -6.232421875, -6.0029296875, -5.7734375, -5.5439453125, -5.314453125, -5.0849609375, -4.85546875, -4.6259765625, -4.396484375, -4.1669921875, -3.9375, -3.7080078125, -3.478515625, -3.2490234375, -3.01953125, -2.7900390625, -2.560546875, -2.3310546875, -2.1015625, -1.8720703125, -1.642578125, -1.4130859375, -1.18359375, -0.9541015625, -0.724609375, -0.4951171875, -0.265625, -0.0361328125, 0.193359375, 0.4228515625, 0.65234375, 0.8818359375, 1.111328125, 1.3408203125, 1.5703125, 1.7998046875, 2.029296875, 2.2587890625, 2.48828125, 2.7177734375, 2.947265625, 3.1767578125, 3.40625, 3.6357421875, 3.865234375, 4.0947265625, 4.32421875, 4.5537109375, 4.783203125, 5.0126953125, 5.2421875, 5.4716796875, 5.701171875, 5.9306640625, 6.16015625, 6.3896484375, 6.619140625, 6.8486328125, 7.078125, 7.3076171875, 7.537109375, 7.7666015625, 7.99609375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 6.0, 11.0, 9.0, 23.0, 26.0, 19.0, 26.0, 45.0, 58.0, 107.0, 171.0, 343.0, 925.0, 4873.0, 79250.0, 3289163.0, 793608.0, 21949.0, 2316.0, 650.0, 237.0, 106.0, 81.0, 59.0, 36.0, 27.0, 28.0, 21.0, 17.0, 15.0, 12.0, 11.0, 4.0, 6.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-24.75, -24.05859375, -23.3671875, -22.67578125, -21.984375, -21.29296875, -20.6015625, -19.91015625, -19.21875, -18.52734375, -17.8359375, -17.14453125, -16.453125, -15.76171875, -15.0703125, -14.37890625, -13.6875, -12.99609375, -12.3046875, -11.61328125, -10.921875, -10.23046875, -9.5390625, -8.84765625, -8.15625, -7.46484375, -6.7734375, -6.08203125, -5.390625, -4.69921875, -4.0078125, -3.31640625, -2.625, -1.93359375, -1.2421875, -0.55078125, 0.140625, 0.83203125, 1.5234375, 2.21484375, 2.90625, 3.59765625, 4.2890625, 4.98046875, 5.671875, 6.36328125, 7.0546875, 7.74609375, 8.4375, 9.12890625, 9.8203125, 10.51171875, 11.203125, 11.89453125, 12.5859375, 13.27734375, 13.96875, 14.66015625, 15.3515625, 16.04296875, 16.734375, 17.42578125, 18.1171875, 18.80859375, 19.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 12.0, 22.0, 38.0, 105.0, 138.0, 187.0, 177.0, 144.0, 102.0, 53.0, 14.0, 9.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.380802154541016, -42.95361328125, -41.526424407958984, -40.09923553466797, -38.67204666137695, -37.24485778808594, -35.81767272949219, -34.390480041503906, -32.963294982910156, -31.53610610961914, -30.108917236328125, -28.68172836303711, -27.254539489746094, -25.827350616455078, -24.400163650512695, -22.97297477722168, -21.54578399658203, -20.118595123291016, -18.69140625, -17.264217376708984, -15.837029457092285, -14.40984058380127, -12.98265266418457, -11.555463790893555, -10.128274917602539, -8.701086044311523, -7.273897647857666, -5.846709251403809, -4.419520378112793, -2.9923315048217773, -1.5651435852050781, -0.1379547119140625, 1.2892341613769531, 2.7164227962493896, 4.143611431121826, 5.570799827575684, 6.997988700866699, 8.425177574157715, 9.852365493774414, 11.27955436706543, 12.706743240356445, 14.133932113647461, 15.561120986938477, 16.98830795288086, 18.415496826171875, 19.84268569946289, 21.269874572753906, 22.697063446044922, 24.124252319335938, 25.551441192626953, 26.97863006591797, 28.405818939208984, 29.8330078125, 31.260196685791016, 32.68738555908203, 34.11457061767578, 35.54176330566406, 36.96895217895508, 38.396141052246094, 39.82332992553711, 41.250518798828125, 42.67770767211914, 44.104896545410156, 45.532081604003906, 46.95927047729492]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 8.0, 6.0, 8.0, 19.0, 9.0, 11.0, 23.0, 15.0, 29.0, 25.0, 22.0, 23.0, 25.0, 40.0, 34.0, 32.0, 35.0, 30.0, 42.0, 47.0, 40.0, 43.0, 41.0, 29.0, 37.0, 34.0, 35.0, 38.0, 26.0, 28.0, 28.0, 20.0, 24.0, 14.0, 10.0, 18.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-22.891695022583008, -22.246932983398438, -21.602170944213867, -20.957408905029297, -20.312646865844727, -19.667884826660156, -19.023122787475586, -18.378360748291016, -17.733596801757812, -17.088834762573242, -16.444072723388672, -15.799310684204102, -15.154548645019531, -14.509786605834961, -13.865023612976074, -13.220261573791504, -12.57550048828125, -11.93073844909668, -11.28597640991211, -10.641214370727539, -9.996452331542969, -9.351690292358398, -8.706927299499512, -8.062165260314941, -7.417403221130371, -6.772641181945801, -6.1278791427612305, -5.483116626739502, -4.838354587554932, -4.193592548370361, -3.548830270767212, -2.9040679931640625, -2.259307861328125, -1.6145457029342651, -0.9697835445404053, -0.3250213861465454, 0.31974077224731445, 0.9645028114318848, 1.6092650890350342, 2.2540273666381836, 2.898789405822754, 3.543551445007324, 4.1883134841918945, 4.833076000213623, 5.477838039398193, 6.122600078582764, 6.767362594604492, 7.4121246337890625, 8.056886672973633, 8.701648712158203, 9.346410751342773, 9.991172790527344, 10.635934829711914, 11.280696868896484, 11.925459861755371, 12.570221900939941, 13.214983940124512, 13.859745979309082, 14.504508018493652, 15.149270057678223, 15.79403305053711, 16.43879508972168, 17.08355712890625, 17.72831916809082, 18.37308120727539]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 8.0, 7.0, 9.0, 12.0, 9.0, 13.0, 11.0, 9.0, 22.0, 26.0, 24.0, 26.0, 24.0, 31.0, 23.0, 38.0, 34.0, 43.0, 36.0, 41.0, 41.0, 44.0, 38.0, 33.0, 41.0, 29.0, 33.0, 36.0, 36.0, 30.0, 25.0, 21.0, 20.0, 16.0, 15.0, 12.0, 17.0, 7.0, 11.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.17578125, -4.04083251953125, -3.9058837890625, -3.77093505859375, -3.635986328125, -3.50103759765625, -3.3660888671875, -3.23114013671875, -3.09619140625, -2.96124267578125, -2.8262939453125, -2.69134521484375, -2.556396484375, -2.42144775390625, -2.2864990234375, -2.15155029296875, -2.0166015625, -1.88165283203125, -1.7467041015625, -1.61175537109375, -1.476806640625, -1.34185791015625, -1.2069091796875, -1.07196044921875, -0.93701171875, -0.80206298828125, -0.6671142578125, -0.53216552734375, -0.397216796875, -0.26226806640625, -0.1273193359375, 0.00762939453125, 0.142578125, 0.27752685546875, 0.4124755859375, 0.54742431640625, 0.682373046875, 0.81732177734375, 0.9522705078125, 1.08721923828125, 1.22216796875, 1.35711669921875, 1.4920654296875, 1.62701416015625, 1.761962890625, 1.89691162109375, 2.0318603515625, 2.16680908203125, 2.3017578125, 2.43670654296875, 2.5716552734375, 2.70660400390625, 2.841552734375, 2.97650146484375, 3.1114501953125, 3.24639892578125, 3.38134765625, 3.51629638671875, 3.6512451171875, 3.78619384765625, 3.921142578125, 4.05609130859375, 4.1910400390625, 4.32598876953125, 4.4609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 6.0, 12.0, 17.0, 20.0, 37.0, 48.0, 73.0, 128.0, 169.0, 247.0, 409.0, 530.0, 785.0, 1146.0, 1723.0, 2488.0, 3573.0, 5115.0, 7581.0, 11050.0, 15834.0, 22940.0, 32454.0, 45991.0, 61715.0, 81568.0, 100548.0, 115169.0, 116326.0, 104308.0, 85488.0, 66519.0, 48796.0, 35254.0, 24921.0, 17164.0, 11935.0, 8209.0, 5682.0, 4017.0, 2652.0, 1876.0, 1293.0, 856.0, 618.0, 410.0, 268.0, 189.0, 151.0, 87.0, 57.0, 31.0, 31.0, 20.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2423095703125, -0.23452186584472656, -0.22673416137695312, -0.2189464569091797, -0.21115875244140625, -0.2033710479736328, -0.19558334350585938, -0.18779563903808594, -0.1800079345703125, -0.17222023010253906, -0.16443252563476562, -0.1566448211669922, -0.14885711669921875, -0.1410694122314453, -0.13328170776367188, -0.12549400329589844, -0.117706298828125, -0.10991859436035156, -0.10213088989257812, -0.09434318542480469, -0.08655548095703125, -0.07876777648925781, -0.07098007202148438, -0.06319236755371094, -0.0554046630859375, -0.04761695861816406, -0.039829254150390625, -0.03204154968261719, -0.02425384521484375, -0.016466140747070312, -0.008678436279296875, -0.0008907318115234375, 0.00689697265625, 0.014684677124023438, 0.022472381591796875, 0.030260086059570312, 0.03804779052734375, 0.04583549499511719, 0.053623199462890625, 0.06141090393066406, 0.0691986083984375, 0.07698631286621094, 0.08477401733398438, 0.09256172180175781, 0.10034942626953125, 0.10813713073730469, 0.11592483520507812, 0.12371253967285156, 0.131500244140625, 0.13928794860839844, 0.14707565307617188, 0.1548633575439453, 0.16265106201171875, 0.1704387664794922, 0.17822647094726562, 0.18601417541503906, 0.1938018798828125, 0.20158958435058594, 0.20937728881835938, 0.2171649932861328, 0.22495269775390625, 0.2327404022216797, 0.24052810668945312, 0.24831581115722656, 0.256103515625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 6.0, 8.0, 16.0, 22.0, 16.0, 13.0, 14.0, 21.0, 33.0, 20.0, 30.0, 28.0, 40.0, 36.0, 38.0, 45.0, 43.0, 48.0, 1069.0, 49.0, 41.0, 40.0, 40.0, 40.0, 32.0, 30.0, 27.0, 25.0, 17.0, 24.0, 24.0, 14.0, 14.0, 13.0, 11.0, 6.0, 2.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.84765625, -3.733551025390625, -3.61944580078125, -3.505340576171875, -3.3912353515625, -3.277130126953125, -3.16302490234375, -3.048919677734375, -2.934814453125, -2.820709228515625, -2.70660400390625, -2.592498779296875, -2.4783935546875, -2.364288330078125, -2.25018310546875, -2.136077880859375, -2.02197265625, -1.907867431640625, -1.79376220703125, -1.679656982421875, -1.5655517578125, -1.451446533203125, -1.33734130859375, -1.223236083984375, -1.109130859375, -0.995025634765625, -0.88092041015625, -0.766815185546875, -0.6527099609375, -0.538604736328125, -0.42449951171875, -0.310394287109375, -0.1962890625, -0.082183837890625, 0.03192138671875, 0.146026611328125, 0.2601318359375, 0.374237060546875, 0.48834228515625, 0.602447509765625, 0.716552734375, 0.830657958984375, 0.94476318359375, 1.058868408203125, 1.1729736328125, 1.287078857421875, 1.40118408203125, 1.515289306640625, 1.62939453125, 1.743499755859375, 1.85760498046875, 1.971710205078125, 2.0858154296875, 2.199920654296875, 2.31402587890625, 2.428131103515625, 2.542236328125, 2.656341552734375, 2.77044677734375, 2.884552001953125, 2.9986572265625, 3.112762451171875, 3.22686767578125, 3.340972900390625, 3.455078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 14.0, 20.0, 39.0, 43.0, 66.0, 109.0, 154.0, 239.0, 410.0, 582.0, 934.0, 1507.0, 2278.0, 3745.0, 5896.0, 9275.0, 14295.0, 22589.0, 34253.0, 51431.0, 74120.0, 101461.0, 147325.0, 1120058.0, 168581.0, 105180.0, 77112.0, 54350.0, 35981.0, 23799.0, 15096.0, 9536.0, 6037.0, 3934.0, 2442.0, 1553.0, 952.0, 613.0, 394.0, 249.0, 172.0, 112.0, 64.0, 46.0, 31.0, 22.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1903076171875, -0.1844635009765625, -0.178619384765625, -0.1727752685546875, -0.16693115234375, -0.1610870361328125, -0.155242919921875, -0.1493988037109375, -0.1435546875, -0.1377105712890625, -0.131866455078125, -0.1260223388671875, -0.12017822265625, -0.1143341064453125, -0.108489990234375, -0.1026458740234375, -0.0968017578125, -0.0909576416015625, -0.085113525390625, -0.0792694091796875, -0.07342529296875, -0.0675811767578125, -0.061737060546875, -0.0558929443359375, -0.050048828125, -0.0442047119140625, -0.038360595703125, -0.0325164794921875, -0.02667236328125, -0.0208282470703125, -0.014984130859375, -0.0091400146484375, -0.0032958984375, 0.0025482177734375, 0.008392333984375, 0.0142364501953125, 0.02008056640625, 0.0259246826171875, 0.031768798828125, 0.0376129150390625, 0.04345703125, 0.0493011474609375, 0.055145263671875, 0.0609893798828125, 0.06683349609375, 0.0726776123046875, 0.078521728515625, 0.0843658447265625, 0.0902099609375, 0.0960540771484375, 0.101898193359375, 0.1077423095703125, 0.11358642578125, 0.1194305419921875, 0.125274658203125, 0.1311187744140625, 0.136962890625, 0.1428070068359375, 0.148651123046875, 0.1544952392578125, 0.16033935546875, 0.1661834716796875, 0.172027587890625, 0.1778717041015625, 0.1837158203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 6.0, 13.0, 11.0, 11.0, 23.0, 15.0, 32.0, 40.0, 39.0, 48.0, 48.0, 62.0, 47.0, 70.0, 64.0, 53.0, 61.0, 46.0, 51.0, 49.0, 30.0, 29.0, 26.0, 23.0, 19.0, 16.0, 10.0, 10.0, 9.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.042572021484375, -0.04148054122924805, -0.040389060974121094, -0.03929758071899414, -0.03820610046386719, -0.037114620208740234, -0.03602313995361328, -0.03493165969848633, -0.033840179443359375, -0.03274869918823242, -0.03165721893310547, -0.030565738677978516, -0.029474258422851562, -0.02838277816772461, -0.027291297912597656, -0.026199817657470703, -0.02510833740234375, -0.024016857147216797, -0.022925376892089844, -0.02183389663696289, -0.020742416381835938, -0.019650936126708984, -0.01855945587158203, -0.017467975616455078, -0.016376495361328125, -0.015285015106201172, -0.014193534851074219, -0.013102054595947266, -0.012010574340820312, -0.01091909408569336, -0.009827613830566406, -0.008736133575439453, -0.0076446533203125, -0.006553173065185547, -0.005461692810058594, -0.004370212554931641, -0.0032787322998046875, -0.0021872520446777344, -0.0010957717895507812, -4.291534423828125e-06, 0.001087188720703125, 0.002178668975830078, 0.0032701492309570312, 0.004361629486083984, 0.0054531097412109375, 0.006544589996337891, 0.007636070251464844, 0.008727550506591797, 0.00981903076171875, 0.010910511016845703, 0.012001991271972656, 0.01309347152709961, 0.014184951782226562, 0.015276432037353516, 0.01636791229248047, 0.017459392547607422, 0.018550872802734375, 0.019642353057861328, 0.02073383331298828, 0.021825313568115234, 0.022916793823242188, 0.02400827407836914, 0.025099754333496094, 0.026191234588623047, 0.02728271484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 14.0, 10.0, 21.0, 28.0, 26.0, 45.0, 64.0, 67.0, 105.0, 152.0, 286.0, 496.0, 1073.0, 687285.0, 356617.0, 1003.0, 449.0, 241.0, 171.0, 113.0, 83.0, 46.0, 30.0, 31.0, 21.0, 16.0, 17.0, 5.0, 7.0, 9.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5263900756835938, -0.5044403076171875, -0.48249053955078125, -0.460540771484375, -0.43859100341796875, -0.4166412353515625, -0.39469146728515625, -0.37274169921875, -0.35079193115234375, -0.3288421630859375, -0.30689239501953125, -0.284942626953125, -0.26299285888671875, -0.2410430908203125, -0.21909332275390625, -0.1971435546875, -0.17519378662109375, -0.1532440185546875, -0.13129425048828125, -0.109344482421875, -0.08739471435546875, -0.0654449462890625, -0.04349517822265625, -0.02154541015625, 0.00040435791015625, 0.0223541259765625, 0.04430389404296875, 0.066253662109375, 0.08820343017578125, 0.1101531982421875, 0.13210296630859375, 0.154052734375, 0.17600250244140625, 0.1979522705078125, 0.21990203857421875, 0.241851806640625, 0.26380157470703125, 0.2857513427734375, 0.30770111083984375, 0.32965087890625, 0.35160064697265625, 0.3735504150390625, 0.39550018310546875, 0.417449951171875, 0.43939971923828125, 0.4613494873046875, 0.48329925537109375, 0.5052490234375, 0.5271987915039062, 0.5491485595703125, 0.5710983276367188, 0.593048095703125, 0.6149978637695312, 0.6369476318359375, 0.6588973999023438, 0.68084716796875, 0.7027969360351562, 0.7247467041015625, 0.7466964721679688, 0.768646240234375, 0.7905960083007812, 0.8125457763671875, 0.8344955444335938, 0.8564453125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 776.0, 228.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8343996405601501, -0.814490795135498, -0.794581949710846, -0.7746731042861938, -0.7547642588615417, -0.7348554134368896, -0.7149465680122375, -0.6950377225875854, -0.6751288175582886, -0.6552199721336365, -0.6353111267089844, -0.6154022812843323, -0.5954934358596802, -0.5755845904350281, -0.555675745010376, -0.5357668399810791, -0.5158580541610718, -0.4959492087364197, -0.4760403633117676, -0.4561315178871155, -0.4362226724624634, -0.4163138270378113, -0.3964049518108368, -0.3764961063861847, -0.3565872609615326, -0.3366784155368805, -0.3167695701122284, -0.2968607246875763, -0.2769518494606018, -0.2570430040359497, -0.2371341586112976, -0.2172253131866455, -0.1973164975643158, -0.1774076521396637, -0.1574988067150116, -0.1375899463891983, -0.1176811009645462, -0.0977722555398941, -0.07786340266466141, -0.05795454978942871, -0.03804570436477661, -0.018136855214834213, 0.0017719939351081848, 0.021680843085050583, 0.04158969223499298, 0.06149853765964508, 0.08140739053487778, 0.10131624341011047, 0.12122508883476257, 0.14113393425941467, 0.16104277968406677, 0.18095164000988007, 0.20086048543453217, 0.22076933085918427, 0.24067819118499756, 0.26058703660964966, 0.28049588203430176, 0.30040472745895386, 0.32031357288360596, 0.34022241830825806, 0.36013126373291016, 0.38004010915756226, 0.39994898438453674, 0.41985782980918884, 0.43976667523384094]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 5.0, 5.0, 16.0, 11.0, 19.0, 20.0, 22.0, 19.0, 27.0, 25.0, 36.0, 28.0, 28.0, 38.0, 39.0, 40.0, 44.0, 47.0, 35.0, 41.0, 32.0, 52.0, 33.0, 37.0, 35.0, 34.0, 30.0, 25.0, 29.0, 18.0, 22.0, 20.0, 12.0, 14.0, 12.0, 6.0, 9.0, 2.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09104681015014648, -0.08815265446901321, -0.08525849878787994, -0.08236434310674667, -0.0794701874256134, -0.07657602429389954, -0.07368186861276627, -0.070787712931633, -0.06789355725049973, -0.06499940156936646, -0.062105245888233185, -0.059211086481809616, -0.056316930800676346, -0.053422775119543076, -0.05052861571311951, -0.04763446003198624, -0.044740304350852966, -0.041846148669719696, -0.038951992988586426, -0.03605783358216286, -0.03316367790102959, -0.030269522219896317, -0.027375364676117897, -0.024481207132339478, -0.021587051451206207, -0.018692895770072937, -0.015798738226294518, -0.012904581613838673, -0.010010425001382828, -0.007116268388926983, -0.004222111776471138, -0.0013279542326927185, 0.0015662014484405518, 0.004460358060896397, 0.0073545146733522415, 0.010248671285808086, 0.013142827898263931, 0.0160369835793972, 0.01893114112317562, 0.02182529866695404, 0.02471945434808731, 0.02761361002922058, 0.030507767572999, 0.03340192511677742, 0.03629608079791069, 0.03919023647904396, 0.04208439588546753, 0.0449785515666008, 0.04787270724773407, 0.05076686292886734, 0.05366101861000061, 0.05655517801642418, 0.05944933369755745, 0.06234348937869072, 0.06523764878511429, 0.06813180446624756, 0.07102596014738083, 0.0739201158285141, 0.07681427150964737, 0.07970842719078064, 0.0826025903224945, 0.08549674600362778, 0.08839090168476105, 0.09128505736589432, 0.09417921304702759]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 5.0, 6.0, 3.0, 11.0, 7.0, 7.0, 7.0, 12.0, 13.0, 29.0, 14.0, 20.0, 25.0, 40.0, 34.0, 37.0, 33.0, 32.0, 54.0, 33.0, 39.0, 48.0, 47.0, 38.0, 48.0, 48.0, 35.0, 34.0, 27.0, 27.0, 32.0, 16.0, 18.0, 24.0, 19.0, 16.0, 17.0, 9.0, 10.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.453125, -4.3077392578125, -4.162353515625, -4.0169677734375, -3.87158203125, -3.7261962890625, -3.580810546875, -3.4354248046875, -3.2900390625, -3.1446533203125, -2.999267578125, -2.8538818359375, -2.70849609375, -2.5631103515625, -2.417724609375, -2.2723388671875, -2.126953125, -1.9815673828125, -1.836181640625, -1.6907958984375, -1.54541015625, -1.4000244140625, -1.254638671875, -1.1092529296875, -0.9638671875, -0.8184814453125, -0.673095703125, -0.5277099609375, -0.38232421875, -0.2369384765625, -0.091552734375, 0.0538330078125, 0.19921875, 0.3446044921875, 0.489990234375, 0.6353759765625, 0.78076171875, 0.9261474609375, 1.071533203125, 1.2169189453125, 1.3623046875, 1.5076904296875, 1.653076171875, 1.7984619140625, 1.94384765625, 2.0892333984375, 2.234619140625, 2.3800048828125, 2.525390625, 2.6707763671875, 2.816162109375, 2.9615478515625, 3.10693359375, 3.2523193359375, 3.397705078125, 3.5430908203125, 3.6884765625, 3.8338623046875, 3.979248046875, 4.1246337890625, 4.27001953125, 4.4154052734375, 4.560791015625, 4.7061767578125, 4.8515625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 4.0, 12.0, 14.0, 10.0, 9.0, 35.0, 31.0, 42.0, 50.0, 68.0, 97.0, 124.0, 185.0, 240.0, 402.0, 572.0, 975.0, 1603.0, 3151.0, 6231.0, 13316.0, 28464.0, 62666.0, 142451.0, 289677.0, 268289.0, 125099.0, 55232.0, 25189.0, 11715.0, 5490.0, 2777.0, 1602.0, 910.0, 595.0, 333.0, 234.0, 162.0, 114.0, 104.0, 73.0, 45.0, 43.0, 34.0, 17.0, 11.0, 12.0, 12.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0], "bins": [-5.37109375, -5.20794677734375, -5.0447998046875, -4.88165283203125, -4.718505859375, -4.55535888671875, -4.3922119140625, -4.22906494140625, -4.06591796875, -3.90277099609375, -3.7396240234375, -3.57647705078125, -3.413330078125, -3.25018310546875, -3.0870361328125, -2.92388916015625, -2.7607421875, -2.59759521484375, -2.4344482421875, -2.27130126953125, -2.108154296875, -1.94500732421875, -1.7818603515625, -1.61871337890625, -1.45556640625, -1.29241943359375, -1.1292724609375, -0.96612548828125, -0.802978515625, -0.63983154296875, -0.4766845703125, -0.31353759765625, -0.150390625, 0.01275634765625, 0.1759033203125, 0.33905029296875, 0.502197265625, 0.66534423828125, 0.8284912109375, 0.99163818359375, 1.15478515625, 1.31793212890625, 1.4810791015625, 1.64422607421875, 1.807373046875, 1.97052001953125, 2.1336669921875, 2.29681396484375, 2.4599609375, 2.62310791015625, 2.7862548828125, 2.94940185546875, 3.112548828125, 3.27569580078125, 3.4388427734375, 3.60198974609375, 3.76513671875, 3.92828369140625, 4.0914306640625, 4.25457763671875, 4.417724609375, 4.58087158203125, 4.7440185546875, 4.90716552734375, 5.0703125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 3.0, 4.0, 7.0, 9.0, 6.0, 18.0, 15.0, 30.0, 32.0, 42.0, 46.0, 53.0, 61.0, 77.0, 110.0, 249.0, 1438.0, 260.0, 149.0, 88.0, 58.0, 53.0, 37.0, 35.0, 21.0, 29.0, 21.0, 21.0, 10.0, 12.0, 12.0, 9.0, 8.0, 6.0, 9.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-16.65625, -16.2359619140625, -15.815673828125, -15.3953857421875, -14.97509765625, -14.5548095703125, -14.134521484375, -13.7142333984375, -13.2939453125, -12.8736572265625, -12.453369140625, -12.0330810546875, -11.61279296875, -11.1925048828125, -10.772216796875, -10.3519287109375, -9.931640625, -9.5113525390625, -9.091064453125, -8.6707763671875, -8.25048828125, -7.8302001953125, -7.409912109375, -6.9896240234375, -6.5693359375, -6.1490478515625, -5.728759765625, -5.3084716796875, -4.88818359375, -4.4678955078125, -4.047607421875, -3.6273193359375, -3.20703125, -2.7867431640625, -2.366455078125, -1.9461669921875, -1.52587890625, -1.1055908203125, -0.685302734375, -0.2650146484375, 0.1552734375, 0.5755615234375, 0.995849609375, 1.4161376953125, 1.83642578125, 2.2567138671875, 2.677001953125, 3.0972900390625, 3.517578125, 3.9378662109375, 4.358154296875, 4.7784423828125, 5.19873046875, 5.6190185546875, 6.039306640625, 6.4595947265625, 6.8798828125, 7.3001708984375, 7.720458984375, 8.1407470703125, 8.56103515625, 8.9813232421875, 9.401611328125, 9.8218994140625, 10.2421875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 6.0, 6.0, 8.0, 16.0, 9.0, 12.0, 20.0, 26.0, 26.0, 40.0, 62.0, 96.0, 117.0, 189.0, 273.0, 446.0, 742.0, 1568.0, 32052.0, 3097894.0, 8918.0, 1348.0, 615.0, 379.0, 220.0, 150.0, 107.0, 91.0, 51.0, 46.0, 31.0, 26.0, 22.0, 19.0, 19.0, 8.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.40625, -33.23583984375, -32.0654296875, -30.89501953125, -29.724609375, -28.55419921875, -27.3837890625, -26.21337890625, -25.04296875, -23.87255859375, -22.7021484375, -21.53173828125, -20.361328125, -19.19091796875, -18.0205078125, -16.85009765625, -15.6796875, -14.50927734375, -13.3388671875, -12.16845703125, -10.998046875, -9.82763671875, -8.6572265625, -7.48681640625, -6.31640625, -5.14599609375, -3.9755859375, -2.80517578125, -1.634765625, -0.46435546875, 0.7060546875, 1.87646484375, 3.046875, 4.21728515625, 5.3876953125, 6.55810546875, 7.728515625, 8.89892578125, 10.0693359375, 11.23974609375, 12.41015625, 13.58056640625, 14.7509765625, 15.92138671875, 17.091796875, 18.26220703125, 19.4326171875, 20.60302734375, 21.7734375, 22.94384765625, 24.1142578125, 25.28466796875, 26.455078125, 27.62548828125, 28.7958984375, 29.96630859375, 31.13671875, 32.30712890625, 33.4775390625, 34.64794921875, 35.818359375, 36.98876953125, 38.1591796875, 39.32958984375, 40.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 65.0, 458.0, 437.0, 50.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.62403869628906, -207.70347595214844, -203.78289794921875, -199.86233520507812, -195.94175720214844, -192.0211944580078, -188.10061645507812, -184.1800537109375, -180.25949096679688, -176.33892822265625, -172.41835021972656, -168.49778747558594, -164.57720947265625, -160.65664672851562, -156.73606872558594, -152.8155059814453, -148.89492797851562, -144.974365234375, -141.0537872314453, -137.1332244873047, -133.212646484375, -129.29208374023438, -125.37151336669922, -121.45094299316406, -117.5303726196289, -113.60980224609375, -109.6892318725586, -105.76866149902344, -101.84809875488281, -97.92752075195312, -94.0069580078125, -90.08638763427734, -86.16582489013672, -82.24525451660156, -78.3246841430664, -74.40411376953125, -70.48355102539062, -66.56297302246094, -62.64241027832031, -58.721839904785156, -54.80126953125, -50.880699157714844, -46.96012878417969, -43.0395622253418, -39.11899185180664, -35.198421478271484, -31.27785301208496, -27.357284545898438, -23.43671417236328, -19.516143798828125, -15.595575332641602, -11.675005912780762, -7.754436492919922, -3.8338661193847656, 0.08670234680175781, 4.007270812988281, 7.9278411865234375, 11.848410606384277, 15.768980026245117, 19.68954849243164, 23.610118865966797, 27.530689239501953, 31.451257705688477, 35.371826171875, 39.292396545410156]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 7.0, 15.0, 6.0, 10.0, 16.0, 23.0, 18.0, 19.0, 26.0, 34.0, 21.0, 36.0, 33.0, 39.0, 51.0, 40.0, 39.0, 40.0, 42.0, 44.0, 37.0, 51.0, 40.0, 30.0, 30.0, 29.0, 30.0, 31.0, 24.0, 24.0, 14.0, 14.0, 11.0, 13.0, 10.0, 12.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.30635643005371, -26.326505661010742, -25.346656799316406, -24.366806030273438, -23.38695526123047, -22.4071044921875, -21.427255630493164, -20.447404861450195, -19.46755599975586, -18.48770523071289, -17.507856369018555, -16.528005599975586, -15.548154830932617, -14.568305015563965, -13.588455200195312, -12.608604431152344, -11.628753662109375, -10.648903846740723, -9.669053077697754, -8.689203262329102, -7.709352970123291, -6.7295026779174805, -5.749652862548828, -4.769802570343018, -3.789952278137207, -2.8101019859313965, -1.830251932144165, -0.8504018783569336, 0.12944841384887695, 1.1092987060546875, 2.08914852142334, 3.0689988136291504, 4.048847198486328, 5.028697490692139, 6.008547782897949, 6.988397598266602, 7.968247890472412, 8.948098182678223, 9.927947998046875, 10.907798767089844, 11.887648582458496, 12.867498397827148, 13.847349166870117, 14.82719898223877, 15.807048797607422, 16.78689956665039, 17.76675033569336, 18.746599197387695, 19.726449966430664, 20.706300735473633, 21.68614959716797, 22.666000366210938, 23.645851135253906, 24.625701904296875, 25.60555076599121, 26.58540153503418, 27.565250396728516, 28.545101165771484, 29.52495002746582, 30.50480079650879, 31.484651565551758, 32.464500427246094, 33.44435119628906, 34.42420196533203, 35.404052734375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 7.0, 8.0, 4.0, 12.0, 15.0, 16.0, 12.0, 13.0, 16.0, 20.0, 28.0, 31.0, 35.0, 30.0, 28.0, 49.0, 38.0, 44.0, 46.0, 39.0, 39.0, 30.0, 42.0, 40.0, 39.0, 40.0, 36.0, 27.0, 26.0, 26.0, 20.0, 22.0, 20.0, 18.0, 12.0, 11.0, 17.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.19921875, -5.0511474609375, -4.903076171875, -4.7550048828125, -4.60693359375, -4.4588623046875, -4.310791015625, -4.1627197265625, -4.0146484375, -3.8665771484375, -3.718505859375, -3.5704345703125, -3.42236328125, -3.2742919921875, -3.126220703125, -2.9781494140625, -2.830078125, -2.6820068359375, -2.533935546875, -2.3858642578125, -2.23779296875, -2.0897216796875, -1.941650390625, -1.7935791015625, -1.6455078125, -1.4974365234375, -1.349365234375, -1.2012939453125, -1.05322265625, -0.9051513671875, -0.757080078125, -0.6090087890625, -0.4609375, -0.3128662109375, -0.164794921875, -0.0167236328125, 0.13134765625, 0.2794189453125, 0.427490234375, 0.5755615234375, 0.7236328125, 0.8717041015625, 1.019775390625, 1.1678466796875, 1.31591796875, 1.4639892578125, 1.612060546875, 1.7601318359375, 1.908203125, 2.0562744140625, 2.204345703125, 2.3524169921875, 2.50048828125, 2.6485595703125, 2.796630859375, 2.9447021484375, 3.0927734375, 3.2408447265625, 3.388916015625, 3.5369873046875, 3.68505859375, 3.8331298828125, 3.981201171875, 4.1292724609375, 4.27734375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 2.0, 7.0, 5.0, 12.0, 13.0, 14.0, 30.0, 28.0, 36.0, 50.0, 78.0, 92.0, 132.0, 181.0, 256.0, 424.0, 712.0, 1379.0, 3192.0, 8648.0, 33422.0, 205145.0, 1115541.0, 2052146.0, 635853.0, 105914.0, 20076.0, 5879.0, 2272.0, 1069.0, 556.0, 339.0, 213.0, 135.0, 105.0, 69.0, 53.0, 57.0, 37.0, 27.0, 19.0, 18.0, 13.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.0078125, -7.760009765625, -7.51220703125, -7.264404296875, -7.0166015625, -6.768798828125, -6.52099609375, -6.273193359375, -6.025390625, -5.777587890625, -5.52978515625, -5.281982421875, -5.0341796875, -4.786376953125, -4.53857421875, -4.290771484375, -4.04296875, -3.795166015625, -3.54736328125, -3.299560546875, -3.0517578125, -2.803955078125, -2.55615234375, -2.308349609375, -2.060546875, -1.812744140625, -1.56494140625, -1.317138671875, -1.0693359375, -0.821533203125, -0.57373046875, -0.325927734375, -0.078125, 0.169677734375, 0.41748046875, 0.665283203125, 0.9130859375, 1.160888671875, 1.40869140625, 1.656494140625, 1.904296875, 2.152099609375, 2.39990234375, 2.647705078125, 2.8955078125, 3.143310546875, 3.39111328125, 3.638916015625, 3.88671875, 4.134521484375, 4.38232421875, 4.630126953125, 4.8779296875, 5.125732421875, 5.37353515625, 5.621337890625, 5.869140625, 6.116943359375, 6.36474609375, 6.612548828125, 6.8603515625, 7.108154296875, 7.35595703125, 7.603759765625, 7.8515625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 14.0, 22.0, 8.0, 19.0, 31.0, 49.0, 62.0, 60.0, 90.0, 104.0, 157.0, 219.0, 237.0, 313.0, 441.0, 461.0, 404.0, 317.0, 224.0, 196.0, 145.0, 109.0, 84.0, 69.0, 60.0, 39.0, 34.0, 24.0, 21.0, 15.0, 7.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.37109375, -7.15625, -6.94140625, -6.7265625, -6.51171875, -6.296875, -6.08203125, -5.8671875, -5.65234375, -5.4375, -5.22265625, -5.0078125, -4.79296875, -4.578125, -4.36328125, -4.1484375, -3.93359375, -3.71875, -3.50390625, -3.2890625, -3.07421875, -2.859375, -2.64453125, -2.4296875, -2.21484375, -2.0, -1.78515625, -1.5703125, -1.35546875, -1.140625, -0.92578125, -0.7109375, -0.49609375, -0.28125, -0.06640625, 0.1484375, 0.36328125, 0.578125, 0.79296875, 1.0078125, 1.22265625, 1.4375, 1.65234375, 1.8671875, 2.08203125, 2.296875, 2.51171875, 2.7265625, 2.94140625, 3.15625, 3.37109375, 3.5859375, 3.80078125, 4.015625, 4.23046875, 4.4453125, 4.66015625, 4.875, 5.08984375, 5.3046875, 5.51953125, 5.734375, 5.94921875, 6.1640625, 6.37890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 6.0, 5.0, 5.0, 9.0, 28.0, 20.0, 36.0, 52.0, 75.0, 132.0, 203.0, 322.0, 689.0, 1395.0, 3560.0, 12721.0, 97328.0, 1354299.0, 2502392.0, 192416.0, 20232.0, 4800.0, 1769.0, 771.0, 406.0, 208.0, 130.0, 84.0, 71.0, 44.0, 21.0, 17.0, 13.0, 14.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.2109375, -9.8046875, -9.3984375, -8.9921875, -8.5859375, -8.1796875, -7.7734375, -7.3671875, -6.9609375, -6.5546875, -6.1484375, -5.7421875, -5.3359375, -4.9296875, -4.5234375, -4.1171875, -3.7109375, -3.3046875, -2.8984375, -2.4921875, -2.0859375, -1.6796875, -1.2734375, -0.8671875, -0.4609375, -0.0546875, 0.3515625, 0.7578125, 1.1640625, 1.5703125, 1.9765625, 2.3828125, 2.7890625, 3.1953125, 3.6015625, 4.0078125, 4.4140625, 4.8203125, 5.2265625, 5.6328125, 6.0390625, 6.4453125, 6.8515625, 7.2578125, 7.6640625, 8.0703125, 8.4765625, 8.8828125, 9.2890625, 9.6953125, 10.1015625, 10.5078125, 10.9140625, 11.3203125, 11.7265625, 12.1328125, 12.5390625, 12.9453125, 13.3515625, 13.7578125, 14.1640625, 14.5703125, 14.9765625, 15.3828125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 130.0, 723.0, 154.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-395.3408508300781, -387.9526062011719, -380.56439208984375, -373.1761474609375, -365.7879333496094, -358.3996887207031, -351.0114440917969, -343.62322998046875, -336.2349853515625, -328.84674072265625, -321.4585266113281, -314.0702819824219, -306.68206787109375, -299.2938232421875, -291.90557861328125, -284.5173645019531, -277.1291198730469, -269.7408752441406, -262.3526611328125, -254.96441650390625, -247.57618713378906, -240.18795776367188, -232.7997283935547, -225.4114990234375, -218.0232696533203, -210.63504028320312, -203.24681091308594, -195.8585662841797, -188.4703369140625, -181.0821075439453, -173.69387817382812, -166.30563354492188, -158.91741943359375, -151.52919006347656, -144.14096069335938, -136.75271606445312, -129.36448669433594, -121.97625732421875, -114.58802795410156, -107.19979095458984, -99.81155395507812, -92.42332458496094, -85.03508758544922, -77.64685821533203, -70.25862121582031, -62.870391845703125, -55.48215866088867, -48.09392547607422, -40.7056884765625, -33.31745529174805, -25.929222106933594, -18.540990829467773, -11.15275764465332, -3.7645263671875, 3.623706817626953, 11.011940002441406, 18.40017318725586, 25.788406372070312, 33.176639556884766, 40.56487274169922, 47.953102111816406, 55.34133529663086, 62.72956848144531, 70.1177978515625, 77.50603485107422]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 3.0, 8.0, 2.0, 5.0, 8.0, 11.0, 10.0, 17.0, 17.0, 27.0, 34.0, 24.0, 31.0, 32.0, 35.0, 28.0, 26.0, 40.0, 32.0, 30.0, 34.0, 36.0, 39.0, 38.0, 44.0, 41.0, 36.0, 40.0, 26.0, 28.0, 32.0, 28.0, 18.0, 18.0, 14.0, 21.0, 17.0, 17.0, 10.0, 11.0, 4.0, 3.0, 9.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.094703674316406, -26.293514251708984, -25.492326736450195, -24.691137313842773, -23.88994789123535, -23.088760375976562, -22.28757095336914, -21.48638153076172, -20.685192108154297, -19.884002685546875, -19.082815170288086, -18.281625747680664, -17.480436325073242, -16.679248809814453, -15.878059387207031, -15.07686996459961, -14.27568244934082, -13.474493980407715, -12.673304557800293, -11.872116088867188, -11.070926666259766, -10.26973819732666, -9.468549728393555, -8.667360305786133, -7.866171836853027, -7.064982891082764, -6.2637939453125, -5.4626054763793945, -4.661416530609131, -3.860227584838867, -3.0590391159057617, -2.257850170135498, -1.4566612243652344, -0.6554723978042603, 0.14571642875671387, 0.9469051361083984, 1.748094081878662, 2.549283027648926, 3.3504714965820312, 4.151660442352295, 4.952849388122559, 5.754038333892822, 6.555227279663086, 7.356415748596191, 8.157604217529297, 8.958793640136719, 9.759982109069824, 10.56117057800293, 11.362360000610352, 12.163548469543457, 12.964737892150879, 13.765926361083984, 14.567115783691406, 15.368304252624512, 16.169492721557617, 16.97068214416504, 17.771869659423828, 18.57305908203125, 19.37424659729004, 20.17543601989746, 20.976625442504883, 21.777812957763672, 22.579002380371094, 23.380191802978516, 24.181381225585938]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 3.0, 11.0, 13.0, 12.0, 15.0, 19.0, 16.0, 22.0, 20.0, 30.0, 33.0, 36.0, 31.0, 31.0, 39.0, 42.0, 28.0, 53.0, 38.0, 34.0, 42.0, 42.0, 33.0, 33.0, 39.0, 35.0, 38.0, 27.0, 31.0, 26.0, 19.0, 17.0, 10.0, 16.0, 7.0, 6.0, 4.0, 11.0, 6.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.1875, -4.06036376953125, -3.9332275390625, -3.80609130859375, -3.678955078125, -3.55181884765625, -3.4246826171875, -3.29754638671875, -3.17041015625, -3.04327392578125, -2.9161376953125, -2.78900146484375, -2.661865234375, -2.53472900390625, -2.4075927734375, -2.28045654296875, -2.1533203125, -2.02618408203125, -1.8990478515625, -1.77191162109375, -1.644775390625, -1.51763916015625, -1.3905029296875, -1.26336669921875, -1.13623046875, -1.00909423828125, -0.8819580078125, -0.75482177734375, -0.627685546875, -0.50054931640625, -0.3734130859375, -0.24627685546875, -0.119140625, 0.00799560546875, 0.1351318359375, 0.26226806640625, 0.389404296875, 0.51654052734375, 0.6436767578125, 0.77081298828125, 0.89794921875, 1.02508544921875, 1.1522216796875, 1.27935791015625, 1.406494140625, 1.53363037109375, 1.6607666015625, 1.78790283203125, 1.9150390625, 2.04217529296875, 2.1693115234375, 2.29644775390625, 2.423583984375, 2.55072021484375, 2.6778564453125, 2.80499267578125, 2.93212890625, 3.05926513671875, 3.1864013671875, 3.31353759765625, 3.440673828125, 3.56781005859375, 3.6949462890625, 3.82208251953125, 3.94921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 16.0, 17.0, 37.0, 50.0, 83.0, 134.0, 235.0, 362.0, 556.0, 974.0, 1663.0, 2695.0, 4393.0, 7197.0, 11202.0, 18019.0, 27908.0, 42898.0, 63838.0, 90156.0, 117869.0, 137005.0, 136201.0, 116880.0, 88708.0, 62533.0, 42165.0, 27684.0, 17796.0, 11270.0, 6985.0, 4242.0, 2653.0, 1573.0, 966.0, 655.0, 362.0, 222.0, 120.0, 85.0, 40.0, 34.0, 24.0, 12.0, 5.0, 11.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24027633666992188, -0.23226165771484375, -0.22424697875976562, -0.2162322998046875, -0.20821762084960938, -0.20020294189453125, -0.19218826293945312, -0.184173583984375, -0.17615890502929688, -0.16814422607421875, -0.16012954711914062, -0.1521148681640625, -0.14410018920898438, -0.13608551025390625, -0.12807083129882812, -0.12005615234375, -0.11204147338867188, -0.10402679443359375, -0.09601211547851562, -0.0879974365234375, -0.07998275756835938, -0.07196807861328125, -0.06395339965820312, -0.055938720703125, -0.047924041748046875, -0.03990936279296875, -0.031894683837890625, -0.0238800048828125, -0.015865325927734375, -0.00785064697265625, 0.000164031982421875, 0.0081787109375, 0.016193389892578125, 0.02420806884765625, 0.032222747802734375, 0.0402374267578125, 0.048252105712890625, 0.05626678466796875, 0.06428146362304688, 0.072296142578125, 0.08031082153320312, 0.08832550048828125, 0.09634017944335938, 0.1043548583984375, 0.11236953735351562, 0.12038421630859375, 0.12839889526367188, 0.13641357421875, 0.14442825317382812, 0.15244293212890625, 0.16045761108398438, 0.1684722900390625, 0.17648696899414062, 0.18450164794921875, 0.19251632690429688, 0.200531005859375, 0.20854568481445312, 0.21656036376953125, 0.22457504272460938, 0.2325897216796875, 0.24060440063476562, 0.24861907958984375, 0.2566337585449219, 0.2646484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 9.0, 10.0, 15.0, 13.0, 18.0, 19.0, 30.0, 33.0, 33.0, 34.0, 43.0, 28.0, 53.0, 55.0, 42.0, 44.0, 1067.0, 42.0, 46.0, 43.0, 42.0, 42.0, 26.0, 36.0, 36.0, 29.0, 27.0, 25.0, 15.0, 14.0, 15.0, 10.0, 10.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.227752685546875, -3.12738037109375, -3.027008056640625, -2.9266357421875, -2.826263427734375, -2.72589111328125, -2.625518798828125, -2.525146484375, -2.424774169921875, -2.32440185546875, -2.224029541015625, -2.1236572265625, -2.023284912109375, -1.92291259765625, -1.822540283203125, -1.72216796875, -1.621795654296875, -1.52142333984375, -1.421051025390625, -1.3206787109375, -1.220306396484375, -1.11993408203125, -1.019561767578125, -0.919189453125, -0.818817138671875, -0.71844482421875, -0.618072509765625, -0.5177001953125, -0.417327880859375, -0.31695556640625, -0.216583251953125, -0.1162109375, -0.015838623046875, 0.08453369140625, 0.184906005859375, 0.2852783203125, 0.385650634765625, 0.48602294921875, 0.586395263671875, 0.686767578125, 0.787139892578125, 0.88751220703125, 0.987884521484375, 1.0882568359375, 1.188629150390625, 1.28900146484375, 1.389373779296875, 1.48974609375, 1.590118408203125, 1.69049072265625, 1.790863037109375, 1.8912353515625, 1.991607666015625, 2.09197998046875, 2.192352294921875, 2.292724609375, 2.393096923828125, 2.49346923828125, 2.593841552734375, 2.6942138671875, 2.794586181640625, 2.89495849609375, 2.995330810546875, 3.095703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 14.0, 26.0, 29.0, 48.0, 76.0, 97.0, 179.0, 260.0, 425.0, 669.0, 1030.0, 1449.0, 2260.0, 3488.0, 5485.0, 8150.0, 12378.0, 18718.0, 27670.0, 40571.0, 57271.0, 77589.0, 99796.0, 138982.0, 1145913.0, 119982.0, 94948.0, 72916.0, 53265.0, 37342.0, 25459.0, 17350.0, 11579.0, 7355.0, 4973.0, 3215.0, 2156.0, 1451.0, 914.0, 585.0, 364.0, 239.0, 149.0, 104.0, 75.0, 49.0, 27.0, 26.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.15234375, -0.14764022827148438, -0.14293670654296875, -0.13823318481445312, -0.1335296630859375, -0.12882614135742188, -0.12412261962890625, -0.11941909790039062, -0.114715576171875, -0.11001205444335938, -0.10530853271484375, -0.10060501098632812, -0.0959014892578125, -0.09119796752929688, -0.08649444580078125, -0.08179092407226562, -0.07708740234375, -0.07238388061523438, -0.06768035888671875, -0.06297683715820312, -0.0582733154296875, -0.053569793701171875, -0.04886627197265625, -0.044162750244140625, -0.039459228515625, -0.034755706787109375, -0.03005218505859375, -0.025348663330078125, -0.0206451416015625, -0.015941619873046875, -0.01123809814453125, -0.006534576416015625, -0.0018310546875, 0.002872467041015625, 0.00757598876953125, 0.012279510498046875, 0.0169830322265625, 0.021686553955078125, 0.02639007568359375, 0.031093597412109375, 0.035797119140625, 0.040500640869140625, 0.04520416259765625, 0.049907684326171875, 0.0546112060546875, 0.059314727783203125, 0.06401824951171875, 0.06872177124023438, 0.07342529296875, 0.07812881469726562, 0.08283233642578125, 0.08753585815429688, 0.0922393798828125, 0.09694290161132812, 0.10164642333984375, 0.10634994506835938, 0.111053466796875, 0.11575698852539062, 0.12046051025390625, 0.12516403198242188, 0.1298675537109375, 0.13457107543945312, 0.13927459716796875, 0.14397811889648438, 0.148681640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 8.0, 5.0, 6.0, 9.0, 13.0, 15.0, 19.0, 8.0, 20.0, 24.0, 20.0, 31.0, 36.0, 39.0, 42.0, 48.0, 53.0, 57.0, 60.0, 56.0, 55.0, 69.0, 36.0, 38.0, 40.0, 22.0, 24.0, 16.0, 18.0, 13.0, 10.0, 14.0, 14.0, 11.0, 8.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01134490966796875, -0.010989069938659668, -0.010633230209350586, -0.010277390480041504, -0.009921550750732422, -0.00956571102142334, -0.009209871292114258, -0.008854031562805176, -0.008498191833496094, -0.008142352104187012, -0.00778651237487793, -0.007430672645568848, -0.007074832916259766, -0.006718993186950684, -0.0063631534576416016, -0.0060073137283325195, -0.0056514739990234375, -0.0052956342697143555, -0.0049397945404052734, -0.004583954811096191, -0.004228115081787109, -0.0038722753524780273, -0.0035164356231689453, -0.0031605958938598633, -0.0028047561645507812, -0.0024489164352416992, -0.002093076705932617, -0.0017372369766235352, -0.0013813972473144531, -0.001025557518005371, -0.0006697177886962891, -0.00031387805938720703, 4.1961669921875e-05, 0.00039780139923095703, 0.0007536411285400391, 0.001109480857849121, 0.0014653205871582031, 0.0018211603164672852, 0.002177000045776367, 0.0025328397750854492, 0.0028886795043945312, 0.0032445192337036133, 0.0036003589630126953, 0.003956198692321777, 0.004312038421630859, 0.004667878150939941, 0.0050237178802490234, 0.0053795576095581055, 0.0057353973388671875, 0.0060912370681762695, 0.0064470767974853516, 0.006802916526794434, 0.007158756256103516, 0.007514595985412598, 0.00787043571472168, 0.008226275444030762, 0.008582115173339844, 0.008937954902648926, 0.009293794631958008, 0.00964963436126709, 0.010005474090576172, 0.010361313819885254, 0.010717153549194336, 0.011072993278503418, 0.0114288330078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 6.0, 11.0, 4.0, 8.0, 10.0, 21.0, 22.0, 29.0, 47.0, 42.0, 75.0, 99.0, 145.0, 244.0, 466.0, 1184.0, 773286.0, 270492.0, 1065.0, 456.0, 225.0, 164.0, 120.0, 83.0, 43.0, 49.0, 29.0, 29.0, 20.0, 15.0, 11.0, 9.0, 10.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26953125, -0.2613525390625, -0.253173828125, -0.2449951171875, -0.23681640625, -0.2286376953125, -0.220458984375, -0.2122802734375, -0.2041015625, -0.1959228515625, -0.187744140625, -0.1795654296875, -0.17138671875, -0.1632080078125, -0.155029296875, -0.1468505859375, -0.138671875, -0.1304931640625, -0.122314453125, -0.1141357421875, -0.10595703125, -0.0977783203125, -0.089599609375, -0.0814208984375, -0.0732421875, -0.0650634765625, -0.056884765625, -0.0487060546875, -0.04052734375, -0.0323486328125, -0.024169921875, -0.0159912109375, -0.0078125, 0.0003662109375, 0.008544921875, 0.0167236328125, 0.02490234375, 0.0330810546875, 0.041259765625, 0.0494384765625, 0.0576171875, 0.0657958984375, 0.073974609375, 0.0821533203125, 0.09033203125, 0.0985107421875, 0.106689453125, 0.1148681640625, 0.123046875, 0.1312255859375, 0.139404296875, 0.1475830078125, 0.15576171875, 0.1639404296875, 0.172119140625, 0.1802978515625, 0.1884765625, 0.1966552734375, 0.204833984375, 0.2130126953125, 0.22119140625, 0.2293701171875, 0.237548828125, 0.2457275390625, 0.25390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 83.0, 926.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2616235315799713, -0.25420960783958435, -0.24679569900035858, -0.2393817901611328, -0.23196786642074585, -0.2245539426803589, -0.21714003384113312, -0.20972612500190735, -0.20231220126152039, -0.19489827752113342, -0.18748436868190765, -0.18007045984268188, -0.17265653610229492, -0.16524261236190796, -0.1578287035226822, -0.15041479468345642, -0.14300087094306946, -0.1355869472026825, -0.12817303836345673, -0.12075912207365036, -0.113345205783844, -0.10593128949403763, -0.09851737320423126, -0.0911034569144249, -0.08368954062461853, -0.07627562433481216, -0.0688617080450058, -0.06144779175519943, -0.054033875465393066, -0.0466199591755867, -0.039206042885780334, -0.03179212659597397, -0.024378225207328796, -0.01696430891752243, -0.009550392627716064, -0.0021364763379096985, 0.0052774399518966675, 0.012691356241703033, 0.0201052725315094, 0.027519188821315765, 0.03493310511112213, 0.0423470214009285, 0.04976093769073486, 0.05717485398054123, 0.0645887702703476, 0.07200268656015396, 0.07941660284996033, 0.0868305191397667, 0.09424443542957306, 0.10165835171937943, 0.10907226800918579, 0.11648618429899216, 0.12390010058879852, 0.1313140094280243, 0.13872793316841125, 0.14614185690879822, 0.153555765748024, 0.16096967458724976, 0.16838359832763672, 0.17579752206802368, 0.18321143090724945, 0.19062533974647522, 0.19803926348686218, 0.20545318722724915, 0.21286709606647491]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 7.0, 4.0, 11.0, 21.0, 22.0, 26.0, 21.0, 43.0, 29.0, 39.0, 37.0, 47.0, 45.0, 54.0, 59.0, 69.0, 53.0, 57.0, 42.0, 52.0, 36.0, 42.0, 42.0, 35.0, 22.0, 20.0, 18.0, 23.0, 7.0, 4.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031251490116119385, -0.03008616715669632, -0.028920846059918404, -0.027755524963140488, -0.026590202003717422, -0.025424879044294357, -0.02425955794751644, -0.023094236850738525, -0.02192891389131546, -0.020763590931892395, -0.01959826983511448, -0.018432948738336563, -0.017267625778913498, -0.016102302819490433, -0.014936981722712517, -0.013771659694612026, -0.012606337666511536, -0.011441015638411045, -0.010275693610310555, -0.009110371582210064, -0.007945049554109573, -0.006779727526009083, -0.005614405497908592, -0.004449083469808102, -0.003283761441707611, -0.0021184394136071205, -0.0009531173855066299, 0.00021220464259386063, 0.0013775266706943512, 0.0025428486987948418, 0.0037081707268953323, 0.004873492754995823, 0.0060388147830963135, 0.007204136811196804, 0.008369458839297295, 0.009534780867397785, 0.010700102895498276, 0.011865424923598766, 0.013030746951699257, 0.014196068979799747, 0.015361391007900238, 0.016526713967323303, 0.01769203506410122, 0.018857356160879135, 0.0200226791203022, 0.021188002079725266, 0.02235332317650318, 0.023518644273281097, 0.024683967232704163, 0.025849290192127228, 0.027014611288905144, 0.02817993238568306, 0.029345255345106125, 0.03051057830452919, 0.03167589753866196, 0.03284122049808502, 0.03400654345750809, 0.03517186641693115, 0.03633718937635422, 0.037502508610486984, 0.03866783156991005, 0.039833154529333115, 0.04099847376346588, 0.04216379672288895, 0.04332911968231201]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 0.0, 2.0, 5.0, 8.0, 9.0, 11.0, 9.0, 12.0, 12.0, 22.0, 21.0, 21.0, 21.0, 33.0, 31.0, 32.0, 33.0, 41.0, 43.0, 30.0, 32.0, 40.0, 32.0, 43.0, 40.0, 41.0, 49.0, 39.0, 35.0, 34.0, 29.0, 22.0, 21.0, 25.0, 20.0, 17.0, 12.0, 11.0, 5.0, 13.0, 6.0, 4.0, 5.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.776824951171875, -3.65325927734375, -3.529693603515625, -3.4061279296875, -3.282562255859375, -3.15899658203125, -3.035430908203125, -2.911865234375, -2.788299560546875, -2.66473388671875, -2.541168212890625, -2.4176025390625, -2.294036865234375, -2.17047119140625, -2.046905517578125, -1.92333984375, -1.799774169921875, -1.67620849609375, -1.552642822265625, -1.4290771484375, -1.305511474609375, -1.18194580078125, -1.058380126953125, -0.934814453125, -0.811248779296875, -0.68768310546875, -0.564117431640625, -0.4405517578125, -0.316986083984375, -0.19342041015625, -0.069854736328125, 0.0537109375, 0.177276611328125, 0.30084228515625, 0.424407958984375, 0.5479736328125, 0.671539306640625, 0.79510498046875, 0.918670654296875, 1.042236328125, 1.165802001953125, 1.28936767578125, 1.412933349609375, 1.5364990234375, 1.660064697265625, 1.78363037109375, 1.907196044921875, 2.03076171875, 2.154327392578125, 2.27789306640625, 2.401458740234375, 2.5250244140625, 2.648590087890625, 2.77215576171875, 2.895721435546875, 3.019287109375, 3.142852783203125, 3.26641845703125, 3.389984130859375, 3.5135498046875, 3.637115478515625, 3.76068115234375, 3.884246826171875, 4.0078125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 5.0, 6.0, 7.0, 12.0, 19.0, 20.0, 31.0, 38.0, 47.0, 56.0, 56.0, 90.0, 119.0, 164.0, 226.0, 311.0, 383.0, 604.0, 930.0, 1549.0, 2730.0, 5598.0, 13055.0, 34109.0, 104126.0, 369769.0, 355584.0, 100684.0, 32679.0, 12741.0, 5434.0, 2716.0, 1504.0, 939.0, 609.0, 421.0, 299.0, 231.0, 172.0, 114.0, 104.0, 82.0, 41.0, 31.0, 31.0, 20.0, 20.0, 19.0, 7.0, 10.0, 1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5440673828125, -5.345947265625, -5.1478271484375, -4.94970703125, -4.7515869140625, -4.553466796875, -4.3553466796875, -4.1572265625, -3.9591064453125, -3.760986328125, -3.5628662109375, -3.36474609375, -3.1666259765625, -2.968505859375, -2.7703857421875, -2.572265625, -2.3741455078125, -2.176025390625, -1.9779052734375, -1.77978515625, -1.5816650390625, -1.383544921875, -1.1854248046875, -0.9873046875, -0.7891845703125, -0.591064453125, -0.3929443359375, -0.19482421875, 0.0032958984375, 0.201416015625, 0.3995361328125, 0.59765625, 0.7957763671875, 0.993896484375, 1.1920166015625, 1.39013671875, 1.5882568359375, 1.786376953125, 1.9844970703125, 2.1826171875, 2.3807373046875, 2.578857421875, 2.7769775390625, 2.97509765625, 3.1732177734375, 3.371337890625, 3.5694580078125, 3.767578125, 3.9656982421875, 4.163818359375, 4.3619384765625, 4.56005859375, 4.7581787109375, 4.956298828125, 5.1544189453125, 5.3525390625, 5.5506591796875, 5.748779296875, 5.9468994140625, 6.14501953125, 6.3431396484375, 6.541259765625, 6.7393798828125, 6.9375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 11.0, 10.0, 9.0, 13.0, 18.0, 13.0, 32.0, 16.0, 33.0, 38.0, 44.0, 51.0, 67.0, 88.0, 185.0, 1486.0, 358.0, 120.0, 77.0, 61.0, 47.0, 45.0, 33.0, 37.0, 32.0, 18.0, 14.0, 9.0, 14.0, 5.0, 12.0, 10.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3828125, -10.0460205078125, -9.709228515625, -9.3724365234375, -9.03564453125, -8.6988525390625, -8.362060546875, -8.0252685546875, -7.6884765625, -7.3516845703125, -7.014892578125, -6.6781005859375, -6.34130859375, -6.0045166015625, -5.667724609375, -5.3309326171875, -4.994140625, -4.6573486328125, -4.320556640625, -3.9837646484375, -3.64697265625, -3.3101806640625, -2.973388671875, -2.6365966796875, -2.2998046875, -1.9630126953125, -1.626220703125, -1.2894287109375, -0.95263671875, -0.6158447265625, -0.279052734375, 0.0577392578125, 0.39453125, 0.7313232421875, 1.068115234375, 1.4049072265625, 1.74169921875, 2.0784912109375, 2.415283203125, 2.7520751953125, 3.0888671875, 3.4256591796875, 3.762451171875, 4.0992431640625, 4.43603515625, 4.7728271484375, 5.109619140625, 5.4464111328125, 5.783203125, 6.1199951171875, 6.456787109375, 6.7935791015625, 7.13037109375, 7.4671630859375, 7.803955078125, 8.1407470703125, 8.4775390625, 8.8143310546875, 9.151123046875, 9.4879150390625, 9.82470703125, 10.1614990234375, 10.498291015625, 10.8350830078125, 11.171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 10.0, 5.0, 1.0, 4.0, 15.0, 9.0, 18.0, 14.0, 16.0, 28.0, 37.0, 66.0, 80.0, 129.0, 146.0, 206.0, 309.0, 556.0, 1123.0, 4946.0, 3080673.0, 53627.0, 1649.0, 704.0, 414.0, 254.0, 188.0, 107.0, 99.0, 74.0, 53.0, 29.0, 28.0, 15.0, 12.0, 13.0, 15.0, 8.0, 4.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.421875, -29.431396484375, -28.44091796875, -27.450439453125, -26.4599609375, -25.469482421875, -24.47900390625, -23.488525390625, -22.498046875, -21.507568359375, -20.51708984375, -19.526611328125, -18.5361328125, -17.545654296875, -16.55517578125, -15.564697265625, -14.57421875, -13.583740234375, -12.59326171875, -11.602783203125, -10.6123046875, -9.621826171875, -8.63134765625, -7.640869140625, -6.650390625, -5.659912109375, -4.66943359375, -3.678955078125, -2.6884765625, -1.697998046875, -0.70751953125, 0.282958984375, 1.2734375, 2.263916015625, 3.25439453125, 4.244873046875, 5.2353515625, 6.225830078125, 7.21630859375, 8.206787109375, 9.197265625, 10.187744140625, 11.17822265625, 12.168701171875, 13.1591796875, 14.149658203125, 15.14013671875, 16.130615234375, 17.12109375, 18.111572265625, 19.10205078125, 20.092529296875, 21.0830078125, 22.073486328125, 23.06396484375, 24.054443359375, 25.044921875, 26.035400390625, 27.02587890625, 28.016357421875, 29.0068359375, 29.997314453125, 30.98779296875, 31.978271484375, 32.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 14.0, 16.0, 25.0, 45.0, 64.0, 78.0, 118.0, 134.0, 122.0, 103.0, 99.0, 73.0, 50.0, 37.0, 16.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.8044490814209, -29.020065307617188, -28.235681533813477, -27.451297760009766, -26.666912078857422, -25.88252830505371, -25.09814453125, -24.31376075744629, -23.529376983642578, -22.744993209838867, -21.960609436035156, -21.176223754882812, -20.3918399810791, -19.60745620727539, -18.82307243347168, -18.03868865966797, -17.254302978515625, -16.469919204711914, -15.685534477233887, -14.901150703430176, -14.116765975952148, -13.332382202148438, -12.547998428344727, -11.763614654541016, -10.979229927062988, -10.194846153259277, -9.41046142578125, -8.626077651977539, -7.84169340133667, -7.057309150695801, -6.27292537689209, -5.488541126251221, -4.704158782958984, -3.9197745323181152, -3.135390520095825, -2.351006507873535, -1.566622257232666, -0.7822380065917969, 0.0021457672119140625, 0.7865300178527832, 1.5709142684936523, 2.3552985191345215, 3.1396825313568115, 3.9240665435791016, 4.708450794219971, 5.49283504486084, 6.277218818664551, 7.06160306930542, 7.845987319946289, 8.63037109375, 9.414755821228027, 10.199139595031738, 10.983524322509766, 11.767908096313477, 12.552291870117188, 13.336675643920898, 14.121060371398926, 14.905444145202637, 15.689828872680664, 16.474212646484375, 17.258596420288086, 18.042980194091797, 18.82736587524414, 19.61174964904785, 20.396133422851562]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 5.0, 11.0, 12.0, 13.0, 8.0, 16.0, 19.0, 24.0, 33.0, 28.0, 28.0, 34.0, 35.0, 42.0, 31.0, 41.0, 46.0, 36.0, 43.0, 47.0, 40.0, 43.0, 33.0, 41.0, 28.0, 45.0, 30.0, 31.0, 29.0, 15.0, 18.0, 19.0, 13.0, 14.0, 10.0, 9.0, 13.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.280887603759766, -24.459938049316406, -23.638988494873047, -22.818038940429688, -21.997089385986328, -21.17613983154297, -20.35519027709961, -19.53424072265625, -18.71329116821289, -17.89234161376953, -17.071392059326172, -16.250442504882812, -15.429492950439453, -14.608543395996094, -13.787593841552734, -12.966644287109375, -12.145694732666016, -11.324745178222656, -10.503795623779297, -9.682846069335938, -8.861896514892578, -8.040946960449219, -7.219997406005859, -6.3990478515625, -5.578098297119141, -4.757148742675781, -3.936199188232422, -3.1152496337890625, -2.294300079345703, -1.4733505249023438, -0.6524009704589844, 0.168548583984375, 0.9894981384277344, 1.8104476928710938, 2.631397247314453, 3.4523468017578125, 4.273296356201172, 5.094245910644531, 5.915195465087891, 6.73614501953125, 7.557094573974609, 8.378044128417969, 9.198993682861328, 10.019943237304688, 10.840892791748047, 11.661842346191406, 12.482791900634766, 13.303741455078125, 14.124691009521484, 14.945640563964844, 15.766590118408203, 16.587539672851562, 17.408489227294922, 18.22943878173828, 19.05038833618164, 19.871337890625, 20.69228744506836, 21.51323699951172, 22.334186553955078, 23.155136108398438, 23.976085662841797, 24.797035217285156, 25.617984771728516, 26.438934326171875, 27.259883880615234]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 3.0, 9.0, 6.0, 5.0, 12.0, 8.0, 12.0, 9.0, 16.0, 17.0, 20.0, 26.0, 37.0, 40.0, 24.0, 36.0, 31.0, 34.0, 40.0, 45.0, 51.0, 44.0, 43.0, 43.0, 42.0, 35.0, 36.0, 39.0, 28.0, 23.0, 36.0, 22.0, 19.0, 21.0, 13.0, 15.0, 9.0, 7.0, 5.0, 8.0, 8.0, 5.0, 12.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.1029052734375, -3.967529296875, -3.8321533203125, -3.69677734375, -3.5614013671875, -3.426025390625, -3.2906494140625, -3.1552734375, -3.0198974609375, -2.884521484375, -2.7491455078125, -2.61376953125, -2.4783935546875, -2.343017578125, -2.2076416015625, -2.072265625, -1.9368896484375, -1.801513671875, -1.6661376953125, -1.53076171875, -1.3953857421875, -1.260009765625, -1.1246337890625, -0.9892578125, -0.8538818359375, -0.718505859375, -0.5831298828125, -0.44775390625, -0.3123779296875, -0.177001953125, -0.0416259765625, 0.09375, 0.2291259765625, 0.364501953125, 0.4998779296875, 0.63525390625, 0.7706298828125, 0.906005859375, 1.0413818359375, 1.1767578125, 1.3121337890625, 1.447509765625, 1.5828857421875, 1.71826171875, 1.8536376953125, 1.989013671875, 2.1243896484375, 2.259765625, 2.3951416015625, 2.530517578125, 2.6658935546875, 2.80126953125, 2.9366455078125, 3.072021484375, 3.2073974609375, 3.3427734375, 3.4781494140625, 3.613525390625, 3.7489013671875, 3.88427734375, 4.0196533203125, 4.155029296875, 4.2904052734375, 4.42578125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 7.0, 4.0, 4.0, 11.0, 12.0, 9.0, 17.0, 28.0, 29.0, 40.0, 43.0, 62.0, 81.0, 136.0, 181.0, 255.0, 449.0, 715.0, 1388.0, 2991.0, 7427.0, 23874.0, 127766.0, 874293.0, 2279117.0, 736290.0, 105498.0, 20851.0, 6761.0, 2702.0, 1347.0, 653.0, 362.0, 269.0, 152.0, 102.0, 77.0, 63.0, 63.0, 23.0, 37.0, 22.0, 17.0, 20.0, 6.0, 9.0, 11.0, 5.0, 1.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-8.5625, -8.3065185546875, -8.050537109375, -7.7945556640625, -7.53857421875, -7.2825927734375, -7.026611328125, -6.7706298828125, -6.5146484375, -6.2586669921875, -6.002685546875, -5.7467041015625, -5.49072265625, -5.2347412109375, -4.978759765625, -4.7227783203125, -4.466796875, -4.2108154296875, -3.954833984375, -3.6988525390625, -3.44287109375, -3.1868896484375, -2.930908203125, -2.6749267578125, -2.4189453125, -2.1629638671875, -1.906982421875, -1.6510009765625, -1.39501953125, -1.1390380859375, -0.883056640625, -0.6270751953125, -0.37109375, -0.1151123046875, 0.140869140625, 0.3968505859375, 0.65283203125, 0.9088134765625, 1.164794921875, 1.4207763671875, 1.6767578125, 1.9327392578125, 2.188720703125, 2.4447021484375, 2.70068359375, 2.9566650390625, 3.212646484375, 3.4686279296875, 3.724609375, 3.9805908203125, 4.236572265625, 4.4925537109375, 4.74853515625, 5.0045166015625, 5.260498046875, 5.5164794921875, 5.7724609375, 6.0284423828125, 6.284423828125, 6.5404052734375, 6.79638671875, 7.0523681640625, 7.308349609375, 7.5643310546875, 7.8203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 14.0, 16.0, 28.0, 28.0, 73.0, 61.0, 87.0, 128.0, 130.0, 217.0, 312.0, 371.0, 403.0, 437.0, 420.0, 298.0, 277.0, 198.0, 145.0, 107.0, 75.0, 62.0, 46.0, 41.0, 22.0, 19.0, 14.0, 7.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.890625, -7.68963623046875, -7.4886474609375, -7.28765869140625, -7.086669921875, -6.88568115234375, -6.6846923828125, -6.48370361328125, -6.28271484375, -6.08172607421875, -5.8807373046875, -5.67974853515625, -5.478759765625, -5.27777099609375, -5.0767822265625, -4.87579345703125, -4.6748046875, -4.47381591796875, -4.2728271484375, -4.07183837890625, -3.870849609375, -3.66986083984375, -3.4688720703125, -3.26788330078125, -3.06689453125, -2.86590576171875, -2.6649169921875, -2.46392822265625, -2.262939453125, -2.06195068359375, -1.8609619140625, -1.65997314453125, -1.458984375, -1.25799560546875, -1.0570068359375, -0.85601806640625, -0.655029296875, -0.45404052734375, -0.2530517578125, -0.05206298828125, 0.14892578125, 0.34991455078125, 0.5509033203125, 0.75189208984375, 0.952880859375, 1.15386962890625, 1.3548583984375, 1.55584716796875, 1.7568359375, 1.95782470703125, 2.1588134765625, 2.35980224609375, 2.560791015625, 2.76177978515625, 2.9627685546875, 3.16375732421875, 3.36474609375, 3.56573486328125, 3.7667236328125, 3.96771240234375, 4.168701171875, 4.36968994140625, 4.5706787109375, 4.77166748046875, 4.97265625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 16.0, 25.0, 37.0, 58.0, 65.0, 98.0, 152.0, 277.0, 481.0, 1002.0, 2376.0, 7313.0, 40261.0, 609738.0, 3181315.0, 315518.0, 26134.0, 5544.0, 1905.0, 831.0, 440.0, 233.0, 147.0, 104.0, 59.0, 33.0, 28.0, 19.0, 11.0, 8.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.109375, -9.726318359375, -9.34326171875, -8.960205078125, -8.5771484375, -8.194091796875, -7.81103515625, -7.427978515625, -7.044921875, -6.661865234375, -6.27880859375, -5.895751953125, -5.5126953125, -5.129638671875, -4.74658203125, -4.363525390625, -3.98046875, -3.597412109375, -3.21435546875, -2.831298828125, -2.4482421875, -2.065185546875, -1.68212890625, -1.299072265625, -0.916015625, -0.532958984375, -0.14990234375, 0.233154296875, 0.6162109375, 0.999267578125, 1.38232421875, 1.765380859375, 2.1484375, 2.531494140625, 2.91455078125, 3.297607421875, 3.6806640625, 4.063720703125, 4.44677734375, 4.829833984375, 5.212890625, 5.595947265625, 5.97900390625, 6.362060546875, 6.7451171875, 7.128173828125, 7.51123046875, 7.894287109375, 8.27734375, 8.660400390625, 9.04345703125, 9.426513671875, 9.8095703125, 10.192626953125, 10.57568359375, 10.958740234375, 11.341796875, 11.724853515625, 12.10791015625, 12.490966796875, 12.8740234375, 13.257080078125, 13.64013671875, 14.023193359375, 14.40625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 44.0, 319.0, 491.0, 141.0, 13.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.48143005371094, -124.89381408691406, -120.30619812011719, -115.71857452392578, -111.1309585571289, -106.54334259033203, -101.95571899414062, -97.36810302734375, -92.78048706054688, -88.19287109375, -83.60525512695312, -79.01763153076172, -74.43001556396484, -69.84239959716797, -65.25477600097656, -60.66716003417969, -56.07954406738281, -51.49192810058594, -46.9043083190918, -42.316688537597656, -37.72907257080078, -33.141456604003906, -28.553836822509766, -23.966217041015625, -19.37860107421875, -14.790983200073242, -10.203365325927734, -5.615747451782227, -1.0281295776367188, 3.559488296508789, 8.147106170654297, 12.734725952148438, 17.32232666015625, 21.909944534301758, 26.497562408447266, 31.085180282592773, 35.67279815673828, 40.260414123535156, 44.8480339050293, 49.43565368652344, 54.02326965332031, 58.61088562011719, 63.19850540161133, 67.78612518310547, 72.37374114990234, 76.96135711669922, 81.54898071289062, 86.1365966796875, 90.72421264648438, 95.31182861328125, 99.89944458007812, 104.48706817626953, 109.0746841430664, 113.66230010986328, 118.24992370605469, 122.83753967285156, 127.42515563964844, 132.0127716064453, 136.6003875732422, 141.18800354003906, 145.775634765625, 150.36325073242188, 154.95086669921875, 159.53848266601562, 164.1260986328125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 10.0, 9.0, 18.0, 11.0, 14.0, 24.0, 19.0, 27.0, 31.0, 25.0, 40.0, 29.0, 38.0, 39.0, 39.0, 39.0, 52.0, 38.0, 38.0, 54.0, 48.0, 39.0, 41.0, 37.0, 38.0, 25.0, 17.0, 22.0, 15.0, 15.0, 23.0, 18.0, 10.0, 8.0, 7.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-26.379919052124023, -25.61302375793457, -24.84613037109375, -24.079235076904297, -23.312339782714844, -22.54544448852539, -21.778549194335938, -21.011655807495117, -20.244760513305664, -19.47786521911621, -18.71097183227539, -17.944076538085938, -17.177181243896484, -16.41028594970703, -15.643391609191895, -14.876497268676758, -14.109601974487305, -13.342706680297852, -12.575812339782715, -11.808917999267578, -11.042022705078125, -10.275127410888672, -9.508233070373535, -8.741338729858398, -7.974443435668945, -7.20754861831665, -6.4406538009643555, -5.6737589836120605, -4.906864166259766, -4.139969348907471, -3.373074531555176, -2.606179714202881, -1.8392829895019531, -1.0723881721496582, -0.3054933547973633, 0.46140146255493164, 1.2282962799072266, 1.9951910972595215, 2.7620859146118164, 3.5289807319641113, 4.295875549316406, 5.062770366668701, 5.829665184020996, 6.596560001373291, 7.363454818725586, 8.130350112915039, 8.897244453430176, 9.664138793945312, 10.431034088134766, 11.197929382324219, 11.964823722839355, 12.731718063354492, 13.498613357543945, 14.265508651733398, 15.032402992248535, 15.799297332763672, 16.566192626953125, 17.333087921142578, 18.09998321533203, 18.86687660217285, 19.633771896362305, 20.400667190551758, 21.167560577392578, 21.93445587158203, 22.701351165771484]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 1.0, 9.0, 4.0, 5.0, 3.0, 9.0, 16.0, 18.0, 16.0, 12.0, 25.0, 15.0, 13.0, 26.0, 27.0, 31.0, 41.0, 39.0, 34.0, 41.0, 38.0, 31.0, 48.0, 46.0, 48.0, 36.0, 46.0, 38.0, 28.0, 30.0, 30.0, 29.0, 20.0, 25.0, 21.0, 17.0, 16.0, 13.0, 11.0, 10.0, 6.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.638671875, -3.52362060546875, -3.4085693359375, -3.29351806640625, -3.178466796875, -3.06341552734375, -2.9483642578125, -2.83331298828125, -2.71826171875, -2.60321044921875, -2.4881591796875, -2.37310791015625, -2.258056640625, -2.14300537109375, -2.0279541015625, -1.91290283203125, -1.7978515625, -1.68280029296875, -1.5677490234375, -1.45269775390625, -1.337646484375, -1.22259521484375, -1.1075439453125, -0.99249267578125, -0.87744140625, -0.76239013671875, -0.6473388671875, -0.53228759765625, -0.417236328125, -0.30218505859375, -0.1871337890625, -0.07208251953125, 0.04296875, 0.15802001953125, 0.2730712890625, 0.38812255859375, 0.503173828125, 0.61822509765625, 0.7332763671875, 0.84832763671875, 0.96337890625, 1.07843017578125, 1.1934814453125, 1.30853271484375, 1.423583984375, 1.53863525390625, 1.6536865234375, 1.76873779296875, 1.8837890625, 1.99884033203125, 2.1138916015625, 2.22894287109375, 2.343994140625, 2.45904541015625, 2.5740966796875, 2.68914794921875, 2.80419921875, 2.91925048828125, 3.0343017578125, 3.14935302734375, 3.264404296875, 3.37945556640625, 3.4945068359375, 3.60955810546875, 3.724609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 16.0, 25.0, 33.0, 67.0, 77.0, 123.0, 190.0, 281.0, 471.0, 683.0, 1121.0, 1710.0, 2754.0, 4086.0, 6394.0, 10420.0, 15608.0, 24369.0, 37308.0, 55193.0, 80415.0, 108007.0, 132059.0, 140477.0, 123649.0, 96609.0, 69614.0, 47493.0, 31518.0, 20586.0, 13360.0, 8653.0, 5472.0, 3504.0, 2248.0, 1442.0, 920.0, 588.0, 362.0, 224.0, 173.0, 100.0, 60.0, 31.0, 26.0, 17.0, 13.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.20952415466308594, -0.20237350463867188, -0.1952228546142578, -0.18807220458984375, -0.1809215545654297, -0.17377090454101562, -0.16662025451660156, -0.1594696044921875, -0.15231895446777344, -0.14516830444335938, -0.1380176544189453, -0.13086700439453125, -0.12371635437011719, -0.11656570434570312, -0.10941505432128906, -0.102264404296875, -0.09511375427246094, -0.08796310424804688, -0.08081245422363281, -0.07366180419921875, -0.06651115417480469, -0.059360504150390625, -0.05220985412597656, -0.0450592041015625, -0.03790855407714844, -0.030757904052734375, -0.023607254028320312, -0.01645660400390625, -0.009305953979492188, -0.002155303955078125, 0.0049953460693359375, 0.01214599609375, 0.019296646118164062, 0.026447296142578125, 0.03359794616699219, 0.04074859619140625, 0.04789924621582031, 0.055049896240234375, 0.06220054626464844, 0.0693511962890625, 0.07650184631347656, 0.08365249633789062, 0.09080314636230469, 0.09795379638671875, 0.10510444641113281, 0.11225509643554688, 0.11940574645996094, 0.126556396484375, 0.13370704650878906, 0.14085769653320312, 0.1480083465576172, 0.15515899658203125, 0.1623096466064453, 0.16946029663085938, 0.17661094665527344, 0.1837615966796875, 0.19091224670410156, 0.19806289672851562, 0.2052135467529297, 0.21236419677734375, 0.2195148468017578, 0.22666549682617188, 0.23381614685058594, 0.240966796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 5.0, 10.0, 8.0, 16.0, 20.0, 22.0, 25.0, 20.0, 44.0, 21.0, 37.0, 38.0, 36.0, 47.0, 47.0, 44.0, 1062.0, 31.0, 49.0, 35.0, 47.0, 42.0, 40.0, 42.0, 34.0, 34.0, 22.0, 24.0, 18.0, 17.0, 13.0, 10.0, 13.0, 7.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.736785888671875, -2.64544677734375, -2.554107666015625, -2.4627685546875, -2.371429443359375, -2.28009033203125, -2.188751220703125, -2.097412109375, -2.006072998046875, -1.91473388671875, -1.823394775390625, -1.7320556640625, -1.640716552734375, -1.54937744140625, -1.458038330078125, -1.36669921875, -1.275360107421875, -1.18402099609375, -1.092681884765625, -1.0013427734375, -0.910003662109375, -0.81866455078125, -0.727325439453125, -0.635986328125, -0.544647216796875, -0.45330810546875, -0.361968994140625, -0.2706298828125, -0.179290771484375, -0.08795166015625, 0.003387451171875, 0.0947265625, 0.186065673828125, 0.27740478515625, 0.368743896484375, 0.4600830078125, 0.551422119140625, 0.64276123046875, 0.734100341796875, 0.825439453125, 0.916778564453125, 1.00811767578125, 1.099456787109375, 1.1907958984375, 1.282135009765625, 1.37347412109375, 1.464813232421875, 1.55615234375, 1.647491455078125, 1.73883056640625, 1.830169677734375, 1.9215087890625, 2.012847900390625, 2.10418701171875, 2.195526123046875, 2.286865234375, 2.378204345703125, 2.46954345703125, 2.560882568359375, 2.6522216796875, 2.743560791015625, 2.83489990234375, 2.926239013671875, 3.017578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 12.0, 22.0, 35.0, 46.0, 69.0, 130.0, 170.0, 315.0, 525.0, 814.0, 1367.0, 2338.0, 3619.0, 5805.0, 9105.0, 14573.0, 22508.0, 34117.0, 51274.0, 73381.0, 99306.0, 133726.0, 1130506.0, 166673.0, 105520.0, 79066.0, 55932.0, 37931.0, 24923.0, 16096.0, 10173.0, 6430.0, 4009.0, 2484.0, 1592.0, 968.0, 598.0, 372.0, 216.0, 141.0, 82.0, 57.0, 44.0, 24.0, 11.0, 10.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.15771484375, -0.1527271270751953, -0.14773941040039062, -0.14275169372558594, -0.13776397705078125, -0.13277626037597656, -0.12778854370117188, -0.12280082702636719, -0.1178131103515625, -0.11282539367675781, -0.10783767700195312, -0.10284996032714844, -0.09786224365234375, -0.09287452697753906, -0.08788681030273438, -0.08289909362792969, -0.077911376953125, -0.07292366027832031, -0.06793594360351562, -0.06294822692871094, -0.05796051025390625, -0.05297279357910156, -0.047985076904296875, -0.04299736022949219, -0.0380096435546875, -0.03302192687988281, -0.028034210205078125, -0.023046493530273438, -0.01805877685546875, -0.013071060180664062, -0.008083343505859375, -0.0030956268310546875, 0.00189208984375, 0.0068798065185546875, 0.011867523193359375, 0.016855239868164062, 0.02184295654296875, 0.026830673217773438, 0.031818389892578125, 0.03680610656738281, 0.0417938232421875, 0.04678153991699219, 0.051769256591796875, 0.05675697326660156, 0.06174468994140625, 0.06673240661621094, 0.07172012329101562, 0.07670783996582031, 0.081695556640625, 0.08668327331542969, 0.09167098999023438, 0.09665870666503906, 0.10164642333984375, 0.10663414001464844, 0.11162185668945312, 0.11660957336425781, 0.1215972900390625, 0.1265850067138672, 0.13157272338867188, 0.13656044006347656, 0.14154815673828125, 0.14653587341308594, 0.15152359008789062, 0.1565113067626953, 0.1614990234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 5.0, 7.0, 14.0, 8.0, 10.0, 20.0, 15.0, 26.0, 28.0, 39.0, 65.0, 60.0, 75.0, 58.0, 77.0, 71.0, 65.0, 58.0, 46.0, 42.0, 35.0, 16.0, 26.0, 26.0, 13.0, 20.0, 6.0, 6.0, 13.0, 8.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01385498046875, -0.01340329647064209, -0.01295161247253418, -0.01249992847442627, -0.01204824447631836, -0.01159656047821045, -0.011144876480102539, -0.010693192481994629, -0.010241508483886719, -0.009789824485778809, -0.009338140487670898, -0.008886456489562988, -0.008434772491455078, -0.007983088493347168, -0.007531404495239258, -0.007079720497131348, -0.0066280364990234375, -0.006176352500915527, -0.005724668502807617, -0.005272984504699707, -0.004821300506591797, -0.004369616508483887, -0.0039179325103759766, -0.0034662485122680664, -0.0030145645141601562, -0.002562880516052246, -0.002111196517944336, -0.0016595125198364258, -0.0012078285217285156, -0.0007561445236206055, -0.0003044605255126953, 0.00014722347259521484, 0.000598907470703125, 0.0010505914688110352, 0.0015022754669189453, 0.0019539594650268555, 0.0024056434631347656, 0.0028573274612426758, 0.003309011459350586, 0.003760695457458496, 0.004212379455566406, 0.004664063453674316, 0.0051157474517822266, 0.005567431449890137, 0.006019115447998047, 0.006470799446105957, 0.006922483444213867, 0.007374167442321777, 0.007825851440429688, 0.008277535438537598, 0.008729219436645508, 0.009180903434753418, 0.009632587432861328, 0.010084271430969238, 0.010535955429077148, 0.010987639427185059, 0.011439323425292969, 0.011891007423400879, 0.012342691421508789, 0.0127943754196167, 0.01324605941772461, 0.01369774341583252, 0.01414942741394043, 0.01460111141204834, 0.01505279541015625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 3.0, 4.0, 5.0, 15.0, 12.0, 14.0, 25.0, 29.0, 34.0, 26.0, 42.0, 45.0, 88.0, 77.0, 113.0, 193.0, 256.0, 441.0, 862.0, 3888.0, 1035625.0, 4416.0, 894.0, 476.0, 261.0, 198.0, 104.0, 85.0, 69.0, 46.0, 33.0, 24.0, 37.0, 18.0, 14.0, 10.0, 10.0, 10.0, 6.0, 11.0, 3.0, 3.0, 7.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.2354736328125, -0.22864913940429688, -0.22182464599609375, -0.21500015258789062, -0.2081756591796875, -0.20135116577148438, -0.19452667236328125, -0.18770217895507812, -0.180877685546875, -0.17405319213867188, -0.16722869873046875, -0.16040420532226562, -0.1535797119140625, -0.14675521850585938, -0.13993072509765625, -0.13310623168945312, -0.12628173828125, -0.11945724487304688, -0.11263275146484375, -0.10580825805664062, -0.0989837646484375, -0.09215927124023438, -0.08533477783203125, -0.07851028442382812, -0.071685791015625, -0.06486129760742188, -0.05803680419921875, -0.051212310791015625, -0.0443878173828125, -0.037563323974609375, -0.03073883056640625, -0.023914337158203125, -0.01708984375, -0.010265350341796875, -0.00344085693359375, 0.003383636474609375, 0.0102081298828125, 0.017032623291015625, 0.02385711669921875, 0.030681610107421875, 0.037506103515625, 0.044330596923828125, 0.05115509033203125, 0.057979583740234375, 0.0648040771484375, 0.07162857055664062, 0.07845306396484375, 0.08527755737304688, 0.09210205078125, 0.09892654418945312, 0.10575103759765625, 0.11257553100585938, 0.1194000244140625, 0.12622451782226562, 0.13304901123046875, 0.13987350463867188, 0.146697998046875, 0.15352249145507812, 0.16034698486328125, 0.16717147827148438, 0.1739959716796875, 0.18082046508789062, 0.18764495849609375, 0.19446945190429688, 0.2012939453125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 992.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24821829795837402, -0.24036775529384613, -0.23251722753047943, -0.22466668486595154, -0.21681615710258484, -0.20896561443805695, -0.20111507177352905, -0.19326454401016235, -0.18541401624679565, -0.17756347358226776, -0.16971294581890106, -0.16186240315437317, -0.15401187539100647, -0.14616133272647858, -0.13831079006195068, -0.13046026229858398, -0.12260971963405609, -0.1147591844201088, -0.1069086492061615, -0.0990581065416336, -0.0912075787782669, -0.08335703611373901, -0.07550650089979172, -0.06765596568584442, -0.059805430471897125, -0.05195489525794983, -0.04410436004400253, -0.03625382110476494, -0.028403285890817642, -0.020552750676870346, -0.012702211737632751, -0.004851676523685455, 0.002998858690261841, 0.010849394835531712, 0.018699930980801582, 0.026550468057394028, 0.034401003271341324, 0.04225153848528862, 0.050102077424526215, 0.05795261263847351, 0.0658031478524208, 0.0736536830663681, 0.0815042182803154, 0.0893547534942627, 0.09720529615879059, 0.10505582392215729, 0.11290636658668518, 0.12075690180063248, 0.12860743701457977, 0.13645797967910767, 0.14430850744247437, 0.15215905010700226, 0.16000957787036896, 0.16786012053489685, 0.17571064829826355, 0.18356119096279144, 0.19141173362731934, 0.19926227629184723, 0.20711280405521393, 0.21496334671974182, 0.22281387448310852, 0.2306644171476364, 0.2385149598121643, 0.246365487575531, 0.2542160153388977]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 20.0, 16.0, 21.0, 31.0, 26.0, 44.0, 40.0, 55.0, 52.0, 76.0, 75.0, 60.0, 65.0, 66.0, 56.0, 45.0, 55.0, 37.0, 38.0, 24.0, 21.0, 23.0, 15.0, 8.0, 7.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041773974895477295, -0.04045841097831726, -0.03914284333586693, -0.037827275693416595, -0.03651171177625656, -0.03519614785909653, -0.033880580216646194, -0.03256501257419586, -0.031249448657035828, -0.029933882877230644, -0.02861831709742546, -0.027302751317620277, -0.025987185537815094, -0.02467161975800991, -0.023356053978204727, -0.022040488198399544, -0.02072492241859436, -0.019409356638789177, -0.018093790858983994, -0.01677822507917881, -0.015462659299373627, -0.014147093519568443, -0.01283152773976326, -0.011515961959958076, -0.010200396180152893, -0.00888483040034771, -0.007569264620542526, -0.006253698840737343, -0.004938133060932159, -0.003622567281126976, -0.0023070015013217926, -0.0009914357215166092, 0.0003241300582885742, 0.0016396958380937576, 0.002955261617898941, 0.0042708273977041245, 0.005586393177509308, 0.006901958957314491, 0.008217524737119675, 0.009533090516924858, 0.010848656296730042, 0.012164222076535225, 0.013479787856340408, 0.014795353636145592, 0.016110919415950775, 0.01742648519575596, 0.018742050975561142, 0.020057616755366325, 0.02137318253517151, 0.022688748314976692, 0.024004314094781876, 0.02531987987458706, 0.026635445654392242, 0.027951011434197426, 0.02926657721400261, 0.030582142993807793, 0.031897708773612976, 0.03321327269077301, 0.03452884033322334, 0.035844407975673676, 0.03715997189283371, 0.038475535809993744, 0.03979110345244408, 0.04110667109489441, 0.04242223501205444]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 9.0, 5.0, 17.0, 17.0, 8.0, 21.0, 15.0, 22.0, 12.0, 26.0, 19.0, 30.0, 45.0, 46.0, 43.0, 31.0, 38.0, 36.0, 53.0, 44.0, 36.0, 36.0, 48.0, 34.0, 32.0, 24.0, 32.0, 24.0, 26.0, 18.0, 28.0, 13.0, 20.0, 18.0, 15.0, 4.0, 9.0, 8.0, 3.0, 11.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.765625, -3.65081787109375, -3.5360107421875, -3.42120361328125, -3.306396484375, -3.19158935546875, -3.0767822265625, -2.96197509765625, -2.84716796875, -2.73236083984375, -2.6175537109375, -2.50274658203125, -2.387939453125, -2.27313232421875, -2.1583251953125, -2.04351806640625, -1.9287109375, -1.81390380859375, -1.6990966796875, -1.58428955078125, -1.469482421875, -1.35467529296875, -1.2398681640625, -1.12506103515625, -1.01025390625, -0.89544677734375, -0.7806396484375, -0.66583251953125, -0.551025390625, -0.43621826171875, -0.3214111328125, -0.20660400390625, -0.091796875, 0.02301025390625, 0.1378173828125, 0.25262451171875, 0.367431640625, 0.48223876953125, 0.5970458984375, 0.71185302734375, 0.82666015625, 0.94146728515625, 1.0562744140625, 1.17108154296875, 1.285888671875, 1.40069580078125, 1.5155029296875, 1.63031005859375, 1.7451171875, 1.85992431640625, 1.9747314453125, 2.08953857421875, 2.204345703125, 2.31915283203125, 2.4339599609375, 2.54876708984375, 2.66357421875, 2.77838134765625, 2.8931884765625, 3.00799560546875, 3.122802734375, 3.23760986328125, 3.3524169921875, 3.46722412109375, 3.58203125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 15.0, 17.0, 24.0, 25.0, 47.0, 50.0, 57.0, 103.0, 113.0, 152.0, 219.0, 295.0, 461.0, 706.0, 1237.0, 2166.0, 4618.0, 12129.0, 39323.0, 165330.0, 481844.0, 251713.0, 58735.0, 16497.0, 6112.0, 2609.0, 1341.0, 772.0, 509.0, 367.0, 270.0, 171.0, 160.0, 92.0, 66.0, 57.0, 41.0, 33.0, 18.0, 15.0, 15.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.234375, -5.0689697265625, -4.903564453125, -4.7381591796875, -4.57275390625, -4.4073486328125, -4.241943359375, -4.0765380859375, -3.9111328125, -3.7457275390625, -3.580322265625, -3.4149169921875, -3.24951171875, -3.0841064453125, -2.918701171875, -2.7532958984375, -2.587890625, -2.4224853515625, -2.257080078125, -2.0916748046875, -1.92626953125, -1.7608642578125, -1.595458984375, -1.4300537109375, -1.2646484375, -1.0992431640625, -0.933837890625, -0.7684326171875, -0.60302734375, -0.4376220703125, -0.272216796875, -0.1068115234375, 0.05859375, 0.2239990234375, 0.389404296875, 0.5548095703125, 0.72021484375, 0.8856201171875, 1.051025390625, 1.2164306640625, 1.3818359375, 1.5472412109375, 1.712646484375, 1.8780517578125, 2.04345703125, 2.2088623046875, 2.374267578125, 2.5396728515625, 2.705078125, 2.8704833984375, 3.035888671875, 3.2012939453125, 3.36669921875, 3.5321044921875, 3.697509765625, 3.8629150390625, 4.0283203125, 4.1937255859375, 4.359130859375, 4.5245361328125, 4.68994140625, 4.8553466796875, 5.020751953125, 5.1861572265625, 5.3515625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 10.0, 14.0, 11.0, 16.0, 20.0, 25.0, 30.0, 36.0, 38.0, 31.0, 53.0, 80.0, 128.0, 264.0, 1492.0, 282.0, 120.0, 68.0, 53.0, 47.0, 42.0, 32.0, 32.0, 23.0, 19.0, 19.0, 18.0, 11.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.66845703125, -12.3212890625, -11.97412109375, -11.626953125, -11.27978515625, -10.9326171875, -10.58544921875, -10.23828125, -9.89111328125, -9.5439453125, -9.19677734375, -8.849609375, -8.50244140625, -8.1552734375, -7.80810546875, -7.4609375, -7.11376953125, -6.7666015625, -6.41943359375, -6.072265625, -5.72509765625, -5.3779296875, -5.03076171875, -4.68359375, -4.33642578125, -3.9892578125, -3.64208984375, -3.294921875, -2.94775390625, -2.6005859375, -2.25341796875, -1.90625, -1.55908203125, -1.2119140625, -0.86474609375, -0.517578125, -0.17041015625, 0.1767578125, 0.52392578125, 0.87109375, 1.21826171875, 1.5654296875, 1.91259765625, 2.259765625, 2.60693359375, 2.9541015625, 3.30126953125, 3.6484375, 3.99560546875, 4.3427734375, 4.68994140625, 5.037109375, 5.38427734375, 5.7314453125, 6.07861328125, 6.42578125, 6.77294921875, 7.1201171875, 7.46728515625, 7.814453125, 8.16162109375, 8.5087890625, 8.85595703125, 9.203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 13.0, 19.0, 15.0, 29.0, 42.0, 44.0, 73.0, 83.0, 120.0, 203.0, 338.0, 662.0, 1923.0, 216058.0, 2919410.0, 4586.0, 889.0, 426.0, 256.0, 119.0, 94.0, 74.0, 48.0, 43.0, 30.0, 19.0, 24.0, 14.0, 14.0, 5.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.890625, -16.24560546875, -15.6005859375, -14.95556640625, -14.310546875, -13.66552734375, -13.0205078125, -12.37548828125, -11.73046875, -11.08544921875, -10.4404296875, -9.79541015625, -9.150390625, -8.50537109375, -7.8603515625, -7.21533203125, -6.5703125, -5.92529296875, -5.2802734375, -4.63525390625, -3.990234375, -3.34521484375, -2.7001953125, -2.05517578125, -1.41015625, -0.76513671875, -0.1201171875, 0.52490234375, 1.169921875, 1.81494140625, 2.4599609375, 3.10498046875, 3.75, 4.39501953125, 5.0400390625, 5.68505859375, 6.330078125, 6.97509765625, 7.6201171875, 8.26513671875, 8.91015625, 9.55517578125, 10.2001953125, 10.84521484375, 11.490234375, 12.13525390625, 12.7802734375, 13.42529296875, 14.0703125, 14.71533203125, 15.3603515625, 16.00537109375, 16.650390625, 17.29541015625, 17.9404296875, 18.58544921875, 19.23046875, 19.87548828125, 20.5205078125, 21.16552734375, 21.810546875, 22.45556640625, 23.1005859375, 23.74560546875, 24.390625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 160.0, 764.0, 87.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.9982681274414, -86.53752136230469, -82.07676696777344, -77.61602020263672, -73.1552734375, -68.69451904296875, -64.23377227783203, -59.77302551269531, -55.31227493286133, -50.851524353027344, -46.390777587890625, -41.93002700805664, -37.469276428222656, -33.00852966308594, -28.547779083251953, -24.0870304107666, -19.62628173828125, -15.165533065795898, -10.70478343963623, -6.2440338134765625, -1.783285140991211, 2.6774635314941406, 7.138214111328125, 11.598962783813477, 16.059711456298828, 20.52046012878418, 24.98120880126953, 29.441959381103516, 33.9027099609375, 38.36345672607422, 42.8242073059082, 47.28495788574219, 51.74571228027344, 56.20646286010742, 60.66720962524414, 65.12796020507812, 69.58870697021484, 74.04945373535156, 78.51020812988281, 82.97095489501953, 87.43170166015625, 91.89244842529297, 96.35320281982422, 100.81394958496094, 105.27469635009766, 109.73544311523438, 114.19619750976562, 118.65694427490234, 123.1176986694336, 127.57844543457031, 132.03919982910156, 136.49993896484375, 140.960693359375, 145.42144775390625, 149.8822021484375, 154.3429412841797, 158.80369567871094, 163.2644500732422, 167.72518920898438, 172.18594360351562, 176.64669799804688, 181.10743713378906, 185.5681915283203, 190.02894592285156, 194.48968505859375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 7.0, 9.0, 11.0, 23.0, 12.0, 12.0, 21.0, 19.0, 34.0, 30.0, 32.0, 31.0, 33.0, 41.0, 48.0, 37.0, 42.0, 41.0, 35.0, 52.0, 43.0, 46.0, 45.0, 36.0, 34.0, 29.0, 26.0, 23.0, 24.0, 29.0, 18.0, 12.0, 10.0, 6.0, 11.0, 7.0, 9.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27055549621582, -18.587909698486328, -17.905261993408203, -17.22261619567871, -16.53997039794922, -15.857322692871094, -15.174676895141602, -14.492030143737793, -13.809383392333984, -13.126736640930176, -12.444089889526367, -11.761444091796875, -11.078797340393066, -10.396150588989258, -9.713504791259766, -9.030858039855957, -8.348211288452148, -7.66556453704834, -6.9829182624816895, -6.300271987915039, -5.6176252365112305, -4.934978485107422, -4.2523322105407715, -3.569685935974121, -2.8870391845703125, -2.204392671585083, -1.5217461585998535, -0.839099645614624, -0.15645313262939453, 0.526193380355835, 1.2088398933410645, 1.8914861679077148, 2.5741348266601562, 3.2567813396453857, 3.9394278526306152, 4.622074127197266, 5.304720878601074, 5.987367630004883, 6.670013904571533, 7.352660179138184, 8.035306930541992, 8.7179536819458, 9.40060043334961, 10.083246231079102, 10.76589298248291, 11.448539733886719, 12.131185531616211, 12.81383228302002, 13.496479034423828, 14.179125785827637, 14.861772537231445, 15.544418334960938, 16.227066040039062, 16.909711837768555, 17.592357635498047, 18.275005340576172, 18.957651138305664, 19.640296936035156, 20.32294464111328, 21.005590438842773, 21.688236236572266, 22.37088394165039, 23.053529739379883, 23.736175537109375, 24.4188232421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 5.0, 17.0, 16.0, 17.0, 17.0, 19.0, 18.0, 22.0, 34.0, 20.0, 32.0, 36.0, 37.0, 40.0, 45.0, 37.0, 35.0, 40.0, 46.0, 43.0, 46.0, 37.0, 39.0, 36.0, 30.0, 27.0, 27.0, 22.0, 18.0, 15.0, 16.0, 17.0, 13.0, 10.0, 12.0, 12.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.88671875, -3.75628662109375, -3.6258544921875, -3.49542236328125, -3.364990234375, -3.23455810546875, -3.1041259765625, -2.97369384765625, -2.84326171875, -2.71282958984375, -2.5823974609375, -2.45196533203125, -2.321533203125, -2.19110107421875, -2.0606689453125, -1.93023681640625, -1.7998046875, -1.66937255859375, -1.5389404296875, -1.40850830078125, -1.278076171875, -1.14764404296875, -1.0172119140625, -0.88677978515625, -0.75634765625, -0.62591552734375, -0.4954833984375, -0.36505126953125, -0.234619140625, -0.10418701171875, 0.0262451171875, 0.15667724609375, 0.287109375, 0.41754150390625, 0.5479736328125, 0.67840576171875, 0.808837890625, 0.93927001953125, 1.0697021484375, 1.20013427734375, 1.33056640625, 1.46099853515625, 1.5914306640625, 1.72186279296875, 1.852294921875, 1.98272705078125, 2.1131591796875, 2.24359130859375, 2.3740234375, 2.50445556640625, 2.6348876953125, 2.76531982421875, 2.895751953125, 3.02618408203125, 3.1566162109375, 3.28704833984375, 3.41748046875, 3.54791259765625, 3.6783447265625, 3.80877685546875, 3.939208984375, 4.06964111328125, 4.2000732421875, 4.33050537109375, 4.4609375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 5.0, 9.0, 12.0, 20.0, 25.0, 40.0, 57.0, 81.0, 103.0, 158.0, 234.0, 328.0, 593.0, 942.0, 1839.0, 4339.0, 17013.0, 185128.0, 2604946.0, 1294229.0, 67439.0, 9890.0, 3206.0, 1443.0, 736.0, 450.0, 279.0, 198.0, 136.0, 102.0, 68.0, 53.0, 37.0, 31.0, 20.0, 21.0, 15.0, 11.0, 16.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.897705078125, -14.34228515625, -13.786865234375, -13.2314453125, -12.676025390625, -12.12060546875, -11.565185546875, -11.009765625, -10.454345703125, -9.89892578125, -9.343505859375, -8.7880859375, -8.232666015625, -7.67724609375, -7.121826171875, -6.56640625, -6.010986328125, -5.45556640625, -4.900146484375, -4.3447265625, -3.789306640625, -3.23388671875, -2.678466796875, -2.123046875, -1.567626953125, -1.01220703125, -0.456787109375, 0.0986328125, 0.654052734375, 1.20947265625, 1.764892578125, 2.3203125, 2.875732421875, 3.43115234375, 3.986572265625, 4.5419921875, 5.097412109375, 5.65283203125, 6.208251953125, 6.763671875, 7.319091796875, 7.87451171875, 8.429931640625, 8.9853515625, 9.540771484375, 10.09619140625, 10.651611328125, 11.20703125, 11.762451171875, 12.31787109375, 12.873291015625, 13.4287109375, 13.984130859375, 14.53955078125, 15.094970703125, 15.650390625, 16.205810546875, 16.76123046875, 17.316650390625, 17.8720703125, 18.427490234375, 18.98291015625, 19.538330078125, 20.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 11.0, 10.0, 8.0, 11.0, 23.0, 28.0, 33.0, 47.0, 55.0, 66.0, 109.0, 98.0, 141.0, 188.0, 168.0, 215.0, 280.0, 290.0, 339.0, 299.0, 276.0, 221.0, 236.0, 185.0, 163.0, 109.0, 91.0, 77.0, 58.0, 45.0, 36.0, 31.0, 18.0, 24.0, 19.0, 14.0, 13.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.614013671875, -5.41162109375, -5.209228515625, -5.0068359375, -4.804443359375, -4.60205078125, -4.399658203125, -4.197265625, -3.994873046875, -3.79248046875, -3.590087890625, -3.3876953125, -3.185302734375, -2.98291015625, -2.780517578125, -2.578125, -2.375732421875, -2.17333984375, -1.970947265625, -1.7685546875, -1.566162109375, -1.36376953125, -1.161376953125, -0.958984375, -0.756591796875, -0.55419921875, -0.351806640625, -0.1494140625, 0.052978515625, 0.25537109375, 0.457763671875, 0.66015625, 0.862548828125, 1.06494140625, 1.267333984375, 1.4697265625, 1.672119140625, 1.87451171875, 2.076904296875, 2.279296875, 2.481689453125, 2.68408203125, 2.886474609375, 3.0888671875, 3.291259765625, 3.49365234375, 3.696044921875, 3.8984375, 4.100830078125, 4.30322265625, 4.505615234375, 4.7080078125, 4.910400390625, 5.11279296875, 5.315185546875, 5.517578125, 5.719970703125, 5.92236328125, 6.124755859375, 6.3271484375, 6.529541015625, 6.73193359375, 6.934326171875, 7.13671875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 19.0, 34.0, 36.0, 67.0, 106.0, 233.0, 394.0, 741.0, 1550.0, 3292.0, 7116.0, 18878.0, 59214.0, 235883.0, 1011236.0, 1948863.0, 682045.0, 157534.0, 41884.0, 14075.0, 5730.0, 2622.0, 1182.0, 689.0, 368.0, 196.0, 115.0, 66.0, 40.0, 20.0, 14.0, 10.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.7197265625, -8.486328125, -8.2529296875, -8.01953125, -7.7861328125, -7.552734375, -7.3193359375, -7.0859375, -6.8525390625, -6.619140625, -6.3857421875, -6.15234375, -5.9189453125, -5.685546875, -5.4521484375, -5.21875, -4.9853515625, -4.751953125, -4.5185546875, -4.28515625, -4.0517578125, -3.818359375, -3.5849609375, -3.3515625, -3.1181640625, -2.884765625, -2.6513671875, -2.41796875, -2.1845703125, -1.951171875, -1.7177734375, -1.484375, -1.2509765625, -1.017578125, -0.7841796875, -0.55078125, -0.3173828125, -0.083984375, 0.1494140625, 0.3828125, 0.6162109375, 0.849609375, 1.0830078125, 1.31640625, 1.5498046875, 1.783203125, 2.0166015625, 2.25, 2.4833984375, 2.716796875, 2.9501953125, 3.18359375, 3.4169921875, 3.650390625, 3.8837890625, 4.1171875, 4.3505859375, 4.583984375, 4.8173828125, 5.05078125, 5.2841796875, 5.517578125, 5.7509765625, 5.984375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 6.0, 0.0, 7.0, 4.0, 4.0, 5.0, 8.0, 11.0, 17.0, 17.0, 16.0, 28.0, 28.0, 31.0, 47.0, 43.0, 58.0, 61.0, 68.0, 59.0, 59.0, 62.0, 44.0, 56.0, 55.0, 39.0, 28.0, 28.0, 21.0, 20.0, 18.0, 6.0, 12.0, 11.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-49.271446228027344, -47.86446762084961, -46.457489013671875, -45.050514221191406, -43.64353561401367, -42.23655700683594, -40.8295783996582, -39.42259979248047, -38.015625, -36.608646392822266, -35.20166778564453, -33.79469299316406, -32.38771438598633, -30.980735778808594, -29.57375717163086, -28.166778564453125, -26.75979995727539, -25.352821350097656, -23.945844650268555, -22.53886604309082, -21.13188934326172, -19.724910736083984, -18.31793212890625, -16.910953521728516, -15.503976821899414, -14.096999168395996, -12.690021514892578, -11.283042907714844, -9.876065254211426, -8.469087600708008, -7.062108993530273, -5.6551313400268555, -4.2481536865234375, -2.8411757946014404, -1.4341979026794434, -0.027219772338867188, 1.3797578811645508, 2.7867355346679688, 4.193714141845703, 5.600691795349121, 7.007669448852539, 8.414647102355957, 9.821624755859375, 11.22860336303711, 12.635581016540527, 14.042558670043945, 15.44953727722168, 16.85651397705078, 18.263492584228516, 19.67047119140625, 21.07744789123535, 22.484426498413086, 23.891403198242188, 25.298381805419922, 26.705360412597656, 28.11233901977539, 29.519315719604492, 30.926294326782227, 32.33327102661133, 33.74024963378906, 35.1472282409668, 36.55420684814453, 37.961181640625, 39.368160247802734, 40.77513885498047]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 11.0, 5.0, 15.0, 16.0, 20.0, 15.0, 24.0, 26.0, 33.0, 35.0, 41.0, 45.0, 49.0, 43.0, 42.0, 46.0, 53.0, 44.0, 53.0, 43.0, 43.0, 44.0, 39.0, 36.0, 28.0, 23.0, 25.0, 19.0, 15.0, 13.0, 11.0, 6.0, 9.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.50050354003906, -42.15902328491211, -40.81754684448242, -39.47606658935547, -38.13459014892578, -36.79310989379883, -35.451629638671875, -34.11015319824219, -32.768672943115234, -31.427194595336914, -30.085716247558594, -28.74423599243164, -27.40275764465332, -26.061279296875, -24.719799041748047, -23.378320693969727, -22.036842346191406, -20.695363998413086, -19.353885650634766, -18.012405395507812, -16.670927047729492, -15.329448699951172, -13.987969398498535, -12.646490097045898, -11.305011749267578, -9.963533401489258, -8.622054100036621, -7.280575275421143, -5.939096450805664, -4.5976176261901855, -3.256138801574707, -1.9146595001220703, -0.5731773376464844, 0.7683014869689941, 2.1097803115844727, 3.451259136199951, 4.79273796081543, 6.134216785430908, 7.475695610046387, 8.817174911499023, 10.158653259277344, 11.500131607055664, 12.8416109085083, 14.183090209960938, 15.524568557739258, 16.866046905517578, 18.20752716064453, 19.54900550842285, 20.890483856201172, 22.231962203979492, 23.573440551757812, 24.914920806884766, 26.256399154663086, 27.597877502441406, 28.93935775756836, 30.28083610534668, 31.622314453125, 32.96379470825195, 34.30527114868164, 35.646751403808594, 36.98822784423828, 38.329708099365234, 39.67118835449219, 41.012664794921875, 42.35414505004883]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 3.0, 8.0, 11.0, 9.0, 13.0, 7.0, 25.0, 18.0, 21.0, 28.0, 28.0, 32.0, 40.0, 53.0, 38.0, 48.0, 58.0, 48.0, 54.0, 50.0, 49.0, 42.0, 51.0, 34.0, 30.0, 39.0, 33.0, 28.0, 21.0, 16.0, 11.0, 9.0, 6.0, 7.0, 7.0, 2.0, 6.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.4375, -68.0986328125, -65.759765625, -63.4208984375, -61.08203125, -58.7431640625, -56.404296875, -54.0654296875, -51.7265625, -49.3876953125, -47.048828125, -44.7099609375, -42.37109375, -40.0322265625, -37.693359375, -35.3544921875, -33.015625, -30.6767578125, -28.337890625, -25.9990234375, -23.66015625, -21.3212890625, -18.982421875, -16.6435546875, -14.3046875, -11.9658203125, -9.626953125, -7.2880859375, -4.94921875, -2.6103515625, -0.271484375, 2.0673828125, 4.40625, 6.7451171875, 9.083984375, 11.4228515625, 13.76171875, 16.1005859375, 18.439453125, 20.7783203125, 23.1171875, 25.4560546875, 27.794921875, 30.1337890625, 32.47265625, 34.8115234375, 37.150390625, 39.4892578125, 41.828125, 44.1669921875, 46.505859375, 48.8447265625, 51.18359375, 53.5224609375, 55.861328125, 58.2001953125, 60.5390625, 62.8779296875, 65.216796875, 67.5556640625, 69.89453125, 72.2333984375, 74.572265625, 76.9111328125, 79.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 20.0, 20.0, 26.0, 52.0, 70.0, 118.0, 200.0, 317.0, 484.0, 704.0, 1181.0, 1906.0, 3018.0, 5031.0, 7892.0, 13045.0, 20944.0, 33695.0, 52442.0, 79969.0, 113057.0, 144930.0, 154492.0, 132245.0, 98607.0, 67313.0, 43881.0, 27771.0, 17299.0, 10556.0, 6605.0, 3981.0, 2481.0, 1520.0, 969.0, 613.0, 394.0, 246.0, 161.0, 104.0, 54.0, 45.0, 32.0, 18.0, 21.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.8359375, -2.74530029296875, -2.6546630859375, -2.56402587890625, -2.473388671875, -2.38275146484375, -2.2921142578125, -2.20147705078125, -2.11083984375, -2.02020263671875, -1.9295654296875, -1.83892822265625, -1.748291015625, -1.65765380859375, -1.5670166015625, -1.47637939453125, -1.3857421875, -1.29510498046875, -1.2044677734375, -1.11383056640625, -1.023193359375, -0.93255615234375, -0.8419189453125, -0.75128173828125, -0.66064453125, -0.57000732421875, -0.4793701171875, -0.38873291015625, -0.298095703125, -0.20745849609375, -0.1168212890625, -0.02618408203125, 0.064453125, 0.15509033203125, 0.2457275390625, 0.33636474609375, 0.427001953125, 0.51763916015625, 0.6082763671875, 0.69891357421875, 0.78955078125, 0.88018798828125, 0.9708251953125, 1.06146240234375, 1.152099609375, 1.24273681640625, 1.3333740234375, 1.42401123046875, 1.5146484375, 1.60528564453125, 1.6959228515625, 1.78656005859375, 1.877197265625, 1.96783447265625, 2.0584716796875, 2.14910888671875, 2.23974609375, 2.33038330078125, 2.4210205078125, 2.51165771484375, 2.602294921875, 2.69293212890625, 2.7835693359375, 2.87420654296875, 2.96484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 8.0, 8.0, 9.0, 9.0, 9.0, 15.0, 23.0, 19.0, 14.0, 28.0, 31.0, 32.0, 29.0, 23.0, 31.0, 44.0, 40.0, 47.0, 28.0, 35.0, 1066.0, 41.0, 31.0, 53.0, 39.0, 24.0, 28.0, 42.0, 29.0, 31.0, 20.0, 18.0, 24.0, 11.0, 14.0, 16.0, 15.0, 9.0, 7.0, 10.0, 5.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.5625, -36.3671875, -35.171875, -33.9765625, -32.78125, -31.5859375, -30.390625, -29.1953125, -28.0, -26.8046875, -25.609375, -24.4140625, -23.21875, -22.0234375, -20.828125, -19.6328125, -18.4375, -17.2421875, -16.046875, -14.8515625, -13.65625, -12.4609375, -11.265625, -10.0703125, -8.875, -7.6796875, -6.484375, -5.2890625, -4.09375, -2.8984375, -1.703125, -0.5078125, 0.6875, 1.8828125, 3.078125, 4.2734375, 5.46875, 6.6640625, 7.859375, 9.0546875, 10.25, 11.4453125, 12.640625, 13.8359375, 15.03125, 16.2265625, 17.421875, 18.6171875, 19.8125, 21.0078125, 22.203125, 23.3984375, 24.59375, 25.7890625, 26.984375, 28.1796875, 29.375, 30.5703125, 31.765625, 32.9609375, 34.15625, 35.3515625, 36.546875, 37.7421875, 38.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 21.0, 41.0, 74.0, 95.0, 139.0, 228.0, 322.0, 469.0, 678.0, 1019.0, 1569.0, 2365.0, 3462.0, 4981.0, 7374.0, 11130.0, 15885.0, 23505.0, 33338.0, 46943.0, 64515.0, 84316.0, 103961.0, 634052.0, 648694.0, 104155.0, 84613.0, 64337.0, 47138.0, 33530.0, 23411.0, 16395.0, 10924.0, 7591.0, 5215.0, 3558.0, 2379.0, 1547.0, 1026.0, 712.0, 479.0, 319.0, 217.0, 132.0, 86.0, 70.0, 41.0, 27.0, 10.0, 8.0, 6.0, 3.0, 1.0, 2.0], "bins": [-2.048828125, -1.9885711669921875, -1.928314208984375, -1.8680572509765625, -1.80780029296875, -1.7475433349609375, -1.687286376953125, -1.6270294189453125, -1.5667724609375, -1.5065155029296875, -1.446258544921875, -1.3860015869140625, -1.32574462890625, -1.2654876708984375, -1.205230712890625, -1.1449737548828125, -1.084716796875, -1.0244598388671875, -0.964202880859375, -0.9039459228515625, -0.84368896484375, -0.7834320068359375, -0.723175048828125, -0.6629180908203125, -0.6026611328125, -0.5424041748046875, -0.482147216796875, -0.4218902587890625, -0.36163330078125, -0.3013763427734375, -0.241119384765625, -0.1808624267578125, -0.12060546875, -0.0603485107421875, -9.1552734375e-05, 0.0601654052734375, 0.12042236328125, 0.1806793212890625, 0.240936279296875, 0.3011932373046875, 0.3614501953125, 0.4217071533203125, 0.481964111328125, 0.5422210693359375, 0.60247802734375, 0.6627349853515625, 0.722991943359375, 0.7832489013671875, 0.843505859375, 0.9037628173828125, 0.964019775390625, 1.0242767333984375, 1.08453369140625, 1.1447906494140625, 1.205047607421875, 1.2653045654296875, 1.3255615234375, 1.3858184814453125, 1.446075439453125, 1.5063323974609375, 1.56658935546875, 1.6268463134765625, 1.687103271484375, 1.7473602294921875, 1.8076171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 5.0, 4.0, 8.0, 12.0, 19.0, 13.0, 8.0, 22.0, 11.0, 29.0, 28.0, 32.0, 40.0, 34.0, 47.0, 58.0, 70.0, 83.0, 76.0, 56.0, 50.0, 34.0, 34.0, 35.0, 27.0, 22.0, 16.0, 14.0, 15.0, 16.0, 16.0, 15.0, 9.0, 12.0, 6.0, 10.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03528594970703125, -0.0340118408203125, -0.03273773193359375, -0.031463623046875, -0.03018951416015625, -0.0289154052734375, -0.02764129638671875, -0.0263671875, -0.02509307861328125, -0.0238189697265625, -0.02254486083984375, -0.021270751953125, -0.01999664306640625, -0.0187225341796875, -0.01744842529296875, -0.01617431640625, -0.01490020751953125, -0.0136260986328125, -0.01235198974609375, -0.011077880859375, -0.00980377197265625, -0.0085296630859375, -0.00725555419921875, -0.0059814453125, -0.00470733642578125, -0.0034332275390625, -0.00215911865234375, -0.000885009765625, 0.00038909912109375, 0.0016632080078125, 0.00293731689453125, 0.00421142578125, 0.00548553466796875, 0.0067596435546875, 0.00803375244140625, 0.009307861328125, 0.01058197021484375, 0.0118560791015625, 0.01313018798828125, 0.014404296875, 0.01567840576171875, 0.0169525146484375, 0.01822662353515625, 0.019500732421875, 0.02077484130859375, 0.0220489501953125, 0.02332305908203125, 0.02459716796875, 0.02587127685546875, 0.0271453857421875, 0.02841949462890625, 0.029693603515625, 0.03096771240234375, 0.0322418212890625, 0.03351593017578125, 0.0347900390625, 0.03606414794921875, 0.0373382568359375, 0.03861236572265625, 0.039886474609375, 0.04116058349609375, 0.0424346923828125, 0.04370880126953125, 0.04498291015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 5.0, 16.0, 23.0, 22.0, 30.0, 43.0, 52.0, 79.0, 105.0, 177.0, 243.0, 387.0, 637.0, 1098.0, 1874.0, 3443.0, 6317.0, 12333.0, 24959.0, 51050.0, 105570.0, 194979.0, 258719.0, 188527.0, 100003.0, 48379.0, 23822.0, 11508.0, 6212.0, 3227.0, 1802.0, 1093.0, 622.0, 391.0, 254.0, 168.0, 114.0, 64.0, 53.0, 44.0, 32.0, 23.0, 19.0, 12.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1494140625, -0.14481163024902344, -0.14020919799804688, -0.1356067657470703, -0.13100433349609375, -0.1264019012451172, -0.12179946899414062, -0.11719703674316406, -0.1125946044921875, -0.10799217224121094, -0.10338973999023438, -0.09878730773925781, -0.09418487548828125, -0.08958244323730469, -0.08498001098632812, -0.08037757873535156, -0.075775146484375, -0.07117271423339844, -0.06657028198242188, -0.06196784973144531, -0.05736541748046875, -0.05276298522949219, -0.048160552978515625, -0.04355812072753906, -0.0389556884765625, -0.03435325622558594, -0.029750823974609375, -0.025148391723632812, -0.02054595947265625, -0.015943527221679688, -0.011341094970703125, -0.0067386627197265625, -0.00213623046875, 0.0024662017822265625, 0.007068634033203125, 0.011671066284179688, 0.01627349853515625, 0.020875930786132812, 0.025478363037109375, 0.030080795288085938, 0.0346832275390625, 0.03928565979003906, 0.043888092041015625, 0.04849052429199219, 0.05309295654296875, 0.05769538879394531, 0.062297821044921875, 0.06690025329589844, 0.071502685546875, 0.07610511779785156, 0.08070755004882812, 0.08530998229980469, 0.08991241455078125, 0.09451484680175781, 0.09911727905273438, 0.10371971130371094, 0.1083221435546875, 0.11292457580566406, 0.11752700805664062, 0.12212944030761719, 0.12673187255859375, 0.1313343048095703, 0.13593673706054688, 0.14053916931152344, 0.1451416015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 19.0, 14.0, 27.0, 42.0, 74.0, 96.0, 122.0, 132.0, 124.0, 94.0, 82.0, 38.0, 37.0, 29.0, 22.0, 9.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06124163046479225, -0.057829827070236206, -0.05441802740097046, -0.05100622773170471, -0.047594424337148666, -0.04418262094259262, -0.040770821273326874, -0.03735902160406113, -0.03394721820950508, -0.030535416677594185, -0.02712361514568329, -0.023711813613772392, -0.020300012081861496, -0.0168882105499506, -0.013476409018039703, -0.010064607486128807, -0.006652805954217911, -0.0032410044223070145, 0.00017079710960388184, 0.003582598641514778, 0.0069944001734256744, 0.01040620170533657, 0.013818003237247467, 0.017229804769158363, 0.02064160630106926, 0.024053407832980156, 0.027465209364891052, 0.03087701089680195, 0.034288812428712845, 0.03770061582326889, 0.04111241549253464, 0.044524215161800385, 0.04793602228164673, 0.051347821950912476, 0.05475962534546852, 0.05817142874002457, 0.061583228409290314, 0.06499502807855606, 0.0684068351984024, 0.07181863486766815, 0.0752304345369339, 0.07864223420619965, 0.0820540338754654, 0.08546584099531174, 0.08887764066457748, 0.09228944033384323, 0.09570124745368958, 0.09911304712295532, 0.10252484679222107, 0.10593664646148682, 0.10934844613075256, 0.11276025325059891, 0.11617205291986465, 0.1195838525891304, 0.12299565970897675, 0.1264074593782425, 0.12981925904750824, 0.133231058716774, 0.13664285838603973, 0.14005465805530548, 0.14346647262573242, 0.14687827229499817, 0.15029007196426392, 0.15370187163352966, 0.1571136713027954]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 1.0, 11.0, 5.0, 8.0, 8.0, 8.0, 15.0, 13.0, 28.0, 27.0, 22.0, 24.0, 16.0, 19.0, 26.0, 43.0, 38.0, 38.0, 44.0, 41.0, 42.0, 39.0, 51.0, 52.0, 39.0, 36.0, 27.0, 33.0, 34.0, 24.0, 16.0, 25.0, 25.0, 18.0, 14.0, 17.0, 14.0, 14.0, 9.0, 5.0, 14.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03454029560089111, -0.03342816233634949, -0.03231602907180786, -0.031203892081975937, -0.03009175881743431, -0.028979625552892685, -0.02786749042570591, -0.026755355298519135, -0.02564322203397751, -0.024531088769435883, -0.023418953642249107, -0.022306818515062332, -0.021194685250520706, -0.02008255198597908, -0.018970416858792305, -0.01785828173160553, -0.016746148467063904, -0.015634015202522278, -0.014521880075335503, -0.013409745879471302, -0.012297611683607101, -0.0111854774877429, -0.0100733432918787, -0.0089612090960145, -0.007849074900150299, -0.0067369407042860985, -0.005624806508421898, -0.004512672312557697, -0.0034005381166934967, -0.002288403920829296, -0.0011762697249650955, -6.413552910089493e-05, 0.0010479986667633057, 0.0021601328626275063, 0.003272267058491707, 0.0043844012543559074, 0.005496535450220108, 0.006608669646084309, 0.007720803841948509, 0.00883293803781271, 0.00994507223367691, 0.011057206429541111, 0.012169340625405312, 0.013281474821269512, 0.014393609017133713, 0.015505743212997913, 0.016617877408862114, 0.01773001253604889, 0.018842145800590515, 0.01995427906513214, 0.021066414192318916, 0.02217854931950569, 0.023290682584047318, 0.024402815848588943, 0.02551495097577572, 0.026627086102962494, 0.02773921936750412, 0.028851352632045746, 0.02996348775923252, 0.031075622886419296, 0.03218775615096092, 0.03329988941550255, 0.03441202640533447, 0.0355241596698761, 0.036636292934417725]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 12.0, 19.0, 17.0, 16.0, 17.0, 28.0, 25.0, 34.0, 42.0, 43.0, 38.0, 49.0, 52.0, 60.0, 43.0, 61.0, 63.0, 48.0, 43.0, 45.0, 40.0, 27.0, 22.0, 28.0, 28.0, 18.0, 12.0, 12.0, 17.0, 7.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.0, -76.5087890625, -74.017578125, -71.5263671875, -69.03515625, -66.5439453125, -64.052734375, -61.5615234375, -59.0703125, -56.5791015625, -54.087890625, -51.5966796875, -49.10546875, -46.6142578125, -44.123046875, -41.6318359375, -39.140625, -36.6494140625, -34.158203125, -31.6669921875, -29.17578125, -26.6845703125, -24.193359375, -21.7021484375, -19.2109375, -16.7197265625, -14.228515625, -11.7373046875, -9.24609375, -6.7548828125, -4.263671875, -1.7724609375, 0.71875, 3.2099609375, 5.701171875, 8.1923828125, 10.68359375, 13.1748046875, 15.666015625, 18.1572265625, 20.6484375, 23.1396484375, 25.630859375, 28.1220703125, 30.61328125, 33.1044921875, 35.595703125, 38.0869140625, 40.578125, 43.0693359375, 45.560546875, 48.0517578125, 50.54296875, 53.0341796875, 55.525390625, 58.0166015625, 60.5078125, 62.9990234375, 65.490234375, 67.9814453125, 70.47265625, 72.9638671875, 75.455078125, 77.9462890625, 80.4375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 10.0, 14.0, 8.0, 17.0, 18.0, 23.0, 23.0, 34.0, 74.0, 75.0, 148.0, 223.0, 513.0, 1385.0, 5831.0, 40363.0, 361029.0, 549064.0, 76678.0, 9631.0, 1979.0, 617.0, 283.0, 146.0, 99.0, 69.0, 42.0, 40.0, 26.0, 13.0, 18.0, 12.0, 8.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.4425048828125, -13.978759765625, -13.5150146484375, -13.05126953125, -12.5875244140625, -12.123779296875, -11.6600341796875, -11.1962890625, -10.7325439453125, -10.268798828125, -9.8050537109375, -9.34130859375, -8.8775634765625, -8.413818359375, -7.9500732421875, -7.486328125, -7.0225830078125, -6.558837890625, -6.0950927734375, -5.63134765625, -5.1676025390625, -4.703857421875, -4.2401123046875, -3.7763671875, -3.3126220703125, -2.848876953125, -2.3851318359375, -1.92138671875, -1.4576416015625, -0.993896484375, -0.5301513671875, -0.06640625, 0.3973388671875, 0.861083984375, 1.3248291015625, 1.78857421875, 2.2523193359375, 2.716064453125, 3.1798095703125, 3.6435546875, 4.1072998046875, 4.571044921875, 5.0347900390625, 5.49853515625, 5.9622802734375, 6.426025390625, 6.8897705078125, 7.353515625, 7.8172607421875, 8.281005859375, 8.7447509765625, 9.20849609375, 9.6722412109375, 10.135986328125, 10.5997314453125, 11.0634765625, 11.5272216796875, 11.990966796875, 12.4547119140625, 12.91845703125, 13.3822021484375, 13.845947265625, 14.3096923828125, 14.7734375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 4.0, 8.0, 8.0, 16.0, 18.0, 20.0, 24.0, 23.0, 32.0, 35.0, 45.0, 48.0, 48.0, 54.0, 60.0, 2064.0, 96.0, 56.0, 49.0, 44.0, 42.0, 40.0, 32.0, 30.0, 27.0, 18.0, 19.0, 16.0, 14.0, 6.0, 10.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.125, -84.2021484375, -81.279296875, -78.3564453125, -75.43359375, -72.5107421875, -69.587890625, -66.6650390625, -63.7421875, -60.8193359375, -57.896484375, -54.9736328125, -52.05078125, -49.1279296875, -46.205078125, -43.2822265625, -40.359375, -37.4365234375, -34.513671875, -31.5908203125, -28.66796875, -25.7451171875, -22.822265625, -19.8994140625, -16.9765625, -14.0537109375, -11.130859375, -8.2080078125, -5.28515625, -2.3623046875, 0.560546875, 3.4833984375, 6.40625, 9.3291015625, 12.251953125, 15.1748046875, 18.09765625, 21.0205078125, 23.943359375, 26.8662109375, 29.7890625, 32.7119140625, 35.634765625, 38.5576171875, 41.48046875, 44.4033203125, 47.326171875, 50.2490234375, 53.171875, 56.0947265625, 59.017578125, 61.9404296875, 64.86328125, 67.7861328125, 70.708984375, 73.6318359375, 76.5546875, 79.4775390625, 82.400390625, 85.3232421875, 88.24609375, 91.1689453125, 94.091796875, 97.0146484375, 99.9375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 12.0, 10.0, 18.0, 22.0, 38.0, 57.0, 99.0, 136.0, 226.0, 441.0, 787.0, 1595.0, 4068.0, 18494.0, 218859.0, 2775159.0, 108636.0, 11096.0, 3032.0, 1256.0, 663.0, 359.0, 218.0, 142.0, 89.0, 50.0, 24.0, 35.0, 19.0, 16.0, 11.0, 10.0, 2.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.5567626953125, -12.129150390625, -11.7015380859375, -11.27392578125, -10.8463134765625, -10.418701171875, -9.9910888671875, -9.5634765625, -9.1358642578125, -8.708251953125, -8.2806396484375, -7.85302734375, -7.4254150390625, -6.997802734375, -6.5701904296875, -6.142578125, -5.7149658203125, -5.287353515625, -4.8597412109375, -4.43212890625, -4.0045166015625, -3.576904296875, -3.1492919921875, -2.7216796875, -2.2940673828125, -1.866455078125, -1.4388427734375, -1.01123046875, -0.5836181640625, -0.156005859375, 0.2716064453125, 0.69921875, 1.1268310546875, 1.554443359375, 1.9820556640625, 2.40966796875, 2.8372802734375, 3.264892578125, 3.6925048828125, 4.1201171875, 4.5477294921875, 4.975341796875, 5.4029541015625, 5.83056640625, 6.2581787109375, 6.685791015625, 7.1134033203125, 7.541015625, 7.9686279296875, 8.396240234375, 8.8238525390625, 9.25146484375, 9.6790771484375, 10.106689453125, 10.5343017578125, 10.9619140625, 11.3895263671875, 11.817138671875, 12.2447509765625, 12.67236328125, 13.0999755859375, 13.527587890625, 13.9552001953125, 14.3828125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 3.0, 7.0, 12.0, 8.0, 26.0, 43.0, 52.0, 87.0, 127.0, 107.0, 123.0, 119.0, 89.0, 59.0, 45.0, 29.0, 16.0, 11.0, 8.0, 5.0, 5.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.33577728271484, -76.49996185302734, -72.66414642333984, -68.82832336425781, -64.99250793457031, -61.15669250488281, -57.32087707519531, -53.48506164550781, -49.64924240112305, -45.81342697143555, -41.97760772705078, -38.14179229736328, -34.30597686767578, -30.470157623291016, -26.634342193603516, -22.798524856567383, -18.96270751953125, -15.126890182495117, -11.2910737991333, -7.455257415771484, -3.6194400787353516, 0.21637725830078125, 4.052192687988281, 7.888010025024414, 11.723827362060547, 15.55964469909668, 19.395462036132812, 23.231277465820312, 27.067094802856445, 30.902912139892578, 34.73872756958008, 38.574546813964844, 42.41035461425781, 46.24617004394531, 50.08198928833008, 53.91780471801758, 57.753623962402344, 61.589439392089844, 65.42525482177734, 69.26107025146484, 73.09689331054688, 76.93270874023438, 80.76852416992188, 84.60433959960938, 88.4401626586914, 92.2759780883789, 96.1117935180664, 99.9476089477539, 103.7834243774414, 107.6192398071289, 111.4550552368164, 115.29087829589844, 119.12669372558594, 122.96250915527344, 126.79832458496094, 130.63414001464844, 134.46995544433594, 138.30577087402344, 142.14158630371094, 145.97740173339844, 149.81321716308594, 153.6490478515625, 157.48486328125, 161.3206787109375, 165.156494140625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 4.0, 13.0, 14.0, 16.0, 20.0, 23.0, 33.0, 29.0, 21.0, 32.0, 46.0, 28.0, 40.0, 53.0, 53.0, 41.0, 43.0, 42.0, 38.0, 55.0, 47.0, 29.0, 30.0, 30.0, 26.0, 27.0, 21.0, 24.0, 17.0, 20.0, 15.0, 16.0, 13.0, 12.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-134.5689697265625, -130.8948516845703, -127.22073364257812, -123.54662322998047, -119.87250518798828, -116.1983871459961, -112.52427673339844, -108.85015869140625, -105.17604064941406, -101.50192260742188, -97.82780456542969, -94.15369415283203, -90.47957611083984, -86.80545806884766, -83.13134765625, -79.45722961425781, -75.78311157226562, -72.10899353027344, -68.43487548828125, -64.7607650756836, -61.086647033691406, -57.41252899169922, -53.7384147644043, -50.064300537109375, -46.39018249511719, -42.716064453125, -39.04195022583008, -35.367835998535156, -31.69371795654297, -28.019601821899414, -24.34548568725586, -20.671369552612305, -16.99724578857422, -13.323129653930664, -9.64901351928711, -5.974897384643555, -2.30078125, 1.3733348846435547, 5.047451019287109, 8.721567153930664, 12.395683288574219, 16.069799423217773, 19.743915557861328, 23.418031692504883, 27.092147827148438, 30.766263961791992, 34.44038009643555, 38.11449432373047, 41.788612365722656, 45.462730407714844, 49.136844635009766, 52.81095886230469, 56.485076904296875, 60.15919494628906, 63.833309173583984, 67.5074234008789, 71.1815414428711, 74.85565948486328, 78.52976989746094, 82.20388793945312, 85.87800598144531, 89.5521240234375, 93.22624206542969, 96.90035247802734, 100.57447052001953]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 12.0, 21.0, 15.0, 19.0, 42.0, 37.0, 54.0, 88.0, 94.0, 204.0, 392.0, 742.0, 1611.0, 3838.0, 10860.0, 1018465.0, 6861.0, 2689.0, 1172.0, 510.0, 241.0, 175.0, 104.0, 61.0, 50.0, 41.0, 27.0, 22.0, 18.0, 10.0, 11.0, 6.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.861122131347656, -39.46613311767578, -38.071144104003906, -36.67615509033203, -35.28116226196289, -33.886173248291016, -32.49118423461914, -31.096195220947266, -29.701204299926758, -28.306215286254883, -26.911224365234375, -25.5162353515625, -24.121246337890625, -22.726255416870117, -21.331266403198242, -19.936275482177734, -18.54128646850586, -17.146297454833984, -15.751306533813477, -14.356317520141602, -12.96132755279541, -11.566337585449219, -10.171348571777344, -8.776358604431152, -7.381368637084961, -5.9863786697387695, -4.591389179229736, -3.196399688720703, -1.8014097213745117, -0.4064197540283203, 0.9885692596435547, 2.383559226989746, 3.7785491943359375, 5.173539161682129, 6.568528652191162, 7.963518142700195, 9.358508110046387, 10.753498077392578, 12.148487091064453, 13.543477058410645, 14.938467025756836, 16.33345603942871, 17.72844696044922, 19.123435974121094, 20.51842498779297, 21.913415908813477, 23.30840492248535, 24.70339584350586, 26.098384857177734, 27.49337387084961, 28.888364791870117, 30.283353805541992, 31.6783447265625, 33.073333740234375, 34.46832275390625, 35.863311767578125, 37.25830078125, 38.653289794921875, 40.04827880859375, 41.443267822265625, 42.838260650634766, 44.23324966430664, 45.628238677978516, 47.02322769165039, 48.41822052001953]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 7.0, 5.0, 12.0, 20.0, 24.0, 41.0, 50.0, 75.0, 224.0, 3021.0, 51458976.0, 464.0, 79.0, 45.0, 28.0, 19.0, 17.0, 10.0, 4.0, 8.0, 4.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-921.6270751953125, -887.8526611328125, -854.0783081054688, -820.303955078125, -786.529541015625, -752.755126953125, -718.9807739257812, -685.2064208984375, -651.4320068359375, -617.6575927734375, -583.8832397460938, -550.10888671875, -516.33447265625, -482.5600891113281, -448.78570556640625, -415.0113220214844, -381.2369384765625, -347.4625549316406, -313.68817138671875, -279.9137878417969, -246.139404296875, -212.36502075195312, -178.59063720703125, -144.81625366210938, -111.0418701171875, -77.26748657226562, -43.49310302734375, -9.718719482421875, 24.0556640625, 57.830047607421875, 91.60443115234375, 125.37881469726562, 159.1533203125, 192.92770385742188, 226.70208740234375, 260.4764709472656, 294.2508544921875, 328.0252380371094, 361.79962158203125, 395.5740051269531, 429.348388671875, 463.1227722167969, 496.89715576171875, 530.6715087890625, 564.4459228515625, 598.2203369140625, 631.9946899414062, 665.76904296875, 699.54345703125, 733.31787109375, 767.0922241210938, 800.8665771484375, 834.6409912109375, 868.4154052734375, 902.1897583007812, 935.964111328125, 969.738525390625, 1003.512939453125, 1037.287353515625, 1071.0616455078125, 1104.8360595703125, 1138.6104736328125, 1172.384765625, 1206.1591796875, 1239.93359375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 9.0, 25.0, 36.0, 53.0, 74.0, 127.0, 212.0, 296.0, 458.0, 672.0, 1073.0, 1790.0, 2834.0, 4344.0, 6764.0, 10843.0, 17458.0, 28334.0, 45892.0, 75295.0, 123355.0, 196151.0, 300431.0, 448290.0, 3196127.0, 814532.0, 363126.0, 244371.0, 156239.0, 97020.0, 59144.0, 36352.0, 22292.0, 13566.0, 8495.0, 5478.0, 3562.0, 2211.0, 1530.0, 979.0, 595.0, 367.0, 258.0, 146.0, 98.0, 51.0, 35.0, 18.0, 12.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1240234375, -1.088623046875, -1.05322265625, -1.017822265625, -0.982421875, -0.947021484375, -0.91162109375, -0.876220703125, -0.8408203125, -0.805419921875, -0.77001953125, -0.734619140625, -0.69921875, -0.663818359375, -0.62841796875, -0.593017578125, -0.5576171875, -0.522216796875, -0.48681640625, -0.451416015625, -0.416015625, -0.380615234375, -0.34521484375, -0.309814453125, -0.2744140625, -0.239013671875, -0.20361328125, -0.168212890625, -0.1328125, -0.097412109375, -0.06201171875, -0.026611328125, 0.0087890625, 0.044189453125, 0.07958984375, 0.114990234375, 0.150390625, 0.185791015625, 0.22119140625, 0.256591796875, 0.2919921875, 0.327392578125, 0.36279296875, 0.398193359375, 0.43359375, 0.468994140625, 0.50439453125, 0.539794921875, 0.5751953125, 0.610595703125, 0.64599609375, 0.681396484375, 0.716796875, 0.752197265625, 0.78759765625, 0.822998046875, 0.8583984375, 0.893798828125, 0.92919921875, 0.964599609375, 1.0, 1.035400390625, 1.07080078125, 1.106201171875, 1.1416015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 12.0, 11.0, 9.0, 8.0, 15.0, 16.0, 21.0, 33.0, 23.0, 37.0, 32.0, 35.0, 35.0, 47.0, 40.0, 48.0, 54.0, 1037.0, 63.0, 45.0, 35.0, 49.0, 32.0, 37.0, 34.0, 26.0, 43.0, 24.0, 19.0, 19.0, 16.0, 15.0, 9.0, 8.0, 12.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-31.359375, -30.50439453125, -29.6494140625, -28.79443359375, -27.939453125, -27.08447265625, -26.2294921875, -25.37451171875, -24.51953125, -23.66455078125, -22.8095703125, -21.95458984375, -21.099609375, -20.24462890625, -19.3896484375, -18.53466796875, -17.6796875, -16.82470703125, -15.9697265625, -15.11474609375, -14.259765625, -13.40478515625, -12.5498046875, -11.69482421875, -10.83984375, -9.98486328125, -9.1298828125, -8.27490234375, -7.419921875, -6.56494140625, -5.7099609375, -4.85498046875, -4.0, -3.14501953125, -2.2900390625, -1.43505859375, -0.580078125, 0.27490234375, 1.1298828125, 1.98486328125, 2.83984375, 3.69482421875, 4.5498046875, 5.40478515625, 6.259765625, 7.11474609375, 7.9697265625, 8.82470703125, 9.6796875, 10.53466796875, 11.3896484375, 12.24462890625, 13.099609375, 13.95458984375, 14.8095703125, 15.66455078125, 16.51953125, 17.37451171875, 18.2294921875, 19.08447265625, 19.939453125, 20.79443359375, 21.6494140625, 22.50439453125, 23.359375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 13.0, 11.0, 14.0, 33.0, 29.0, 52.0, 85.0, 143.0, 206.0, 316.0, 389.0, 522.0, 769.0, 1142.0, 1661.0, 2389.0, 3351.0, 5107.0, 7549.0, 11681.0, 17841.0, 28722.0, 46958.0, 78591.0, 137278.0, 239447.0, 400183.0, 1247563.0, 2977968.0, 437574.0, 263802.0, 152008.0, 87122.0, 51325.0, 31391.0, 19594.0, 12566.0, 8418.0, 5559.0, 3685.0, 2594.0, 1826.0, 1180.0, 847.0, 543.0, 424.0, 286.0, 193.0, 159.0, 97.0, 74.0, 47.0, 37.0, 26.0, 26.0, 9.0, 3.0, 6.0, 5.0, 2.0, 3.0], "bins": [-1.1376953125, -1.101104736328125, -1.06451416015625, -1.027923583984375, -0.9913330078125, -0.954742431640625, -0.91815185546875, -0.881561279296875, -0.844970703125, -0.808380126953125, -0.77178955078125, -0.735198974609375, -0.6986083984375, -0.662017822265625, -0.62542724609375, -0.588836669921875, -0.55224609375, -0.515655517578125, -0.47906494140625, -0.442474365234375, -0.4058837890625, -0.369293212890625, -0.33270263671875, -0.296112060546875, -0.259521484375, -0.222930908203125, -0.18634033203125, -0.149749755859375, -0.1131591796875, -0.076568603515625, -0.03997802734375, -0.003387451171875, 0.033203125, 0.069793701171875, 0.10638427734375, 0.142974853515625, 0.1795654296875, 0.216156005859375, 0.25274658203125, 0.289337158203125, 0.325927734375, 0.362518310546875, 0.39910888671875, 0.435699462890625, 0.4722900390625, 0.508880615234375, 0.54547119140625, 0.582061767578125, 0.61865234375, 0.655242919921875, 0.69183349609375, 0.728424072265625, 0.7650146484375, 0.801605224609375, 0.83819580078125, 0.874786376953125, 0.911376953125, 0.947967529296875, 0.98455810546875, 1.021148681640625, 1.0577392578125, 1.094329833984375, 1.13092041015625, 1.167510986328125, 1.2041015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 8.0, 8.0, 10.0, 9.0, 15.0, 11.0, 14.0, 24.0, 27.0, 32.0, 48.0, 61.0, 50.0, 52.0, 66.0, 1079.0, 72.0, 46.0, 51.0, 53.0, 44.0, 33.0, 31.0, 22.0, 27.0, 19.0, 17.0, 11.0, 17.0, 8.0, 8.0, 6.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.8125, -35.6845703125, -34.556640625, -33.4287109375, -32.30078125, -31.1728515625, -30.044921875, -28.9169921875, -27.7890625, -26.6611328125, -25.533203125, -24.4052734375, -23.27734375, -22.1494140625, -21.021484375, -19.8935546875, -18.765625, -17.6376953125, -16.509765625, -15.3818359375, -14.25390625, -13.1259765625, -11.998046875, -10.8701171875, -9.7421875, -8.6142578125, -7.486328125, -6.3583984375, -5.23046875, -4.1025390625, -2.974609375, -1.8466796875, -0.71875, 0.4091796875, 1.537109375, 2.6650390625, 3.79296875, 4.9208984375, 6.048828125, 7.1767578125, 8.3046875, 9.4326171875, 10.560546875, 11.6884765625, 12.81640625, 13.9443359375, 15.072265625, 16.2001953125, 17.328125, 18.4560546875, 19.583984375, 20.7119140625, 21.83984375, 22.9677734375, 24.095703125, 25.2236328125, 26.3515625, 27.4794921875, 28.607421875, 29.7353515625, 30.86328125, 31.9912109375, 33.119140625, 34.2470703125, 35.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 8.0, 2.0, 3.0, 1.0, 9.0, 5.0, 12.0, 11.0, 19.0, 10.0, 18.0, 20.0, 32.0, 24.0, 48.0, 47.0, 79.0, 130.0, 162.0, 208.0, 460.0, 864.0, 1495.0, 3678.0, 10749.0, 43270.0, 265051.0, 5868181.0, 72125.0, 15642.0, 4837.0, 1956.0, 884.0, 487.0, 299.0, 163.0, 145.0, 95.0, 63.0, 35.0, 27.0, 26.0, 13.0, 6.0, 8.0, 12.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.203125, -9.86474609375, -9.5263671875, -9.18798828125, -8.849609375, -8.51123046875, -8.1728515625, -7.83447265625, -7.49609375, -7.15771484375, -6.8193359375, -6.48095703125, -6.142578125, -5.80419921875, -5.4658203125, -5.12744140625, -4.7890625, -4.45068359375, -4.1123046875, -3.77392578125, -3.435546875, -3.09716796875, -2.7587890625, -2.42041015625, -2.08203125, -1.74365234375, -1.4052734375, -1.06689453125, -0.728515625, -0.39013671875, -0.0517578125, 0.28662109375, 0.625, 0.96337890625, 1.3017578125, 1.64013671875, 1.978515625, 2.31689453125, 2.6552734375, 2.99365234375, 3.33203125, 3.67041015625, 4.0087890625, 4.34716796875, 4.685546875, 5.02392578125, 5.3623046875, 5.70068359375, 6.0390625, 6.37744140625, 6.7158203125, 7.05419921875, 7.392578125, 7.73095703125, 8.0693359375, 8.40771484375, 8.74609375, 9.08447265625, 9.4228515625, 9.76123046875, 10.099609375, 10.43798828125, 10.7763671875, 11.11474609375, 11.453125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 13.0, 13.0, 14.0, 20.0, 25.0, 26.0, 39.0, 43.0, 50.0, 66.0, 76.0, 74.0, 1103.0, 72.0, 67.0, 48.0, 66.0, 51.0, 38.0, 15.0, 23.0, 13.0, 19.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.0625, -69.21484375, -67.3671875, -65.51953125, -63.671875, -61.82421875, -59.9765625, -58.12890625, -56.28125, -54.43359375, -52.5859375, -50.73828125, -48.890625, -47.04296875, -45.1953125, -43.34765625, -41.5, -39.65234375, -37.8046875, -35.95703125, -34.109375, -32.26171875, -30.4140625, -28.56640625, -26.71875, -24.87109375, -23.0234375, -21.17578125, -19.328125, -17.48046875, -15.6328125, -13.78515625, -11.9375, -10.08984375, -8.2421875, -6.39453125, -4.546875, -2.69921875, -0.8515625, 0.99609375, 2.84375, 4.69140625, 6.5390625, 8.38671875, 10.234375, 12.08203125, 13.9296875, 15.77734375, 17.625, 19.47265625, 21.3203125, 23.16796875, 25.015625, 26.86328125, 28.7109375, 30.55859375, 32.40625, 34.25390625, 36.1015625, 37.94921875, 39.796875, 41.64453125, 43.4921875, 45.33984375, 47.1875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 15.0, 26.0, 107.0, 439.0, 299.0, 66.0, 16.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.61796569824219, -112.85746765136719, -110.09696960449219, -107.33647155761719, -104.57597351074219, -101.81546783447266, -99.05496978759766, -96.29447174072266, -93.53397369384766, -90.77347564697266, -88.01297760009766, -85.25247955322266, -82.49197387695312, -79.73147583007812, -76.97097778320312, -74.21047973632812, -71.44998168945312, -68.68948364257812, -65.92898559570312, -63.16848373413086, -60.40798568725586, -57.64748764038086, -54.886985778808594, -52.126487731933594, -49.365989685058594, -46.605491638183594, -43.844993591308594, -41.08449172973633, -38.32399368286133, -35.56349563598633, -32.80299377441406, -30.042495727539062, -27.282005310058594, -24.521507263183594, -21.76100730895996, -19.000507354736328, -16.240009307861328, -13.479510307312012, -10.719011306762695, -7.9585113525390625, -5.1980133056640625, -2.437514305114746, 0.3229846954345703, 3.0834836959838867, 5.843982696533203, 8.60448169708252, 11.364980697631836, 14.125480651855469, 16.88597869873047, 19.64647674560547, 22.4069766998291, 25.167476654052734, 27.927974700927734, 30.688472747802734, 33.448974609375, 36.20947265625, 38.969970703125, 41.73046875, 44.490966796875, 47.251468658447266, 50.011966705322266, 52.772464752197266, 55.53296661376953, 58.29346466064453, 61.05396270751953]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 9.0, 5.0, 8.0, 14.0, 17.0, 33.0, 76.0, 229.0, 236.0, 191.0, 90.0, 20.0, 21.0, 11.0, 8.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.84921264648438, -193.88018798828125, -187.91116333007812, -181.942138671875, -175.97311401367188, -170.00408935546875, -164.03506469726562, -158.06605529785156, -152.09703063964844, -146.1280059814453, -140.1589813232422, -134.18995666503906, -128.22093200683594, -122.25191497802734, -116.28289031982422, -110.31387329101562, -104.34484100341797, -98.37581634521484, -92.40679168701172, -86.43777465820312, -80.46875, -74.49972534179688, -68.53070068359375, -62.56167984008789, -56.592655181884766, -50.62363052368164, -44.65460968017578, -38.685585021972656, -32.71656036376953, -26.747539520263672, -20.778514862060547, -14.809494018554688, -8.840469360351562, -2.871446132659912, 3.0975770950317383, 9.066600799560547, 15.035623550415039, 21.00464630126953, 26.973670959472656, 32.942691802978516, 38.91171646118164, 44.880741119384766, 50.849761962890625, 56.81878662109375, 62.787811279296875, 68.7568359375, 74.72586059570312, 80.69487762451172, 86.66390228271484, 92.63292694091797, 98.6019515991211, 104.57096862792969, 110.53999328613281, 116.50901794433594, 122.47804260253906, 128.4470672607422, 134.4160919189453, 140.38511657714844, 146.35414123535156, 152.3231658935547, 158.2921905517578, 164.26119995117188, 170.230224609375, 176.19924926757812, 182.16827392578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 15.0, 12.0, 5.0, 22.0, 16.0, 27.0, 48.0, 84.0, 102.0, 155.0, 269.0, 407.0, 634.0, 1141.0, 2273.0, 4799.0, 12957.0, 99420.0, 3999940.0, 53653.0, 9875.0, 3933.0, 1888.0, 1016.0, 616.0, 327.0, 203.0, 156.0, 79.0, 53.0, 56.0, 27.0, 15.0, 17.0, 8.0, 10.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.37841796875, -0.3677253723144531, -0.35703277587890625, -0.3463401794433594, -0.3356475830078125, -0.3249549865722656, -0.31426239013671875, -0.3035697937011719, -0.292877197265625, -0.2821846008300781, -0.27149200439453125, -0.2607994079589844, -0.2501068115234375, -0.23941421508789062, -0.22872161865234375, -0.21802902221679688, -0.20733642578125, -0.19664382934570312, -0.18595123291015625, -0.17525863647460938, -0.1645660400390625, -0.15387344360351562, -0.14318084716796875, -0.13248825073242188, -0.121795654296875, -0.11110305786132812, -0.10041046142578125, -0.08971786499023438, -0.0790252685546875, -0.06833267211914062, -0.05764007568359375, -0.046947479248046875, -0.0362548828125, -0.025562286376953125, -0.01486968994140625, -0.004177093505859375, 0.0065155029296875, 0.017208099365234375, 0.02790069580078125, 0.038593292236328125, 0.049285888671875, 0.059978485107421875, 0.07067108154296875, 0.08136367797851562, 0.0920562744140625, 0.10274887084960938, 0.11344146728515625, 0.12413406372070312, 0.13482666015625, 0.14551925659179688, 0.15621185302734375, 0.16690444946289062, 0.1775970458984375, 0.18828964233398438, 0.19898223876953125, 0.20967483520507812, 0.220367431640625, 0.23106002807617188, 0.24175262451171875, 0.2524452209472656, 0.2631378173828125, 0.2738304138183594, 0.28452301025390625, 0.2952156066894531, 0.305908203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 11.0, 4.0, 16.0, 8.0, 11.0, 11.0, 9.0, 23.0, 472.0, 317.0, 24.0, 16.0, 16.0, 9.0, 6.0, 2.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381103515625, -0.36917877197265625, -0.3572540283203125, -0.34532928466796875, -0.333404541015625, -0.32147979736328125, -0.3095550537109375, -0.29763031005859375, -0.28570556640625, -0.27378082275390625, -0.2618560791015625, -0.24993133544921875, -0.238006591796875, -0.22608184814453125, -0.2141571044921875, -0.20223236083984375, -0.1903076171875, -0.17838287353515625, -0.1664581298828125, -0.15453338623046875, -0.142608642578125, -0.13068389892578125, -0.1187591552734375, -0.10683441162109375, -0.09490966796875, -0.08298492431640625, -0.0710601806640625, -0.05913543701171875, -0.047210693359375, -0.03528594970703125, -0.0233612060546875, -0.01143646240234375, 0.00048828125, 0.01241302490234375, 0.0243377685546875, 0.03626251220703125, 0.048187255859375, 0.06011199951171875, 0.0720367431640625, 0.08396148681640625, 0.09588623046875, 0.10781097412109375, 0.1197357177734375, 0.13166046142578125, 0.143585205078125, 0.15550994873046875, 0.1674346923828125, 0.17935943603515625, 0.1912841796875, 0.20320892333984375, 0.2151336669921875, 0.22705841064453125, 0.238983154296875, 0.25090789794921875, 0.2628326416015625, 0.27475738525390625, 0.28668212890625, 0.29860687255859375, 0.3105316162109375, 0.32245635986328125, 0.334381103515625, 0.34630584716796875, 0.3582305908203125, 0.37015533447265625, 0.382080078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 13.0, 17.0, 28.0, 34.0, 44.0, 82.0, 112.0, 226.0, 414.0, 784.0, 1709.0, 4653.0, 16257.0, 112204.0, 3818268.0, 205621.0, 23380.0, 5978.0, 2219.0, 952.0, 484.0, 307.0, 147.0, 112.0, 78.0, 40.0, 32.0, 15.0, 13.0, 16.0, 10.0, 3.0, 7.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3282051086425781, -0.31485748291015625, -0.3015098571777344, -0.2881622314453125, -0.2748146057128906, -0.26146697998046875, -0.24811935424804688, -0.234771728515625, -0.22142410278320312, -0.20807647705078125, -0.19472885131835938, -0.1813812255859375, -0.16803359985351562, -0.15468597412109375, -0.14133834838867188, -0.12799072265625, -0.11464309692382812, -0.10129547119140625, -0.08794784545898438, -0.0746002197265625, -0.061252593994140625, -0.04790496826171875, -0.034557342529296875, -0.021209716796875, -0.007862091064453125, 0.00548553466796875, 0.018833160400390625, 0.0321807861328125, 0.045528411865234375, 0.05887603759765625, 0.07222366333007812, 0.0855712890625, 0.09891891479492188, 0.11226654052734375, 0.12561416625976562, 0.1389617919921875, 0.15230941772460938, 0.16565704345703125, 0.17900466918945312, 0.192352294921875, 0.20569992065429688, 0.21904754638671875, 0.23239517211914062, 0.2457427978515625, 0.2590904235839844, 0.27243804931640625, 0.2857856750488281, 0.29913330078125, 0.3124809265136719, 0.32582855224609375, 0.3391761779785156, 0.3525238037109375, 0.3658714294433594, 0.37921905517578125, 0.3925666809082031, 0.405914306640625, 0.4192619323730469, 0.43260955810546875, 0.4459571838378906, 0.4593048095703125, 0.4726524353027344, 0.48600006103515625, 0.4993476867675781, 0.5126953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 9.0, 2.0, 10.0, 10.0, 13.0, 22.0, 19.0, 29.0, 35.0, 81.0, 134.0, 304.0, 1300.0, 1301.0, 340.0, 129.0, 101.0, 69.0, 44.0, 33.0, 19.0, 18.0, 8.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.198974609375, -0.19255447387695312, -0.18613433837890625, -0.17971420288085938, -0.1732940673828125, -0.16687393188476562, -0.16045379638671875, -0.15403366088867188, -0.147613525390625, -0.14119338989257812, -0.13477325439453125, -0.12835311889648438, -0.1219329833984375, -0.11551284790039062, -0.10909271240234375, -0.10267257690429688, -0.09625244140625, -0.08983230590820312, -0.08341217041015625, -0.07699203491210938, -0.0705718994140625, -0.06415176391601562, -0.05773162841796875, -0.051311492919921875, -0.044891357421875, -0.038471221923828125, -0.03205108642578125, -0.025630950927734375, -0.0192108154296875, -0.012790679931640625, -0.00637054443359375, 4.9591064453125e-05, 0.0064697265625, 0.012889862060546875, 0.01930999755859375, 0.025730133056640625, 0.0321502685546875, 0.038570404052734375, 0.04499053955078125, 0.051410675048828125, 0.057830810546875, 0.06425094604492188, 0.07067108154296875, 0.07709121704101562, 0.0835113525390625, 0.08993148803710938, 0.09635162353515625, 0.10277175903320312, 0.10919189453125, 0.11561203002929688, 0.12203216552734375, 0.12845230102539062, 0.1348724365234375, 0.14129257202148438, 0.14771270751953125, 0.15413284301757812, 0.160552978515625, 0.16697311401367188, 0.17339324951171875, 0.17981338500976562, 0.1862335205078125, 0.19265365600585938, 0.19907379150390625, 0.20549392700195312, 0.2119140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 10.0, 52.0, 357.0, 464.0, 82.0, 20.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6174995303153992, -0.5556272268295288, -0.49375489354133606, -0.4318825602531433, -0.37001025676727295, -0.3081379234790802, -0.24626559019088745, -0.1843932867050171, -0.12252095341682434, -0.06064863130450249, 0.0012236908078193665, 0.06309601664543152, 0.12496833503246307, 0.18684065341949463, 0.24871298670768738, 0.31058529019355774, 0.3724576234817505, 0.43432995676994324, 0.4962022602558136, 0.5580745935440063, 0.6199468970298767, 0.6818192005157471, 0.7436915636062622, 0.8055638670921326, 0.8674361705780029, 0.9293084740638733, 0.9911808371543884, 1.0530531406402588, 1.114925503730774, 1.1767977476119995, 1.2386701107025146, 1.3005423545837402, 1.3624147176742554, 1.4242870807647705, 1.486159324645996, 1.5480316877365112, 1.6099040508270264, 1.671776294708252, 1.733648657798767, 1.7955210208892822, 1.8573932647705078, 1.919265627861023, 1.9811378717422485, 2.0430102348327637, 2.1048824787139893, 2.166754961013794, 2.2286272048950195, 2.290499448776245, 2.35237193107605, 2.4142441749572754, 2.47611665725708, 2.5379889011383057, 2.5998611450195312, 2.661733627319336, 2.7236058712005615, 2.785478115081787, 2.8473503589630127, 2.9092226028442383, 2.971095085144043, 3.0329673290252686, 3.094839572906494, 3.156712055206299, 3.2185842990875244, 3.28045654296875, 3.3423290252685547]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 14.0, 13.0, 20.0, 35.0, 34.0, 43.0, 58.0, 70.0, 61.0, 57.0, 61.0, 63.0, 59.0, 61.0, 64.0, 51.0, 54.0, 40.0, 32.0, 25.0, 22.0, 11.0, 13.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6864107847213745, -0.6605428457260132, -0.6346749663352966, -0.6088070869445801, -0.5829391479492188, -0.5570712089538574, -0.5312033295631409, -0.5053354501724243, -0.479467511177063, -0.45359960198402405, -0.4277316927909851, -0.40186378359794617, -0.3759958744049072, -0.3501279652118683, -0.32426005601882935, -0.2983921468257904, -0.27252423763275146, -0.24665632843971252, -0.22078841924667358, -0.19492051005363464, -0.1690526008605957, -0.14318469166755676, -0.11731678247451782, -0.09144887328147888, -0.06558096408843994, -0.039713054895401, -0.01384514570236206, 0.01202276349067688, 0.03789067268371582, 0.06375858187675476, 0.0896264910697937, 0.11549440026283264, 0.14136236906051636, 0.1672302782535553, 0.19309818744659424, 0.21896609663963318, 0.24483400583267212, 0.27070191502571106, 0.29656982421875, 0.32243773341178894, 0.3483056426048279, 0.3741735517978668, 0.40004146099090576, 0.4259093701839447, 0.45177727937698364, 0.4776451885700226, 0.5035130977630615, 0.5293810367584229, 0.5552489161491394, 0.581116795539856, 0.6069847345352173, 0.6328526735305786, 0.6587205529212952, 0.6845884323120117, 0.710456371307373, 0.7363243103027344, 0.7621921896934509, 0.7880600690841675, 0.8139280080795288, 0.8397959470748901, 0.8656638264656067, 0.8915317058563232, 0.9173996448516846, 0.9432675838470459, 0.9691354632377625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 10.0, 7.0, 11.0, 21.0, 31.0, 46.0, 50.0, 96.0, 145.0, 231.0, 327.0, 529.0, 872.0, 1466.0, 2718.0, 5450.0, 12057.0, 35245.0, 911940.0, 48986.0, 14445.0, 6337.0, 3162.0, 1745.0, 982.0, 596.0, 361.0, 230.0, 153.0, 106.0, 53.0, 50.0, 34.0, 21.0, 6.0, 11.0, 13.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7353515625, -1.680450439453125, -1.62554931640625, -1.570648193359375, -1.5157470703125, -1.460845947265625, -1.40594482421875, -1.351043701171875, -1.296142578125, -1.241241455078125, -1.18634033203125, -1.131439208984375, -1.0765380859375, -1.021636962890625, -0.96673583984375, -0.911834716796875, -0.85693359375, -0.802032470703125, -0.74713134765625, -0.692230224609375, -0.6373291015625, -0.582427978515625, -0.52752685546875, -0.472625732421875, -0.417724609375, -0.362823486328125, -0.30792236328125, -0.253021240234375, -0.1981201171875, -0.143218994140625, -0.08831787109375, -0.033416748046875, 0.021484375, 0.076385498046875, 0.13128662109375, 0.186187744140625, 0.2410888671875, 0.295989990234375, 0.35089111328125, 0.405792236328125, 0.460693359375, 0.515594482421875, 0.57049560546875, 0.625396728515625, 0.6802978515625, 0.735198974609375, 0.79010009765625, 0.845001220703125, 0.89990234375, 0.954803466796875, 1.00970458984375, 1.064605712890625, 1.1195068359375, 1.174407958984375, 1.22930908203125, 1.284210205078125, 1.339111328125, 1.394012451171875, 1.44891357421875, 1.503814697265625, 1.5587158203125, 1.613616943359375, 1.66851806640625, 1.723419189453125, 1.7783203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 8.0, 13.0, 8.0, 16.0, 23.0, 737.0, 50.0, 19.0, 15.0, 18.0, 8.0, 5.0, 4.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376220703125, -0.3643760681152344, -0.35253143310546875, -0.3406867980957031, -0.3288421630859375, -0.3169975280761719, -0.30515289306640625, -0.2933082580566406, -0.281463623046875, -0.2696189880371094, -0.25777435302734375, -0.24592971801757812, -0.2340850830078125, -0.22224044799804688, -0.21039581298828125, -0.19855117797851562, -0.18670654296875, -0.17486190795898438, -0.16301727294921875, -0.15117263793945312, -0.1393280029296875, -0.12748336791992188, -0.11563873291015625, -0.10379409790039062, -0.091949462890625, -0.08010482788085938, -0.06826019287109375, -0.056415557861328125, -0.0445709228515625, -0.032726287841796875, -0.02088165283203125, -0.009037017822265625, 0.0028076171875, 0.014652252197265625, 0.02649688720703125, 0.038341522216796875, 0.0501861572265625, 0.062030792236328125, 0.07387542724609375, 0.08572006225585938, 0.097564697265625, 0.10940933227539062, 0.12125396728515625, 0.13309860229492188, 0.1449432373046875, 0.15678787231445312, 0.16863250732421875, 0.18047714233398438, 0.19232177734375, 0.20416641235351562, 0.21601104736328125, 0.22785568237304688, 0.2397003173828125, 0.2515449523925781, 0.26338958740234375, 0.2752342224121094, 0.287078857421875, 0.2989234924316406, 0.31076812744140625, 0.3226127624511719, 0.3344573974609375, 0.3463020324707031, 0.35814666748046875, 0.3699913024902344, 0.3818359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 8.0, 13.0, 12.0, 17.0, 23.0, 28.0, 37.0, 46.0, 60.0, 101.0, 105.0, 155.0, 222.0, 335.0, 557.0, 1401.0, 4210.0, 15249.0, 79087.0, 636161.0, 261672.0, 35930.0, 8295.0, 2449.0, 936.0, 426.0, 312.0, 175.0, 146.0, 101.0, 66.0, 62.0, 48.0, 25.0, 21.0, 19.0, 16.0, 15.0, 2.0, 6.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.966796875, -0.93817138671875, -0.9095458984375, -0.88092041015625, -0.852294921875, -0.82366943359375, -0.7950439453125, -0.76641845703125, -0.73779296875, -0.70916748046875, -0.6805419921875, -0.65191650390625, -0.623291015625, -0.59466552734375, -0.5660400390625, -0.53741455078125, -0.5087890625, -0.48016357421875, -0.4515380859375, -0.42291259765625, -0.394287109375, -0.36566162109375, -0.3370361328125, -0.30841064453125, -0.27978515625, -0.25115966796875, -0.2225341796875, -0.19390869140625, -0.165283203125, -0.13665771484375, -0.1080322265625, -0.07940673828125, -0.05078125, -0.02215576171875, 0.0064697265625, 0.03509521484375, 0.063720703125, 0.09234619140625, 0.1209716796875, 0.14959716796875, 0.17822265625, 0.20684814453125, 0.2354736328125, 0.26409912109375, 0.292724609375, 0.32135009765625, 0.3499755859375, 0.37860107421875, 0.4072265625, 0.43585205078125, 0.4644775390625, 0.49310302734375, 0.521728515625, 0.55035400390625, 0.5789794921875, 0.60760498046875, 0.63623046875, 0.66485595703125, 0.6934814453125, 0.72210693359375, 0.750732421875, 0.77935791015625, 0.8079833984375, 0.83660888671875, 0.865234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 13.0, 14.0, 11.0, 16.0, 16.0, 21.0, 33.0, 27.0, 35.0, 33.0, 33.0, 41.0, 39.0, 55.0, 43.0, 34.0, 43.0, 40.0, 42.0, 42.0, 36.0, 33.0, 34.0, 31.0, 44.0, 28.0, 29.0, 18.0, 21.0, 18.0, 11.0, 18.0, 7.0, 5.0, 6.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9140625, -0.8803863525390625, -0.846710205078125, -0.8130340576171875, -0.77935791015625, -0.7456817626953125, -0.712005615234375, -0.6783294677734375, -0.6446533203125, -0.6109771728515625, -0.577301025390625, -0.5436248779296875, -0.50994873046875, -0.4762725830078125, -0.442596435546875, -0.4089202880859375, -0.375244140625, -0.3415679931640625, -0.307891845703125, -0.2742156982421875, -0.24053955078125, -0.2068634033203125, -0.173187255859375, -0.1395111083984375, -0.1058349609375, -0.0721588134765625, -0.038482666015625, -0.0048065185546875, 0.02886962890625, 0.0625457763671875, 0.096221923828125, 0.1298980712890625, 0.16357421875, 0.1972503662109375, 0.230926513671875, 0.2646026611328125, 0.29827880859375, 0.3319549560546875, 0.365631103515625, 0.3993072509765625, 0.4329833984375, 0.4666595458984375, 0.500335693359375, 0.5340118408203125, 0.56768798828125, 0.6013641357421875, 0.635040283203125, 0.6687164306640625, 0.702392578125, 0.7360687255859375, 0.769744873046875, 0.8034210205078125, 0.83709716796875, 0.8707733154296875, 0.904449462890625, 0.9381256103515625, 0.9718017578125, 1.0054779052734375, 1.039154052734375, 1.0728302001953125, 1.10650634765625, 1.1401824951171875, 1.173858642578125, 1.2075347900390625, 1.2412109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 13.0, 23.0, 65.0, 145.0, 403.0, 1920.0, 48673.0, 991377.0, 4825.0, 709.0, 207.0, 98.0, 40.0, 23.0, 13.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.2637939453125, -1.218994140625, -1.1741943359375, -1.12939453125, -1.0845947265625, -1.039794921875, -0.9949951171875, -0.9501953125, -0.9053955078125, -0.860595703125, -0.8157958984375, -0.77099609375, -0.7261962890625, -0.681396484375, -0.6365966796875, -0.591796875, -0.5469970703125, -0.502197265625, -0.4573974609375, -0.41259765625, -0.3677978515625, -0.322998046875, -0.2781982421875, -0.2333984375, -0.1885986328125, -0.143798828125, -0.0989990234375, -0.05419921875, -0.0093994140625, 0.035400390625, 0.0802001953125, 0.125, 0.1697998046875, 0.214599609375, 0.2593994140625, 0.30419921875, 0.3489990234375, 0.393798828125, 0.4385986328125, 0.4833984375, 0.5281982421875, 0.572998046875, 0.6177978515625, 0.66259765625, 0.7073974609375, 0.752197265625, 0.7969970703125, 0.841796875, 0.8865966796875, 0.931396484375, 0.9761962890625, 1.02099609375, 1.0657958984375, 1.110595703125, 1.1553955078125, 1.2001953125, 1.2449951171875, 1.289794921875, 1.3345947265625, 1.37939453125, 1.4241943359375, 1.468994140625, 1.5137939453125, 1.55859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 2.0, 10.0, 4.0, 10.0, 13.0, 21.0, 20.0, 32.0, 39.0, 60.0, 63.0, 72.0, 88.0, 89.0, 98.0, 68.0, 66.0, 71.0, 45.0, 32.0, 33.0, 15.0, 11.0, 12.0, 10.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.2007694244384766e-05, -3.1132251024246216e-05, -3.0256807804107666e-05, -2.9381364583969116e-05, -2.8505921363830566e-05, -2.7630478143692017e-05, -2.6755034923553467e-05, -2.5879591703414917e-05, -2.5004148483276367e-05, -2.4128705263137817e-05, -2.3253262042999268e-05, -2.2377818822860718e-05, -2.1502375602722168e-05, -2.0626932382583618e-05, -1.975148916244507e-05, -1.887604594230652e-05, -1.800060272216797e-05, -1.712515950202942e-05, -1.624971628189087e-05, -1.537427306175232e-05, -1.449882984161377e-05, -1.362338662147522e-05, -1.274794340133667e-05, -1.187250018119812e-05, -1.099705696105957e-05, -1.012161374092102e-05, -9.24617052078247e-06, -8.370727300643921e-06, -7.495284080505371e-06, -6.619840860366821e-06, -5.7443976402282715e-06, -4.868954420089722e-06, -3.993511199951172e-06, -3.118067979812622e-06, -2.2426247596740723e-06, -1.3671815395355225e-06, -4.917383193969727e-07, 3.8370490074157715e-07, 1.259148120880127e-06, 2.1345913410186768e-06, 3.0100345611572266e-06, 3.885477781295776e-06, 4.760921001434326e-06, 5.636364221572876e-06, 6.511807441711426e-06, 7.387250661849976e-06, 8.262693881988525e-06, 9.138137102127075e-06, 1.0013580322265625e-05, 1.0889023542404175e-05, 1.1764466762542725e-05, 1.2639909982681274e-05, 1.3515353202819824e-05, 1.4390796422958374e-05, 1.5266239643096924e-05, 1.6141682863235474e-05, 1.7017126083374023e-05, 1.7892569303512573e-05, 1.8768012523651123e-05, 1.9643455743789673e-05, 2.0518898963928223e-05, 2.1394342184066772e-05, 2.2269785404205322e-05, 2.3145228624343872e-05, 2.4020671844482422e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 7.0, 9.0, 11.0, 19.0, 40.0, 30.0, 80.0, 99.0, 177.0, 342.0, 593.0, 1330.0, 3655.0, 14909.0, 149578.0, 810142.0, 54465.0, 8363.0, 2486.0, 1025.0, 489.0, 242.0, 163.0, 82.0, 67.0, 33.0, 21.0, 19.0, 11.0, 3.0, 10.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.438720703125, -0.4259376525878906, -0.41315460205078125, -0.4003715515136719, -0.3875885009765625, -0.3748054504394531, -0.36202239990234375, -0.3492393493652344, -0.336456298828125, -0.3236732482910156, -0.31089019775390625, -0.2981071472167969, -0.2853240966796875, -0.2725410461425781, -0.25975799560546875, -0.24697494506835938, -0.23419189453125, -0.22140884399414062, -0.20862579345703125, -0.19584274291992188, -0.1830596923828125, -0.17027664184570312, -0.15749359130859375, -0.14471054077148438, -0.131927490234375, -0.11914443969726562, -0.10636138916015625, -0.09357833862304688, -0.0807952880859375, -0.06801223754882812, -0.05522918701171875, -0.042446136474609375, -0.0296630859375, -0.016880035400390625, -0.00409698486328125, 0.008686065673828125, 0.0214691162109375, 0.034252166748046875, 0.04703521728515625, 0.059818267822265625, 0.072601318359375, 0.08538436889648438, 0.09816741943359375, 0.11095046997070312, 0.1237335205078125, 0.13651657104492188, 0.14929962158203125, 0.16208267211914062, 0.17486572265625, 0.18764877319335938, 0.20043182373046875, 0.21321487426757812, 0.2259979248046875, 0.23878097534179688, 0.25156402587890625, 0.2643470764160156, 0.277130126953125, 0.2899131774902344, 0.30269622802734375, 0.3154792785644531, 0.3282623291015625, 0.3410453796386719, 0.35382843017578125, 0.3666114807128906, 0.37939453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 16.0, 21.0, 29.0, 47.0, 72.0, 76.0, 114.0, 95.0, 108.0, 96.0, 75.0, 52.0, 38.0, 27.0, 20.0, 21.0, 14.0, 13.0, 6.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4638671875, -0.447723388671875, -0.43157958984375, -0.415435791015625, -0.3992919921875, -0.383148193359375, -0.36700439453125, -0.350860595703125, -0.334716796875, -0.318572998046875, -0.30242919921875, -0.286285400390625, -0.2701416015625, -0.253997802734375, -0.23785400390625, -0.221710205078125, -0.20556640625, -0.189422607421875, -0.17327880859375, -0.157135009765625, -0.1409912109375, -0.124847412109375, -0.10870361328125, -0.092559814453125, -0.076416015625, -0.060272216796875, -0.04412841796875, -0.027984619140625, -0.0118408203125, 0.004302978515625, 0.02044677734375, 0.036590576171875, 0.052734375, 0.068878173828125, 0.08502197265625, 0.101165771484375, 0.1173095703125, 0.133453369140625, 0.14959716796875, 0.165740966796875, 0.181884765625, 0.198028564453125, 0.21417236328125, 0.230316162109375, 0.2464599609375, 0.262603759765625, 0.27874755859375, 0.294891357421875, 0.31103515625, 0.327178955078125, 0.34332275390625, 0.359466552734375, 0.3756103515625, 0.391754150390625, 0.40789794921875, 0.424041748046875, 0.440185546875, 0.456329345703125, 0.47247314453125, 0.488616943359375, 0.5047607421875, 0.520904541015625, 0.53704833984375, 0.553192138671875, 0.5693359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 34.0, 628.0, 300.0, 20.0, 8.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.820430755615234, -19.770545959472656, -18.720661163330078, -17.6707763671875, -16.620891571044922, -15.57100772857666, -14.521123886108398, -13.47123908996582, -12.421354293823242, -11.371469497680664, -10.321584701538086, -9.271700859069824, -8.221816062927246, -7.171931266784668, -6.122046947479248, -5.072162628173828, -4.02227783203125, -2.972393274307251, -1.922508716583252, -0.8726241588592529, 0.1772603988647461, 1.2271451950073242, 2.277029514312744, 3.326913833618164, 4.376798629760742, 5.42668342590332, 6.47656774520874, 7.52645206451416, 8.576336860656738, 9.626221656799316, 10.676105499267578, 11.725990295410156, 12.775875091552734, 13.825759887695312, 14.87564468383789, 15.925528526306152, 16.975414276123047, 18.025299072265625, 19.07518196105957, 20.12506675720215, 21.174951553344727, 22.224836349487305, 23.274721145629883, 24.32460594177246, 25.374488830566406, 26.424373626708984, 27.474258422851562, 28.52414321899414, 29.57402801513672, 30.623912811279297, 31.673797607421875, 32.72368240356445, 33.77356719970703, 34.82345199584961, 35.87333679199219, 36.9232177734375, 37.973106384277344, 39.02299118041992, 40.0728759765625, 41.12276077270508, 42.172645568847656, 43.222530364990234, 44.27241516113281, 45.322296142578125, 46.3721809387207]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 4.0, 9.0, 4.0, 3.0, 4.0, 23.0, 22.0, 41.0, 48.0, 85.0, 129.0, 123.0, 131.0, 104.0, 67.0, 52.0, 27.0, 15.0, 20.0, 8.0, 9.0, 7.0, 9.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-22.300975799560547, -21.725990295410156, -21.1510066986084, -20.576021194458008, -20.001035690307617, -19.426050186157227, -18.85106658935547, -18.276081085205078, -17.701095581054688, -17.126110076904297, -16.55112648010254, -15.976140975952148, -15.401155471801758, -14.826170921325684, -14.25118637084961, -13.676200866699219, -13.101216316223145, -12.52623176574707, -11.95124626159668, -11.376261711120605, -10.801276206970215, -10.22629165649414, -9.65130615234375, -9.076321601867676, -8.501337051391602, -7.926352024078369, -7.351366996765137, -6.7763824462890625, -6.201396942138672, -5.626412391662598, -5.051427364349365, -4.476442337036133, -3.901456832885742, -3.3264718055725098, -2.7514867782592773, -2.176501989364624, -1.6015169620513916, -1.0265319347381592, -0.45154714584350586, 0.12343788146972656, 0.698422908782959, 1.2734079360961914, 1.8483928442001343, 2.423377752304077, 2.9983627796173096, 3.573347806930542, 4.148332595825195, 4.723317623138428, 5.29830265045166, 5.873287677764893, 6.448272705078125, 7.023257255554199, 7.59824275970459, 8.173227310180664, 8.748212814331055, 9.323197364807129, 9.898181915283203, 10.473166465759277, 11.048151969909668, 11.623136520385742, 12.198122024536133, 12.773106575012207, 13.348091125488281, 13.923076629638672, 14.498062133789062]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 11.0, 15.0, 26.0, 54.0, 102.0, 206.0, 379.0, 770.0, 1582.0, 3998.0, 14598.0, 157214.0, 3978726.0, 27729.0, 5574.0, 1728.0, 735.0, 365.0, 212.0, 103.0, 55.0, 34.0, 25.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.544921875, -3.431304931640625, -3.31768798828125, -3.204071044921875, -3.0904541015625, -2.976837158203125, -2.86322021484375, -2.749603271484375, -2.635986328125, -2.522369384765625, -2.40875244140625, -2.295135498046875, -2.1815185546875, -2.067901611328125, -1.95428466796875, -1.840667724609375, -1.72705078125, -1.613433837890625, -1.49981689453125, -1.386199951171875, -1.2725830078125, -1.158966064453125, -1.04534912109375, -0.931732177734375, -0.818115234375, -0.704498291015625, -0.59088134765625, -0.477264404296875, -0.3636474609375, -0.250030517578125, -0.13641357421875, -0.022796630859375, 0.0908203125, 0.204437255859375, 0.31805419921875, 0.431671142578125, 0.5452880859375, 0.658905029296875, 0.77252197265625, 0.886138916015625, 0.999755859375, 1.113372802734375, 1.22698974609375, 1.340606689453125, 1.4542236328125, 1.567840576171875, 1.68145751953125, 1.795074462890625, 1.90869140625, 2.022308349609375, 2.13592529296875, 2.249542236328125, 2.3631591796875, 2.476776123046875, 2.59039306640625, 2.704010009765625, 2.817626953125, 2.931243896484375, 3.04486083984375, 3.158477783203125, 3.2720947265625, 3.385711669921875, 3.49932861328125, 3.612945556640625, 3.7265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 11.0, 11.0, 13.0, 25.0, 23.0, 306.0, 448.0, 47.0, 24.0, 14.0, 16.0, 8.0, 4.0, 8.0, 8.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.333587646484375, -0.32318115234375, -0.312774658203125, -0.3023681640625, -0.291961669921875, -0.28155517578125, -0.271148681640625, -0.2607421875, -0.250335693359375, -0.23992919921875, -0.229522705078125, -0.2191162109375, -0.208709716796875, -0.19830322265625, -0.187896728515625, -0.177490234375, -0.167083740234375, -0.15667724609375, -0.146270751953125, -0.1358642578125, -0.125457763671875, -0.11505126953125, -0.104644775390625, -0.09423828125, -0.083831787109375, -0.07342529296875, -0.063018798828125, -0.0526123046875, -0.042205810546875, -0.03179931640625, -0.021392822265625, -0.010986328125, -0.000579833984375, 0.00982666015625, 0.020233154296875, 0.0306396484375, 0.041046142578125, 0.05145263671875, 0.061859130859375, 0.072265625, 0.082672119140625, 0.09307861328125, 0.103485107421875, 0.1138916015625, 0.124298095703125, 0.13470458984375, 0.145111083984375, 0.155517578125, 0.165924072265625, 0.17633056640625, 0.186737060546875, 0.1971435546875, 0.207550048828125, 0.21795654296875, 0.228363037109375, 0.23876953125, 0.249176025390625, 0.25958251953125, 0.269989013671875, 0.2803955078125, 0.290802001953125, 0.30120849609375, 0.311614990234375, 0.322021484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 7.0, 16.0, 36.0, 59.0, 83.0, 149.0, 265.0, 556.0, 1339.0, 4084.0, 19763.0, 252948.0, 3778416.0, 118050.0, 13337.0, 3059.0, 1052.0, 453.0, 278.0, 137.0, 67.0, 52.0, 32.0, 12.0, 4.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82666015625, -0.7897262573242188, -0.7527923583984375, -0.7158584594726562, -0.678924560546875, -0.6419906616210938, -0.6050567626953125, -0.5681228637695312, -0.53118896484375, -0.49425506591796875, -0.4573211669921875, -0.42038726806640625, -0.383453369140625, -0.34651947021484375, -0.3095855712890625, -0.27265167236328125, -0.2357177734375, -0.19878387451171875, -0.1618499755859375, -0.12491607666015625, -0.087982177734375, -0.05104827880859375, -0.0141143798828125, 0.02281951904296875, 0.05975341796875, 0.09668731689453125, 0.1336212158203125, 0.17055511474609375, 0.207489013671875, 0.24442291259765625, 0.2813568115234375, 0.31829071044921875, 0.355224609375, 0.39215850830078125, 0.4290924072265625, 0.46602630615234375, 0.502960205078125, 0.5398941040039062, 0.5768280029296875, 0.6137619018554688, 0.65069580078125, 0.6876296997070312, 0.7245635986328125, 0.7614974975585938, 0.798431396484375, 0.8353652954101562, 0.8722991943359375, 0.9092330932617188, 0.9461669921875, 0.9831008911132812, 1.0200347900390625, 1.0569686889648438, 1.093902587890625, 1.1308364868164062, 1.1677703857421875, 1.2047042846679688, 1.24163818359375, 1.2785720825195312, 1.3155059814453125, 1.3524398803710938, 1.389373779296875, 1.4263076782226562, 1.4632415771484375, 1.5001754760742188, 1.537109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 0.0, 6.0, 7.0, 6.0, 14.0, 14.0, 25.0, 24.0, 42.0, 54.0, 71.0, 129.0, 181.0, 348.0, 728.0, 1186.0, 488.0, 243.0, 148.0, 98.0, 75.0, 52.0, 32.0, 17.0, 10.0, 15.0, 10.0, 10.0, 8.0, 8.0, 4.0, 7.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15862655639648438, -0.15258026123046875, -0.14653396606445312, -0.1404876708984375, -0.13444137573242188, -0.12839508056640625, -0.12234878540039062, -0.116302490234375, -0.11025619506835938, -0.10420989990234375, -0.09816360473632812, -0.0921173095703125, -0.08607101440429688, -0.08002471923828125, -0.07397842407226562, -0.06793212890625, -0.061885833740234375, -0.05583953857421875, -0.049793243408203125, -0.0437469482421875, -0.037700653076171875, -0.03165435791015625, -0.025608062744140625, -0.019561767578125, -0.013515472412109375, -0.00746917724609375, -0.001422882080078125, 0.0046234130859375, 0.010669708251953125, 0.01671600341796875, 0.022762298583984375, 0.02880859375, 0.034854888916015625, 0.04090118408203125, 0.046947479248046875, 0.0529937744140625, 0.059040069580078125, 0.06508636474609375, 0.07113265991210938, 0.077178955078125, 0.08322525024414062, 0.08927154541015625, 0.09531784057617188, 0.1013641357421875, 0.10741043090820312, 0.11345672607421875, 0.11950302124023438, 0.12554931640625, 0.13159561157226562, 0.13764190673828125, 0.14368820190429688, 0.1497344970703125, 0.15578079223632812, 0.16182708740234375, 0.16787338256835938, 0.173919677734375, 0.17996597290039062, 0.18601226806640625, 0.19205856323242188, 0.1981048583984375, 0.20415115356445312, 0.21019744873046875, 0.21624374389648438, 0.2222900390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 36.0, 345.0, 502.0, 80.0, 15.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.457648515701294, -2.3593242168426514, -2.260999917984009, -2.1626758575439453, -2.0643515586853027, -1.9660272598266602, -1.8677029609680176, -1.769378662109375, -1.671054482460022, -1.5727301836013794, -1.4744060039520264, -1.3760817050933838, -1.2777574062347412, -1.1794332265853882, -1.0811089277267456, -0.9827846884727478, -0.88446044921875, -0.7861362099647522, -0.6878119707107544, -0.5894876718521118, -0.491163432598114, -0.3928391933441162, -0.29451489448547363, -0.19619065523147583, -0.09786641597747803, 0.00045783817768096924, 0.09878209233283997, 0.19710636138916016, 0.29543060064315796, 0.39375483989715576, 0.49207913875579834, 0.5904033780097961, 0.688727617263794, 0.7870518565177917, 0.8853760957717896, 0.9837003946304321, 1.0820245742797852, 1.1803488731384277, 1.2786731719970703, 1.376997470855713, 1.475321650505066, 1.5736459493637085, 1.6719701290130615, 1.770294427871704, 1.8686187267303467, 1.9669429063796997, 2.0652670860290527, 2.1635913848876953, 2.261915683746338, 2.3602399826049805, 2.458564281463623, 2.5568885803222656, 2.655212640762329, 2.7535369396209717, 2.8518612384796143, 2.950185537338257, 3.0485095977783203, 3.146833896636963, 3.2451581954956055, 3.343482494354248, 3.4418065547943115, 3.540130853652954, 3.6384551525115967, 3.7367794513702393, 3.835103750228882]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 16.0, 22.0, 34.0, 46.0, 45.0, 66.0, 70.0, 87.0, 97.0, 86.0, 87.0, 67.0, 51.0, 52.0, 39.0, 31.0, 16.0, 14.0, 17.0, 10.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1305944919586182, -1.0897785425186157, -1.0489625930786133, -1.0081465244293213, -0.9673305749893188, -0.9265146255493164, -0.8856986165046692, -0.844882607460022, -0.8040666580200195, -0.7632507085800171, -0.7224346995353699, -0.6816186904907227, -0.6408027410507202, -0.5999867916107178, -0.5591707825660706, -0.5183547735214233, -0.4775388240814209, -0.43672284483909607, -0.39590686559677124, -0.3550908863544464, -0.3142749071121216, -0.27345892786979675, -0.23264294862747192, -0.1918269693851471, -0.15101099014282227, -0.11019501090049744, -0.06937903165817261, -0.02856305241584778, 0.01225292682647705, 0.05306890606880188, 0.09388488531112671, 0.13470086455345154, 0.17551672458648682, 0.21633270382881165, 0.2571486830711365, 0.2979646623134613, 0.33878064155578613, 0.37959662079811096, 0.4204126000404358, 0.4612285792827606, 0.5020445585250854, 0.5428605079650879, 0.5836765170097351, 0.6244925260543823, 0.6653084754943848, 0.7061244249343872, 0.7469404339790344, 0.7877564430236816, 0.8285723924636841, 0.8693883419036865, 0.9102043509483337, 0.951020359992981, 0.9918363094329834, 1.0326522588729858, 1.0734682083129883, 1.1142842769622803, 1.1551002264022827, 1.1959161758422852, 1.2367322444915771, 1.2775481939315796, 1.318364143371582, 1.3591800928115845, 1.399996042251587, 1.440812110900879, 1.4816280603408813]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 9.0, 14.0, 10.0, 25.0, 40.0, 58.0, 83.0, 113.0, 169.0, 250.0, 327.0, 567.0, 867.0, 1339.0, 2332.0, 5129.0, 13363.0, 62194.0, 896346.0, 43619.0, 11369.0, 4480.0, 2165.0, 1230.0, 823.0, 543.0, 342.0, 219.0, 157.0, 122.0, 66.0, 45.0, 35.0, 20.0, 13.0, 16.0, 15.0, 4.0, 5.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880859375, -1.816925048828125, -1.75299072265625, -1.689056396484375, -1.6251220703125, -1.561187744140625, -1.49725341796875, -1.433319091796875, -1.369384765625, -1.305450439453125, -1.24151611328125, -1.177581787109375, -1.1136474609375, -1.049713134765625, -0.98577880859375, -0.921844482421875, -0.85791015625, -0.793975830078125, -0.73004150390625, -0.666107177734375, -0.6021728515625, -0.538238525390625, -0.47430419921875, -0.410369873046875, -0.346435546875, -0.282501220703125, -0.21856689453125, -0.154632568359375, -0.0906982421875, -0.026763916015625, 0.03717041015625, 0.101104736328125, 0.1650390625, 0.228973388671875, 0.29290771484375, 0.356842041015625, 0.4207763671875, 0.484710693359375, 0.54864501953125, 0.612579345703125, 0.676513671875, 0.740447998046875, 0.80438232421875, 0.868316650390625, 0.9322509765625, 0.996185302734375, 1.06011962890625, 1.124053955078125, 1.18798828125, 1.251922607421875, 1.31585693359375, 1.379791259765625, 1.4437255859375, 1.507659912109375, 1.57159423828125, 1.635528564453125, 1.699462890625, 1.763397216796875, 1.82733154296875, 1.891265869140625, 1.9552001953125, 2.019134521484375, 2.08306884765625, 2.147003173828125, 2.2109375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 9.0, 10.0, 13.0, 10.0, 15.0, 32.0, 141.0, 419.0, 228.0, 32.0, 22.0, 17.0, 11.0, 10.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.370361328125, -0.3599510192871094, -0.34954071044921875, -0.3391304016113281, -0.3287200927734375, -0.3183097839355469, -0.30789947509765625, -0.2974891662597656, -0.287078857421875, -0.2766685485839844, -0.26625823974609375, -0.2558479309082031, -0.2454376220703125, -0.23502731323242188, -0.22461700439453125, -0.21420669555664062, -0.20379638671875, -0.19338607788085938, -0.18297576904296875, -0.17256546020507812, -0.1621551513671875, -0.15174484252929688, -0.14133453369140625, -0.13092422485351562, -0.120513916015625, -0.11010360717773438, -0.09969329833984375, -0.08928298950195312, -0.0788726806640625, -0.06846237182617188, -0.05805206298828125, -0.047641754150390625, -0.0372314453125, -0.026821136474609375, -0.01641082763671875, -0.006000518798828125, 0.0044097900390625, 0.014820098876953125, 0.02523040771484375, 0.035640716552734375, 0.046051025390625, 0.056461334228515625, 0.06687164306640625, 0.07728195190429688, 0.0876922607421875, 0.09810256958007812, 0.10851287841796875, 0.11892318725585938, 0.12933349609375, 0.13974380493164062, 0.15015411376953125, 0.16056442260742188, 0.1709747314453125, 0.18138504028320312, 0.19179534912109375, 0.20220565795898438, 0.212615966796875, 0.22302627563476562, 0.23343658447265625, 0.24384689331054688, 0.2542572021484375, 0.2646675109863281, 0.27507781982421875, 0.2854881286621094, 0.2958984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 7.0, 10.0, 15.0, 22.0, 37.0, 44.0, 76.0, 97.0, 189.0, 326.0, 574.0, 1297.0, 3145.0, 10463.0, 45542.0, 340775.0, 548936.0, 74711.0, 14685.0, 4351.0, 1591.0, 739.0, 312.0, 215.0, 122.0, 81.0, 40.0, 45.0, 30.0, 9.0, 12.0, 13.0, 10.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91015625, -0.8818359375, -0.853515625, -0.8251953125, -0.796875, -0.7685546875, -0.740234375, -0.7119140625, -0.68359375, -0.6552734375, -0.626953125, -0.5986328125, -0.5703125, -0.5419921875, -0.513671875, -0.4853515625, -0.45703125, -0.4287109375, -0.400390625, -0.3720703125, -0.34375, -0.3154296875, -0.287109375, -0.2587890625, -0.23046875, -0.2021484375, -0.173828125, -0.1455078125, -0.1171875, -0.0888671875, -0.060546875, -0.0322265625, -0.00390625, 0.0244140625, 0.052734375, 0.0810546875, 0.109375, 0.1376953125, 0.166015625, 0.1943359375, 0.22265625, 0.2509765625, 0.279296875, 0.3076171875, 0.3359375, 0.3642578125, 0.392578125, 0.4208984375, 0.44921875, 0.4775390625, 0.505859375, 0.5341796875, 0.5625, 0.5908203125, 0.619140625, 0.6474609375, 0.67578125, 0.7041015625, 0.732421875, 0.7607421875, 0.7890625, 0.8173828125, 0.845703125, 0.8740234375, 0.90234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 7.0, 6.0, 12.0, 18.0, 18.0, 32.0, 27.0, 42.0, 47.0, 34.0, 42.0, 59.0, 57.0, 60.0, 70.0, 58.0, 55.0, 61.0, 50.0, 46.0, 35.0, 38.0, 33.0, 19.0, 19.0, 11.0, 13.0, 8.0, 7.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.8742523193359375, -0.848114013671875, -0.8219757080078125, -0.79583740234375, -0.7696990966796875, -0.743560791015625, -0.7174224853515625, -0.6912841796875, -0.6651458740234375, -0.639007568359375, -0.6128692626953125, -0.58673095703125, -0.5605926513671875, -0.534454345703125, -0.5083160400390625, -0.482177734375, -0.4560394287109375, -0.429901123046875, -0.4037628173828125, -0.37762451171875, -0.3514862060546875, -0.325347900390625, -0.2992095947265625, -0.2730712890625, -0.2469329833984375, -0.220794677734375, -0.1946563720703125, -0.16851806640625, -0.1423797607421875, -0.116241455078125, -0.0901031494140625, -0.06396484375, -0.0378265380859375, -0.011688232421875, 0.0144500732421875, 0.04058837890625, 0.0667266845703125, 0.092864990234375, 0.1190032958984375, 0.1451416015625, 0.1712799072265625, 0.197418212890625, 0.2235565185546875, 0.24969482421875, 0.2758331298828125, 0.301971435546875, 0.3281097412109375, 0.354248046875, 0.3803863525390625, 0.406524658203125, 0.4326629638671875, 0.45880126953125, 0.4849395751953125, 0.511077880859375, 0.5372161865234375, 0.5633544921875, 0.5894927978515625, 0.615631103515625, 0.6417694091796875, 0.66790771484375, 0.6940460205078125, 0.720184326171875, 0.7463226318359375, 0.7724609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 17.0, 19.0, 30.0, 46.0, 107.0, 197.0, 489.0, 1725.0, 12581.0, 971253.0, 57446.0, 3383.0, 707.0, 244.0, 119.0, 70.0, 39.0, 27.0, 13.0, 11.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.75, -2.675079345703125, -2.60015869140625, -2.525238037109375, -2.4503173828125, -2.375396728515625, -2.30047607421875, -2.225555419921875, -2.150634765625, -2.075714111328125, -2.00079345703125, -1.925872802734375, -1.8509521484375, -1.776031494140625, -1.70111083984375, -1.626190185546875, -1.55126953125, -1.476348876953125, -1.40142822265625, -1.326507568359375, -1.2515869140625, -1.176666259765625, -1.10174560546875, -1.026824951171875, -0.951904296875, -0.876983642578125, -0.80206298828125, -0.727142333984375, -0.6522216796875, -0.577301025390625, -0.50238037109375, -0.427459716796875, -0.3525390625, -0.277618408203125, -0.20269775390625, -0.127777099609375, -0.0528564453125, 0.022064208984375, 0.09698486328125, 0.171905517578125, 0.246826171875, 0.321746826171875, 0.39666748046875, 0.471588134765625, 0.5465087890625, 0.621429443359375, 0.69635009765625, 0.771270751953125, 0.84619140625, 0.921112060546875, 0.99603271484375, 1.070953369140625, 1.1458740234375, 1.220794677734375, 1.29571533203125, 1.370635986328125, 1.445556640625, 1.520477294921875, 1.59539794921875, 1.670318603515625, 1.7452392578125, 1.820159912109375, 1.89508056640625, 1.970001220703125, 2.044921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 14.0, 11.0, 20.0, 30.0, 41.0, 90.0, 153.0, 225.0, 147.0, 99.0, 30.0, 31.0, 22.0, 14.0, 15.0, 12.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014978554099798203, -0.00014579109847545624, -0.00014179665595293045, -0.00013780221343040466, -0.00013380777090787888, -0.0001298133283853531, -0.0001258188858628273, -0.00012182444334030151, -0.00011783000081777573, -0.00011383555829524994, -0.00010984111577272415, -0.00010584667325019836, -0.00010185223072767258, -9.785778820514679e-05, -9.3863345682621e-05, -8.986890316009521e-05, -8.587446063756943e-05, -8.188001811504364e-05, -7.788557559251785e-05, -7.389113306999207e-05, -6.989669054746628e-05, -6.590224802494049e-05, -6.19078055024147e-05, -5.7913362979888916e-05, -5.391892045736313e-05, -4.992447793483734e-05, -4.5930035412311554e-05, -4.1935592889785767e-05, -3.794115036725998e-05, -3.394670784473419e-05, -2.9952265322208405e-05, -2.5957822799682617e-05, -2.196338027715683e-05, -1.7968937754631042e-05, -1.3974495232105255e-05, -9.980052709579468e-06, -5.98561018705368e-06, -1.991167664527893e-06, 2.0032748579978943e-06, 5.997717380523682e-06, 9.992159903049469e-06, 1.3986602425575256e-05, 1.7981044948101044e-05, 2.197548747062683e-05, 2.596992999315262e-05, 2.9964372515678406e-05, 3.395881503820419e-05, 3.795325756072998e-05, 4.194770008325577e-05, 4.5942142605781555e-05, 4.993658512830734e-05, 5.393102765083313e-05, 5.792547017335892e-05, 6.19199126958847e-05, 6.591435521841049e-05, 6.990879774093628e-05, 7.390324026346207e-05, 7.789768278598785e-05, 8.189212530851364e-05, 8.588656783103943e-05, 8.988101035356522e-05, 9.3875452876091e-05, 9.786989539861679e-05, 0.00010186433792114258]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 9.0, 8.0, 14.0, 25.0, 30.0, 59.0, 104.0, 171.0, 325.0, 720.0, 1899.0, 8328.0, 109376.0, 881708.0, 38410.0, 4840.0, 1319.0, 581.0, 222.0, 165.0, 94.0, 57.0, 21.0, 21.0, 15.0, 8.0, 7.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2197265625, -1.1820068359375, -1.144287109375, -1.1065673828125, -1.06884765625, -1.0311279296875, -0.993408203125, -0.9556884765625, -0.91796875, -0.8802490234375, -0.842529296875, -0.8048095703125, -0.76708984375, -0.7293701171875, -0.691650390625, -0.6539306640625, -0.6162109375, -0.5784912109375, -0.540771484375, -0.5030517578125, -0.46533203125, -0.4276123046875, -0.389892578125, -0.3521728515625, -0.314453125, -0.2767333984375, -0.239013671875, -0.2012939453125, -0.16357421875, -0.1258544921875, -0.088134765625, -0.0504150390625, -0.0126953125, 0.0250244140625, 0.062744140625, 0.1004638671875, 0.13818359375, 0.1759033203125, 0.213623046875, 0.2513427734375, 0.2890625, 0.3267822265625, 0.364501953125, 0.4022216796875, 0.43994140625, 0.4776611328125, 0.515380859375, 0.5531005859375, 0.5908203125, 0.6285400390625, 0.666259765625, 0.7039794921875, 0.74169921875, 0.7794189453125, 0.817138671875, 0.8548583984375, 0.892578125, 0.9302978515625, 0.968017578125, 1.0057373046875, 1.04345703125, 1.0811767578125, 1.118896484375, 1.1566162109375, 1.1943359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 10.0, 23.0, 35.0, 79.0, 102.0, 161.0, 176.0, 169.0, 96.0, 63.0, 24.0, 19.0, 13.0, 7.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.7612686157226562, -0.7300567626953125, -0.6988449096679688, -0.667633056640625, -0.6364212036132812, -0.6052093505859375, -0.5739974975585938, -0.54278564453125, -0.5115737915039062, -0.4803619384765625, -0.44915008544921875, -0.417938232421875, -0.38672637939453125, -0.3555145263671875, -0.32430267333984375, -0.2930908203125, -0.26187896728515625, -0.2306671142578125, -0.19945526123046875, -0.168243408203125, -0.13703155517578125, -0.1058197021484375, -0.07460784912109375, -0.04339599609375, -0.01218414306640625, 0.0190277099609375, 0.05023956298828125, 0.081451416015625, 0.11266326904296875, 0.1438751220703125, 0.17508697509765625, 0.206298828125, 0.23751068115234375, 0.2687225341796875, 0.29993438720703125, 0.331146240234375, 0.36235809326171875, 0.3935699462890625, 0.42478179931640625, 0.45599365234375, 0.48720550537109375, 0.5184173583984375, 0.5496292114257812, 0.580841064453125, 0.6120529174804688, 0.6432647705078125, 0.6744766235351562, 0.7056884765625, 0.7369003295898438, 0.7681121826171875, 0.7993240356445312, 0.830535888671875, 0.8617477416992188, 0.8929595947265625, 0.9241714477539062, 0.95538330078125, 0.9865951538085938, 1.0178070068359375, 1.0490188598632812, 1.080230712890625, 1.1114425659179688, 1.1426544189453125, 1.1738662719726562, 1.205078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 33.0, 294.0, 532.0, 106.0, 18.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.770467758178711, -8.28856086730957, -7.8066534996032715, -7.324746608734131, -6.842839241027832, -6.360932350158691, -5.879025459289551, -5.397118091583252, -4.915210723876953, -4.4333038330078125, -3.9513964653015137, -3.469489574432373, -2.987582206726074, -2.5056753158569336, -2.023768186569214, -1.5418610572814941, -1.0599541664123535, -0.5780470371246338, -0.09613996744155884, 0.3857671022415161, 0.8676742315292358, 1.349581241607666, 1.8314883708953857, 2.3133955001831055, 2.795302629470825, 3.277209758758545, 3.7591168880462646, 4.241024017333984, 4.722930908203125, 5.204837799072266, 5.6867451667785645, 6.168652534484863, 6.650559425354004, 7.1324663162231445, 7.614373683929443, 8.096281051635742, 8.578187942504883, 9.060094833374023, 9.542001724243164, 10.023908615112305, 10.505816459655762, 10.987723350524902, 11.469630241394043, 11.9515380859375, 12.43344497680664, 12.915351867675781, 13.397258758544922, 13.879165649414062, 14.361072540283203, 14.842979431152344, 15.324886322021484, 15.806794166564941, 16.288700103759766, 16.770606994628906, 17.25251579284668, 17.73442268371582, 18.21632957458496, 18.6982364654541, 19.180143356323242, 19.662050247192383, 20.143957138061523, 20.625865936279297, 21.107772827148438, 21.589679718017578, 22.07158660888672]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 6.0, 4.0, 5.0, 13.0, 14.0, 14.0, 31.0, 34.0, 49.0, 47.0, 60.0, 75.0, 93.0, 85.0, 78.0, 89.0, 57.0, 59.0, 55.0, 34.0, 20.0, 18.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.724906921386719, -6.502395153045654, -6.279883861541748, -6.057372093200684, -5.834860324859619, -5.612348556518555, -5.389837265014648, -5.167325496673584, -4.9448137283325195, -4.722301959991455, -4.499790668487549, -4.277278900146484, -4.05476713180542, -3.8322556018829346, -3.609744071960449, -3.3872323036193848, -3.1647207736968994, -2.942209243774414, -2.7196974754333496, -2.4971859455108643, -2.2746741771698, -2.0521626472473145, -1.8296509981155396, -1.6071393489837646, -1.3846276998519897, -1.1621160507202148, -0.9396044015884399, -0.7170928120613098, -0.4945811629295349, -0.2720695734024048, -0.04955792427062988, 0.17295372486114502, 0.3954653739929199, 0.6179770231246948, 0.8404886722564697, 1.063000202178955, 1.2855119705200195, 1.5080235004425049, 1.7305351495742798, 1.9530467987060547, 2.175558567047119, 2.3980700969696045, 2.620581865310669, 2.8430933952331543, 3.0656051635742188, 3.288116693496704, 3.5106282234191895, 3.733139991760254, 3.9556515216827393, 4.178163051605225, 4.400674819946289, 4.6231865882873535, 4.84569787979126, 5.068209648132324, 5.290721416473389, 5.513233184814453, 5.735744476318359, 5.958256244659424, 6.18076753616333, 6.4032793045043945, 6.625791072845459, 6.848302841186523, 7.07081413269043, 7.293325901031494, 7.515837669372559]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 8.0, 19.0, 27.0, 24.0, 47.0, 56.0, 71.0, 92.0, 139.0, 202.0, 266.0, 429.0, 879.0, 2180.0, 8181.0, 4019954.0, 153167.0, 5300.0, 1585.0, 612.0, 316.0, 189.0, 129.0, 108.0, 59.0, 55.0, 46.0, 30.0, 24.0, 17.0, 12.0, 15.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9140625, -7.66595458984375, -7.4178466796875, -7.16973876953125, -6.921630859375, -6.67352294921875, -6.4254150390625, -6.17730712890625, -5.92919921875, -5.68109130859375, -5.4329833984375, -5.18487548828125, -4.936767578125, -4.68865966796875, -4.4405517578125, -4.19244384765625, -3.9443359375, -3.69622802734375, -3.4481201171875, -3.20001220703125, -2.951904296875, -2.70379638671875, -2.4556884765625, -2.20758056640625, -1.95947265625, -1.71136474609375, -1.4632568359375, -1.21514892578125, -0.967041015625, -0.71893310546875, -0.4708251953125, -0.22271728515625, 0.025390625, 0.27349853515625, 0.5216064453125, 0.76971435546875, 1.017822265625, 1.26593017578125, 1.5140380859375, 1.76214599609375, 2.01025390625, 2.25836181640625, 2.5064697265625, 2.75457763671875, 3.002685546875, 3.25079345703125, 3.4989013671875, 3.74700927734375, 3.9951171875, 4.24322509765625, 4.4913330078125, 4.73944091796875, 4.987548828125, 5.23565673828125, 5.4837646484375, 5.73187255859375, 5.97998046875, 6.22808837890625, 6.4761962890625, 6.72430419921875, 6.972412109375, 7.22052001953125, 7.4686279296875, 7.71673583984375, 7.96484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 15.0, 27.0, 75.0, 221.0, 337.0, 184.0, 47.0, 17.0, 16.0, 13.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.325531005859375, -0.31512451171875, -0.304718017578125, -0.2943115234375, -0.283905029296875, -0.27349853515625, -0.263092041015625, -0.252685546875, -0.242279052734375, -0.23187255859375, -0.221466064453125, -0.2110595703125, -0.200653076171875, -0.19024658203125, -0.179840087890625, -0.16943359375, -0.159027099609375, -0.14862060546875, -0.138214111328125, -0.1278076171875, -0.117401123046875, -0.10699462890625, -0.096588134765625, -0.086181640625, -0.075775146484375, -0.06536865234375, -0.054962158203125, -0.0445556640625, -0.034149169921875, -0.02374267578125, -0.013336181640625, -0.0029296875, 0.007476806640625, 0.01788330078125, 0.028289794921875, 0.0386962890625, 0.049102783203125, 0.05950927734375, 0.069915771484375, 0.080322265625, 0.090728759765625, 0.10113525390625, 0.111541748046875, 0.1219482421875, 0.132354736328125, 0.14276123046875, 0.153167724609375, 0.16357421875, 0.173980712890625, 0.18438720703125, 0.194793701171875, 0.2052001953125, 0.215606689453125, 0.22601318359375, 0.236419677734375, 0.246826171875, 0.257232666015625, 0.26763916015625, 0.278045654296875, 0.2884521484375, 0.298858642578125, 0.30926513671875, 0.319671630859375, 0.330078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 7.0, 8.0, 13.0, 11.0, 24.0, 33.0, 31.0, 58.0, 172.0, 897.0, 36795.0, 4150963.0, 4636.0, 369.0, 116.0, 59.0, 25.0, 14.0, 13.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -4.99359130859375, -4.7879638671875, -4.58233642578125, -4.376708984375, -4.17108154296875, -3.9654541015625, -3.75982666015625, -3.55419921875, -3.34857177734375, -3.1429443359375, -2.93731689453125, -2.731689453125, -2.52606201171875, -2.3204345703125, -2.11480712890625, -1.9091796875, -1.70355224609375, -1.4979248046875, -1.29229736328125, -1.086669921875, -0.88104248046875, -0.6754150390625, -0.46978759765625, -0.26416015625, -0.05853271484375, 0.1470947265625, 0.35272216796875, 0.558349609375, 0.76397705078125, 0.9696044921875, 1.17523193359375, 1.380859375, 1.58648681640625, 1.7921142578125, 1.99774169921875, 2.203369140625, 2.40899658203125, 2.6146240234375, 2.82025146484375, 3.02587890625, 3.23150634765625, 3.4371337890625, 3.64276123046875, 3.848388671875, 4.05401611328125, 4.2596435546875, 4.46527099609375, 4.6708984375, 4.87652587890625, 5.0821533203125, 5.28778076171875, 5.493408203125, 5.69903564453125, 5.9046630859375, 6.11029052734375, 6.31591796875, 6.52154541015625, 6.7271728515625, 6.93280029296875, 7.138427734375, 7.34405517578125, 7.5496826171875, 7.75531005859375, 7.9609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 9.0, 22.0, 27.0, 49.0, 69.0, 200.0, 755.0, 2178.0, 419.0, 125.0, 58.0, 39.0, 25.0, 24.0, 9.0, 13.0, 11.0, 6.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.42852020263671875, -0.4173431396484375, -0.40616607666015625, -0.394989013671875, -0.38381195068359375, -0.3726348876953125, -0.36145782470703125, -0.35028076171875, -0.33910369873046875, -0.3279266357421875, -0.31674957275390625, -0.305572509765625, -0.29439544677734375, -0.2832183837890625, -0.27204132080078125, -0.2608642578125, -0.24968719482421875, -0.2385101318359375, -0.22733306884765625, -0.216156005859375, -0.20497894287109375, -0.1938018798828125, -0.18262481689453125, -0.17144775390625, -0.16027069091796875, -0.1490936279296875, -0.13791656494140625, -0.126739501953125, -0.11556243896484375, -0.1043853759765625, -0.09320831298828125, -0.08203125, -0.07085418701171875, -0.0596771240234375, -0.04850006103515625, -0.037322998046875, -0.02614593505859375, -0.0149688720703125, -0.00379180908203125, 0.00738525390625, 0.01856231689453125, 0.0297393798828125, 0.04091644287109375, 0.052093505859375, 0.06327056884765625, 0.0744476318359375, 0.08562469482421875, 0.0968017578125, 0.10797882080078125, 0.1191558837890625, 0.13033294677734375, 0.141510009765625, 0.15268707275390625, 0.1638641357421875, 0.17504119873046875, 0.18621826171875, 0.19739532470703125, 0.2085723876953125, 0.21974945068359375, 0.230926513671875, 0.24210357666015625, 0.2532806396484375, 0.26445770263671875, 0.275634765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 45.0, 242.0, 553.0, 129.0, 23.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7642295360565186, -3.6442859172821045, -3.5243422985076904, -3.4043986797332764, -3.2844550609588623, -3.1645114421844482, -3.0445680618286133, -2.924624443054199, -2.804680824279785, -2.684737205505371, -2.564793586730957, -2.444849967956543, -2.324906349182129, -2.204962730407715, -2.085019111633301, -1.9650756120681763, -1.8451318740844727, -1.7251882553100586, -1.6052446365356445, -1.4853010177612305, -1.3653573989868164, -1.2454137802124023, -1.1254702806472778, -1.0055266618728638, -0.8855830430984497, -0.7656394243240356, -0.6456958055496216, -0.5257522463798523, -0.40580862760543823, -0.28586500883102417, -0.16592144966125488, -0.04597783088684082, 0.07396578788757324, 0.1939093917608261, 0.313852995634079, 0.43379658460617065, 0.5537402033805847, 0.6736838221549988, 0.7936273813247681, 0.9135710000991821, 1.0335146188735962, 1.1534582376480103, 1.2734018564224243, 1.3933453559875488, 1.513288974761963, 1.633232593536377, 1.753176212310791, 1.873119831085205, 1.9930634498596191, 2.113007068634033, 2.2329506874084473, 2.3528943061828613, 2.4728379249572754, 2.5927815437316895, 2.7127251625061035, 2.8326687812805176, 2.9526124000549316, 3.0725560188293457, 3.1924996376037598, 3.312443256378174, 3.432386875152588, 3.552330493927002, 3.672274112701416, 3.79221773147583, 3.912161111831665]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 13.0, 14.0, 26.0, 26.0, 44.0, 69.0, 109.0, 123.0, 116.0, 105.0, 95.0, 82.0, 54.0, 45.0, 33.0, 17.0, 11.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7814204692840576, -1.721726417541504, -1.6620323657989502, -1.6023383140563965, -1.5426442623138428, -1.482950210571289, -1.4232561588287354, -1.3635622262954712, -1.3038681745529175, -1.2441741228103638, -1.18448007106781, -1.1247860193252563, -1.0650919675827026, -1.0053980350494385, -0.94570392370224, -0.886009931564331, -0.8263158202171326, -0.7666217684745789, -0.7069277167320251, -0.6472337245941162, -0.5875396728515625, -0.5278456211090088, -0.4681515693664551, -0.40845754742622375, -0.34876349568367004, -0.28906944394111633, -0.229375422000885, -0.1696813702583313, -0.10998733341693878, -0.050293296575546265, 0.009400755167007446, 0.06909477710723877, 0.12878882884979248, 0.188482865691185, 0.24817690253257751, 0.3078709542751312, 0.36756497621536255, 0.42725902795791626, 0.48695307970046997, 0.5466470718383789, 0.6063411235809326, 0.6660351753234863, 0.72572922706604, 0.7854232788085938, 0.8451172709465027, 0.9048113226890564, 0.9645053744316101, 1.024199366569519, 1.0838935375213623, 1.143587589263916, 1.2032816410064697, 1.2629756927490234, 1.3226697444915771, 1.3823637962341309, 1.4420578479766846, 1.5017517805099487, 1.5614458322525024, 1.6211398839950562, 1.6808339357376099, 1.7405279874801636, 1.8002220392227173, 1.8599159717559814, 1.9196100234985352, 1.9793040752410889, 2.0389981269836426]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 12.0, 12.0, 9.0, 18.0, 24.0, 37.0, 48.0, 69.0, 86.0, 176.0, 249.0, 438.0, 782.0, 1448.0, 3088.0, 10224.0, 198966.0, 805895.0, 18499.0, 4269.0, 1859.0, 913.0, 527.0, 316.0, 177.0, 134.0, 88.0, 45.0, 35.0, 35.0, 16.0, 12.0, 10.0, 8.0, 5.0, 10.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2734375, -2.19805908203125, -2.1226806640625, -2.04730224609375, -1.971923828125, -1.89654541015625, -1.8211669921875, -1.74578857421875, -1.67041015625, -1.59503173828125, -1.5196533203125, -1.44427490234375, -1.368896484375, -1.29351806640625, -1.2181396484375, -1.14276123046875, -1.0673828125, -0.99200439453125, -0.9166259765625, -0.84124755859375, -0.765869140625, -0.69049072265625, -0.6151123046875, -0.53973388671875, -0.46435546875, -0.38897705078125, -0.3135986328125, -0.23822021484375, -0.162841796875, -0.08746337890625, -0.0120849609375, 0.06329345703125, 0.138671875, 0.21405029296875, 0.2894287109375, 0.36480712890625, 0.440185546875, 0.51556396484375, 0.5909423828125, 0.66632080078125, 0.74169921875, 0.81707763671875, 0.8924560546875, 0.96783447265625, 1.043212890625, 1.11859130859375, 1.1939697265625, 1.26934814453125, 1.3447265625, 1.42010498046875, 1.4954833984375, 1.57086181640625, 1.646240234375, 1.72161865234375, 1.7969970703125, 1.87237548828125, 1.94775390625, 2.02313232421875, 2.0985107421875, 2.17388916015625, 2.249267578125, 2.32464599609375, 2.4000244140625, 2.47540283203125, 2.55078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 13.0, 11.0, 34.0, 75.0, 238.0, 306.0, 187.0, 57.0, 29.0, 16.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.32763671875, -0.31780242919921875, -0.3079681396484375, -0.29813385009765625, -0.288299560546875, -0.27846527099609375, -0.2686309814453125, -0.25879669189453125, -0.24896240234375, -0.23912811279296875, -0.2292938232421875, -0.21945953369140625, -0.209625244140625, -0.19979095458984375, -0.1899566650390625, -0.18012237548828125, -0.1702880859375, -0.16045379638671875, -0.1506195068359375, -0.14078521728515625, -0.130950927734375, -0.12111663818359375, -0.1112823486328125, -0.10144805908203125, -0.09161376953125, -0.08177947998046875, -0.0719451904296875, -0.06211090087890625, -0.052276611328125, -0.04244232177734375, -0.0326080322265625, -0.02277374267578125, -0.012939453125, -0.00310516357421875, 0.0067291259765625, 0.01656341552734375, 0.026397705078125, 0.03623199462890625, 0.0460662841796875, 0.05590057373046875, 0.06573486328125, 0.07556915283203125, 0.0854034423828125, 0.09523773193359375, 0.105072021484375, 0.11490631103515625, 0.1247406005859375, 0.13457489013671875, 0.1444091796875, 0.15424346923828125, 0.1640777587890625, 0.17391204833984375, 0.183746337890625, 0.19358062744140625, 0.2034149169921875, 0.21324920654296875, 0.22308349609375, 0.23291778564453125, 0.2427520751953125, 0.25258636474609375, 0.262420654296875, 0.27225494384765625, 0.2820892333984375, 0.29192352294921875, 0.3017578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 9.0, 12.0, 11.0, 14.0, 21.0, 23.0, 38.0, 59.0, 82.0, 118.0, 183.0, 282.0, 476.0, 754.0, 1458.0, 3597.0, 11369.0, 55061.0, 343946.0, 507028.0, 95871.0, 18288.0, 5235.0, 1988.0, 972.0, 546.0, 368.0, 217.0, 141.0, 103.0, 67.0, 53.0, 39.0, 37.0, 19.0, 17.0, 11.0, 12.0, 4.0, 3.0, 1.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.96484375, -0.933868408203125, -0.90289306640625, -0.871917724609375, -0.8409423828125, -0.809967041015625, -0.77899169921875, -0.748016357421875, -0.717041015625, -0.686065673828125, -0.65509033203125, -0.624114990234375, -0.5931396484375, -0.562164306640625, -0.53118896484375, -0.500213623046875, -0.46923828125, -0.438262939453125, -0.40728759765625, -0.376312255859375, -0.3453369140625, -0.314361572265625, -0.28338623046875, -0.252410888671875, -0.221435546875, -0.190460205078125, -0.15948486328125, -0.128509521484375, -0.0975341796875, -0.066558837890625, -0.03558349609375, -0.004608154296875, 0.0263671875, 0.057342529296875, 0.08831787109375, 0.119293212890625, 0.1502685546875, 0.181243896484375, 0.21221923828125, 0.243194580078125, 0.274169921875, 0.305145263671875, 0.33612060546875, 0.367095947265625, 0.3980712890625, 0.429046630859375, 0.46002197265625, 0.490997314453125, 0.52197265625, 0.552947998046875, 0.58392333984375, 0.614898681640625, 0.6458740234375, 0.676849365234375, 0.70782470703125, 0.738800048828125, 0.769775390625, 0.800750732421875, 0.83172607421875, 0.862701416015625, 0.8936767578125, 0.924652099609375, 0.95562744140625, 0.986602783203125, 1.017578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 0.0, 6.0, 4.0, 1.0, 9.0, 9.0, 10.0, 10.0, 8.0, 16.0, 22.0, 16.0, 23.0, 22.0, 28.0, 38.0, 33.0, 27.0, 35.0, 28.0, 47.0, 28.0, 41.0, 38.0, 32.0, 38.0, 43.0, 33.0, 36.0, 34.0, 36.0, 39.0, 30.0, 28.0, 24.0, 19.0, 20.0, 8.0, 15.0, 10.0, 10.0, 8.0, 8.0, 3.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.61962890625, -0.5999755859375, -0.580322265625, -0.5606689453125, -0.541015625, -0.5213623046875, -0.501708984375, -0.4820556640625, -0.46240234375, -0.4427490234375, -0.423095703125, -0.4034423828125, -0.3837890625, -0.3641357421875, -0.344482421875, -0.3248291015625, -0.30517578125, -0.2855224609375, -0.265869140625, -0.2462158203125, -0.2265625, -0.2069091796875, -0.187255859375, -0.1676025390625, -0.14794921875, -0.1282958984375, -0.108642578125, -0.0889892578125, -0.0693359375, -0.0496826171875, -0.030029296875, -0.0103759765625, 0.00927734375, 0.0289306640625, 0.048583984375, 0.0682373046875, 0.087890625, 0.1075439453125, 0.127197265625, 0.1468505859375, 0.16650390625, 0.1861572265625, 0.205810546875, 0.2254638671875, 0.2451171875, 0.2647705078125, 0.284423828125, 0.3040771484375, 0.32373046875, 0.3433837890625, 0.363037109375, 0.3826904296875, 0.40234375, 0.4219970703125, 0.441650390625, 0.4613037109375, 0.48095703125, 0.5006103515625, 0.520263671875, 0.5399169921875, 0.5595703125, 0.5792236328125, 0.598876953125, 0.6185302734375, 0.63818359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 10.0, 12.0, 20.0, 39.0, 60.0, 99.0, 228.0, 468.0, 1207.0, 4292.0, 35236.0, 794023.0, 199157.0, 10142.0, 2098.0, 729.0, 326.0, 162.0, 73.0, 47.0, 28.0, 20.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 7.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9609375, -0.9315948486328125, -0.902252197265625, -0.8729095458984375, -0.84356689453125, -0.8142242431640625, -0.784881591796875, -0.7555389404296875, -0.7261962890625, -0.6968536376953125, -0.667510986328125, -0.6381683349609375, -0.60882568359375, -0.5794830322265625, -0.550140380859375, -0.5207977294921875, -0.491455078125, -0.4621124267578125, -0.432769775390625, -0.4034271240234375, -0.37408447265625, -0.3447418212890625, -0.315399169921875, -0.2860565185546875, -0.2567138671875, -0.2273712158203125, -0.198028564453125, -0.1686859130859375, -0.13934326171875, -0.1100006103515625, -0.080657958984375, -0.0513153076171875, -0.02197265625, 0.0073699951171875, 0.036712646484375, 0.0660552978515625, 0.09539794921875, 0.1247406005859375, 0.154083251953125, 0.1834259033203125, 0.2127685546875, 0.2421112060546875, 0.271453857421875, 0.3007965087890625, 0.33013916015625, 0.3594818115234375, 0.388824462890625, 0.4181671142578125, 0.447509765625, 0.4768524169921875, 0.506195068359375, 0.5355377197265625, 0.56488037109375, 0.5942230224609375, 0.623565673828125, 0.6529083251953125, 0.6822509765625, 0.7115936279296875, 0.740936279296875, 0.7702789306640625, 0.79962158203125, 0.8289642333984375, 0.858306884765625, 0.8876495361328125, 0.9169921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 16.0, 18.0, 19.0, 32.0, 35.0, 45.0, 55.0, 87.0, 120.0, 117.0, 125.0, 79.0, 71.0, 32.0, 25.0, 15.0, 24.0, 15.0, 9.0, 9.0, 12.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002117156982421875, -0.00020559877157211304, -0.00019948184490203857, -0.0001933649182319641, -0.00018724799156188965, -0.00018113106489181519, -0.00017501413822174072, -0.00016889721155166626, -0.0001627802848815918, -0.00015666335821151733, -0.00015054643154144287, -0.0001444295048713684, -0.00013831257820129395, -0.00013219565153121948, -0.00012607872486114502, -0.00011996179819107056, -0.0001138448715209961, -0.00010772794485092163, -0.00010161101818084717, -9.54940915107727e-05, -8.937716484069824e-05, -8.326023817062378e-05, -7.714331150054932e-05, -7.102638483047485e-05, -6.490945816040039e-05, -5.879253149032593e-05, -5.2675604820251465e-05, -4.6558678150177e-05, -4.044175148010254e-05, -3.4324824810028076e-05, -2.8207898139953613e-05, -2.209097146987915e-05, -1.5974044799804688e-05, -9.857118129730225e-06, -3.7401914596557617e-06, 2.376735210418701e-06, 8.493661880493164e-06, 1.4610588550567627e-05, 2.072751522064209e-05, 2.6844441890716553e-05, 3.2961368560791016e-05, 3.907829523086548e-05, 4.519522190093994e-05, 5.1312148571014404e-05, 5.742907524108887e-05, 6.354600191116333e-05, 6.966292858123779e-05, 7.577985525131226e-05, 8.189678192138672e-05, 8.801370859146118e-05, 9.413063526153564e-05, 0.00010024756193161011, 0.00010636448860168457, 0.00011248141527175903, 0.0001185983419418335, 0.00012471526861190796, 0.00013083219528198242, 0.00013694912195205688, 0.00014306604862213135, 0.0001491829752922058, 0.00015529990196228027, 0.00016141682863235474, 0.0001675337553024292, 0.00017365068197250366, 0.00017976760864257812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 11.0, 15.0, 18.0, 17.0, 22.0, 36.0, 62.0, 80.0, 118.0, 171.0, 349.0, 596.0, 1043.0, 2275.0, 6015.0, 25275.0, 191267.0, 677774.0, 117083.0, 17678.0, 4662.0, 1807.0, 883.0, 470.0, 267.0, 163.0, 103.0, 72.0, 52.0, 35.0, 19.0, 28.0, 14.0, 15.0, 11.0, 8.0, 8.0, 5.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55029296875, -0.5338134765625, -0.517333984375, -0.5008544921875, -0.484375, -0.4678955078125, -0.451416015625, -0.4349365234375, -0.41845703125, -0.4019775390625, -0.385498046875, -0.3690185546875, -0.3525390625, -0.3360595703125, -0.319580078125, -0.3031005859375, -0.28662109375, -0.2701416015625, -0.253662109375, -0.2371826171875, -0.220703125, -0.2042236328125, -0.187744140625, -0.1712646484375, -0.15478515625, -0.1383056640625, -0.121826171875, -0.1053466796875, -0.0888671875, -0.0723876953125, -0.055908203125, -0.0394287109375, -0.02294921875, -0.0064697265625, 0.010009765625, 0.0264892578125, 0.04296875, 0.0594482421875, 0.075927734375, 0.0924072265625, 0.10888671875, 0.1253662109375, 0.141845703125, 0.1583251953125, 0.1748046875, 0.1912841796875, 0.207763671875, 0.2242431640625, 0.24072265625, 0.2572021484375, 0.273681640625, 0.2901611328125, 0.306640625, 0.3231201171875, 0.339599609375, 0.3560791015625, 0.37255859375, 0.3890380859375, 0.405517578125, 0.4219970703125, 0.4384765625, 0.4549560546875, 0.471435546875, 0.4879150390625, 0.50439453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 5.0, 11.0, 18.0, 20.0, 27.0, 34.0, 58.0, 59.0, 85.0, 118.0, 115.0, 90.0, 86.0, 73.0, 57.0, 39.0, 25.0, 14.0, 12.0, 11.0, 12.0, 6.0, 4.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3860740661621094, -0.37346649169921875, -0.3608589172363281, -0.3482513427734375, -0.3356437683105469, -0.32303619384765625, -0.3104286193847656, -0.297821044921875, -0.2852134704589844, -0.27260589599609375, -0.2599983215332031, -0.2473907470703125, -0.23478317260742188, -0.22217559814453125, -0.20956802368164062, -0.19696044921875, -0.18435287475585938, -0.17174530029296875, -0.15913772583007812, -0.1465301513671875, -0.13392257690429688, -0.12131500244140625, -0.10870742797851562, -0.096099853515625, -0.08349227905273438, -0.07088470458984375, -0.058277130126953125, -0.0456695556640625, -0.033061981201171875, -0.02045440673828125, -0.007846832275390625, 0.0047607421875, 0.017368316650390625, 0.02997589111328125, 0.042583465576171875, 0.0551910400390625, 0.06779861450195312, 0.08040618896484375, 0.09301376342773438, 0.105621337890625, 0.11822891235351562, 0.13083648681640625, 0.14344406127929688, 0.1560516357421875, 0.16865921020507812, 0.18126678466796875, 0.19387435913085938, 0.20648193359375, 0.21908950805664062, 0.23169708251953125, 0.24430465698242188, 0.2569122314453125, 0.2695198059082031, 0.28212738037109375, 0.2947349548339844, 0.307342529296875, 0.3199501037597656, 0.33255767822265625, 0.3451652526855469, 0.3577728271484375, 0.3703804016113281, 0.38298797607421875, 0.3955955505371094, 0.408203125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 16.0, 156.0, 690.0, 128.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.569157600402832, -10.769261360168457, -9.969365119934082, -9.169468879699707, -8.369572639465332, -7.569676399230957, -6.769779682159424, -5.969883441925049, -5.169987201690674, -4.370090961456299, -3.570194721221924, -2.7702982425689697, -1.9704020023345947, -1.1705057621002197, -0.3706092834472656, 0.4292869567871094, 1.2291831970214844, 2.0290794372558594, 2.8289756774902344, 3.6288721561431885, 4.428768157958984, 5.228664398193359, 6.028561115264893, 6.828457355499268, 7.628353595733643, 8.428250312805176, 9.22814655303955, 10.028042793273926, 10.8279390335083, 11.627835273742676, 12.42773151397705, 13.227627754211426, 14.027524948120117, 14.827421188354492, 15.627317428588867, 16.427213668823242, 17.227109909057617, 18.027006149291992, 18.826902389526367, 19.626798629760742, 20.426694869995117, 21.226591110229492, 22.026487350463867, 22.826383590698242, 23.626279830932617, 24.426176071166992, 25.226072311401367, 26.025968551635742, 26.82586669921875, 27.625762939453125, 28.4256591796875, 29.225555419921875, 30.02545166015625, 30.825347900390625, 31.625244140625, 32.425140380859375, 33.22503662109375, 34.024932861328125, 34.8248291015625, 35.624725341796875, 36.42462158203125, 37.224517822265625, 38.0244140625, 38.824310302734375, 39.62420654296875]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 20.0, 35.0, 38.0, 41.0, 57.0, 83.0, 81.0, 82.0, 101.0, 103.0, 69.0, 79.0, 46.0, 52.0, 29.0, 20.0, 14.0, 6.0, 9.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.44974136352539, -8.150243759155273, -7.8507466316223145, -7.5512495040893555, -7.2517523765563965, -6.9522552490234375, -6.65275764465332, -6.353260517120361, -6.053763389587402, -5.754266262054443, -5.454768657684326, -5.155271530151367, -4.855774402618408, -4.556277275085449, -4.256779670715332, -3.957282543182373, -3.657784938812256, -3.3582875728607178, -3.058790445327759, -2.7592930793762207, -2.4597959518432617, -2.1602985858917236, -1.8608012199401855, -1.5613040924072266, -1.2618067264556885, -0.9623094797134399, -0.6628121733665466, -0.3633148670196533, -0.06381762027740479, 0.23567962646484375, 0.5351769924163818, 0.8346741199493408, 1.134171485900879, 1.4336687326431274, 1.733165979385376, 2.032663345336914, 2.332160472869873, 2.631657838821411, 2.931155204772949, 3.230652332305908, 3.5301496982574463, 3.8296470642089844, 4.129144191741943, 4.428641319274902, 4.7281389236450195, 5.0276360511779785, 5.3271331787109375, 5.626630783081055, 5.926127910614014, 6.225625038146973, 6.52512264251709, 6.824619770050049, 7.124116897583008, 7.423614501953125, 7.723111629486084, 8.022608757019043, 8.32210636138916, 8.621603965759277, 8.921100616455078, 9.220598220825195, 9.520095825195312, 9.819592475891113, 10.11909008026123, 10.418586730957031, 10.718084335327148]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 32.0, 73.0, 162.0, 525.0, 4597.0, 4184331.0, 3858.0, 440.0, 132.0, 58.0, 29.0, 11.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.38671875, -16.8515625, -16.31640625, -15.78125, -15.24609375, -14.7109375, -14.17578125, -13.640625, -13.10546875, -12.5703125, -12.03515625, -11.5, -10.96484375, -10.4296875, -9.89453125, -9.359375, -8.82421875, -8.2890625, -7.75390625, -7.21875, -6.68359375, -6.1484375, -5.61328125, -5.078125, -4.54296875, -4.0078125, -3.47265625, -2.9375, -2.40234375, -1.8671875, -1.33203125, -0.796875, -0.26171875, 0.2734375, 0.80859375, 1.34375, 1.87890625, 2.4140625, 2.94921875, 3.484375, 4.01953125, 4.5546875, 5.08984375, 5.625, 6.16015625, 6.6953125, 7.23046875, 7.765625, 8.30078125, 8.8359375, 9.37109375, 9.90625, 10.44140625, 10.9765625, 11.51171875, 12.046875, 12.58203125, 13.1171875, 13.65234375, 14.1875, 14.72265625, 15.2578125, 15.79296875, 16.328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 5.0, 15.0, 21.0, 62.0, 129.0, 245.0, 243.0, 149.0, 71.0, 23.0, 10.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.4209442138671875, -0.407806396484375, -0.3946685791015625, -0.38153076171875, -0.3683929443359375, -0.355255126953125, -0.3421173095703125, -0.3289794921875, -0.3158416748046875, -0.302703857421875, -0.2895660400390625, -0.27642822265625, -0.2632904052734375, -0.250152587890625, -0.2370147705078125, -0.223876953125, -0.2107391357421875, -0.197601318359375, -0.1844635009765625, -0.17132568359375, -0.1581878662109375, -0.145050048828125, -0.1319122314453125, -0.1187744140625, -0.1056365966796875, -0.092498779296875, -0.0793609619140625, -0.06622314453125, -0.0530853271484375, -0.039947509765625, -0.0268096923828125, -0.013671875, -0.0005340576171875, 0.012603759765625, 0.0257415771484375, 0.03887939453125, 0.0520172119140625, 0.065155029296875, 0.0782928466796875, 0.0914306640625, 0.1045684814453125, 0.117706298828125, 0.1308441162109375, 0.14398193359375, 0.1571197509765625, 0.170257568359375, 0.1833953857421875, 0.196533203125, 0.2096710205078125, 0.222808837890625, 0.2359466552734375, 0.24908447265625, 0.2622222900390625, 0.275360107421875, 0.2884979248046875, 0.3016357421875, 0.3147735595703125, 0.327911376953125, 0.3410491943359375, 0.35418701171875, 0.3673248291015625, 0.380462646484375, 0.3936004638671875, 0.40673828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 25.0, 23.0, 66.0, 108.0, 176.0, 321.0, 972.0, 4178.0, 36345.0, 3924511.0, 214911.0, 9643.0, 1760.0, 620.0, 284.0, 142.0, 72.0, 44.0, 28.0, 14.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.30853271484375, -2.2401123046875, -2.17169189453125, -2.103271484375, -2.03485107421875, -1.9664306640625, -1.89801025390625, -1.82958984375, -1.76116943359375, -1.6927490234375, -1.62432861328125, -1.555908203125, -1.48748779296875, -1.4190673828125, -1.35064697265625, -1.2822265625, -1.21380615234375, -1.1453857421875, -1.07696533203125, -1.008544921875, -0.94012451171875, -0.8717041015625, -0.80328369140625, -0.73486328125, -0.66644287109375, -0.5980224609375, -0.52960205078125, -0.461181640625, -0.39276123046875, -0.3243408203125, -0.25592041015625, -0.1875, -0.11907958984375, -0.0506591796875, 0.01776123046875, 0.086181640625, 0.15460205078125, 0.2230224609375, 0.29144287109375, 0.35986328125, 0.42828369140625, 0.4967041015625, 0.56512451171875, 0.633544921875, 0.70196533203125, 0.7703857421875, 0.83880615234375, 0.9072265625, 0.97564697265625, 1.0440673828125, 1.11248779296875, 1.180908203125, 1.24932861328125, 1.3177490234375, 1.38616943359375, 1.45458984375, 1.52301025390625, 1.5914306640625, 1.65985107421875, 1.728271484375, 1.79669189453125, 1.8651123046875, 1.93353271484375, 2.001953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 9.0, 15.0, 12.0, 23.0, 39.0, 51.0, 96.0, 173.0, 564.0, 1871.0, 751.0, 229.0, 90.0, 34.0, 33.0, 20.0, 12.0, 13.0, 8.0, 9.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427001953125, -0.4156608581542969, -0.40431976318359375, -0.3929786682128906, -0.3816375732421875, -0.3702964782714844, -0.35895538330078125, -0.3476142883300781, -0.336273193359375, -0.3249320983886719, -0.31359100341796875, -0.3022499084472656, -0.2909088134765625, -0.2795677185058594, -0.26822662353515625, -0.2568855285644531, -0.24554443359375, -0.23420333862304688, -0.22286224365234375, -0.21152114868164062, -0.2001800537109375, -0.18883895874023438, -0.17749786376953125, -0.16615676879882812, -0.154815673828125, -0.14347457885742188, -0.13213348388671875, -0.12079238891601562, -0.1094512939453125, -0.09811019897460938, -0.08676910400390625, -0.07542800903320312, -0.0640869140625, -0.052745819091796875, -0.04140472412109375, -0.030063629150390625, -0.0187225341796875, -0.007381439208984375, 0.00395965576171875, 0.015300750732421875, 0.026641845703125, 0.037982940673828125, 0.04932403564453125, 0.060665130615234375, 0.0720062255859375, 0.08334732055664062, 0.09468841552734375, 0.10602951049804688, 0.11737060546875, 0.12871170043945312, 0.14005279541015625, 0.15139389038085938, 0.1627349853515625, 0.17407608032226562, 0.18541717529296875, 0.19675827026367188, 0.208099365234375, 0.21944046020507812, 0.23078155517578125, 0.24212265014648438, 0.2534637451171875, 0.2648048400878906, 0.27614593505859375, 0.2874870300292969, 0.298828125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 13.0, 51.0, 194.0, 400.0, 237.0, 77.0, 15.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.691003799438477, -4.594726085662842, -4.498447895050049, -4.402170181274414, -4.305892467498779, -4.2096147537231445, -4.113336563110352, -4.017058849334717, -3.920781135559082, -3.824503183364868, -3.7282254695892334, -3.6319475173950195, -3.5356698036193848, -3.439391851425171, -3.343113899230957, -3.2468361854553223, -3.1505582332611084, -3.0542802810668945, -2.9580025672912598, -2.861724615097046, -2.765446901321411, -2.6691689491271973, -2.5728912353515625, -2.4766132831573486, -2.3803353309631348, -2.284057378768921, -2.187779664993286, -2.0915017127990723, -1.9952239990234375, -1.8989460468292236, -1.8026682138442993, -1.706390380859375, -1.6101127862930298, -1.5138349533081055, -1.4175571203231812, -1.3212792873382568, -1.225001335144043, -1.1287236213684082, -1.0324456691741943, -0.93616783618927, -0.8398900032043457, -0.7436121702194214, -0.6473343372344971, -0.551056444644928, -0.45477861166000366, -0.35850077867507935, -0.26222288608551025, -0.16594505310058594, -0.06966722011566162, 0.02661062777042389, 0.1228884756565094, 0.2191663384437561, 0.3154441714286804, 0.41172200441360474, 0.5079998970031738, 0.6042777299880981, 0.7005555629730225, 0.7968333959579468, 0.8931112289428711, 0.9893891215324402, 1.0856668949127197, 1.1819448471069336, 1.278222680091858, 1.3745005130767822, 1.4707783460617065]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 11.0, 15.0, 22.0, 26.0, 31.0, 25.0, 35.0, 48.0, 62.0, 41.0, 66.0, 72.0, 62.0, 54.0, 61.0, 55.0, 45.0, 48.0, 42.0, 35.0, 35.0, 21.0, 18.0, 18.0, 14.0, 12.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3862881660461426, -1.3494021892547607, -1.312516212463379, -1.275630235671997, -1.2387442588806152, -1.2018582820892334, -1.1649723052978516, -1.1280863285064697, -1.091200351715088, -1.054314374923706, -1.0174283981323242, -0.9805424213409424, -0.9436564445495605, -0.9067704677581787, -0.8698844909667969, -0.832998514175415, -0.796112596988678, -0.7592266201972961, -0.7223406434059143, -0.6854546666145325, -0.6485686898231506, -0.6116827130317688, -0.5747967958450317, -0.5379108190536499, -0.5010248422622681, -0.46413886547088623, -0.4272528886795044, -0.39036691188812256, -0.3534809350967407, -0.3165949583053589, -0.27970901131629944, -0.2428230345249176, -0.20593708753585815, -0.16905111074447632, -0.13216513395309448, -0.09527917206287384, -0.058393195271492004, -0.02150721848011017, 0.015378743410110474, 0.05226472020149231, 0.08915069699287415, 0.12603667378425598, 0.16292265057563782, 0.19980861246585846, 0.2366945892572403, 0.27358055114746094, 0.3104665279388428, 0.3473525047302246, 0.38423848152160645, 0.4211244583129883, 0.4580104351043701, 0.49489641189575195, 0.5317823886871338, 0.5686683654785156, 0.6055543422698975, 0.6424403190612793, 0.6793262958526611, 0.716212272644043, 0.7530982494354248, 0.7899842262268066, 0.8268702030181885, 0.8637561798095703, 0.9006421566009521, 0.937528133392334, 0.974414050579071]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 4.0, 6.0, 10.0, 18.0, 11.0, 19.0, 31.0, 36.0, 65.0, 121.0, 241.0, 423.0, 898.0, 2155.0, 6406.0, 70206.0, 925842.0, 33584.0, 5110.0, 1684.0, 784.0, 374.0, 197.0, 89.0, 78.0, 41.0, 34.0, 16.0, 14.0, 9.0, 9.0, 5.0, 9.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -1.998443603515625, -1.93048095703125, -1.862518310546875, -1.7945556640625, -1.726593017578125, -1.65863037109375, -1.590667724609375, -1.522705078125, -1.454742431640625, -1.38677978515625, -1.318817138671875, -1.2508544921875, -1.182891845703125, -1.11492919921875, -1.046966552734375, -0.97900390625, -0.911041259765625, -0.84307861328125, -0.775115966796875, -0.7071533203125, -0.639190673828125, -0.57122802734375, -0.503265380859375, -0.435302734375, -0.367340087890625, -0.29937744140625, -0.231414794921875, -0.1634521484375, -0.095489501953125, -0.02752685546875, 0.040435791015625, 0.1083984375, 0.176361083984375, 0.24432373046875, 0.312286376953125, 0.3802490234375, 0.448211669921875, 0.51617431640625, 0.584136962890625, 0.652099609375, 0.720062255859375, 0.78802490234375, 0.855987548828125, 0.9239501953125, 0.991912841796875, 1.05987548828125, 1.127838134765625, 1.19580078125, 1.263763427734375, 1.33172607421875, 1.399688720703125, 1.4676513671875, 1.535614013671875, 1.60357666015625, 1.671539306640625, 1.739501953125, 1.807464599609375, 1.87542724609375, 1.943389892578125, 2.0113525390625, 2.079315185546875, 2.14727783203125, 2.215240478515625, 2.283203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 31.0, 85.0, 176.0, 221.0, 232.0, 125.0, 62.0, 18.0, 10.0, 4.0, 7.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3962287902832031, -0.38376617431640625, -0.3713035583496094, -0.3588409423828125, -0.3463783264160156, -0.33391571044921875, -0.3214530944824219, -0.308990478515625, -0.2965278625488281, -0.28406524658203125, -0.2716026306152344, -0.2591400146484375, -0.24667739868164062, -0.23421478271484375, -0.22175216674804688, -0.20928955078125, -0.19682693481445312, -0.18436431884765625, -0.17190170288085938, -0.1594390869140625, -0.14697647094726562, -0.13451385498046875, -0.12205123901367188, -0.109588623046875, -0.09712600708007812, -0.08466339111328125, -0.07220077514648438, -0.0597381591796875, -0.047275543212890625, -0.03481292724609375, -0.022350311279296875, -0.0098876953125, 0.002574920654296875, 0.01503753662109375, 0.027500152587890625, 0.0399627685546875, 0.052425384521484375, 0.06488800048828125, 0.07735061645507812, 0.089813232421875, 0.10227584838867188, 0.11473846435546875, 0.12720108032226562, 0.1396636962890625, 0.15212631225585938, 0.16458892822265625, 0.17705154418945312, 0.18951416015625, 0.20197677612304688, 0.21443939208984375, 0.22690200805664062, 0.2393646240234375, 0.2518272399902344, 0.26428985595703125, 0.2767524719238281, 0.289215087890625, 0.3016777038574219, 0.31414031982421875, 0.3266029357910156, 0.3390655517578125, 0.3515281677246094, 0.36399078369140625, 0.3764533996582031, 0.388916015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 7.0, 16.0, 18.0, 20.0, 36.0, 35.0, 36.0, 62.0, 66.0, 89.0, 158.0, 244.0, 341.0, 530.0, 857.0, 1572.0, 3324.0, 8048.0, 25228.0, 107797.0, 412486.0, 363447.0, 88261.0, 21473.0, 7291.0, 3124.0, 1520.0, 852.0, 528.0, 300.0, 201.0, 149.0, 109.0, 68.0, 62.0, 44.0, 30.0, 27.0, 18.0, 16.0, 11.0, 7.0, 6.0, 8.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.779296875, -0.7548904418945312, -0.7304840087890625, -0.7060775756835938, -0.681671142578125, -0.6572647094726562, -0.6328582763671875, -0.6084518432617188, -0.58404541015625, -0.5596389770507812, -0.5352325439453125, -0.5108261108398438, -0.486419677734375, -0.46201324462890625, -0.4376068115234375, -0.41320037841796875, -0.3887939453125, -0.36438751220703125, -0.3399810791015625, -0.31557464599609375, -0.291168212890625, -0.26676177978515625, -0.2423553466796875, -0.21794891357421875, -0.19354248046875, -0.16913604736328125, -0.1447296142578125, -0.12032318115234375, -0.095916748046875, -0.07151031494140625, -0.0471038818359375, -0.02269744873046875, 0.001708984375, 0.02611541748046875, 0.0505218505859375, 0.07492828369140625, 0.099334716796875, 0.12374114990234375, 0.1481475830078125, 0.17255401611328125, 0.19696044921875, 0.22136688232421875, 0.2457733154296875, 0.27017974853515625, 0.294586181640625, 0.31899261474609375, 0.3433990478515625, 0.36780548095703125, 0.3922119140625, 0.41661834716796875, 0.4410247802734375, 0.46543121337890625, 0.489837646484375, 0.5142440795898438, 0.5386505126953125, 0.5630569458007812, 0.58746337890625, 0.6118698120117188, 0.6362762451171875, 0.6606826782226562, 0.685089111328125, 0.7094955444335938, 0.7339019775390625, 0.7583084106445312, 0.78271484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 10.0, 4.0, 5.0, 2.0, 2.0, 9.0, 9.0, 13.0, 15.0, 21.0, 14.0, 20.0, 29.0, 29.0, 41.0, 34.0, 36.0, 39.0, 44.0, 33.0, 44.0, 60.0, 54.0, 41.0, 41.0, 41.0, 40.0, 47.0, 32.0, 30.0, 31.0, 17.0, 25.0, 17.0, 19.0, 8.0, 16.0, 1.0, 7.0, 9.0, 5.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.90576171875, -0.8786773681640625, -0.851593017578125, -0.8245086669921875, -0.79742431640625, -0.7703399658203125, -0.743255615234375, -0.7161712646484375, -0.6890869140625, -0.6620025634765625, -0.634918212890625, -0.6078338623046875, -0.58074951171875, -0.5536651611328125, -0.526580810546875, -0.4994964599609375, -0.472412109375, -0.4453277587890625, -0.418243408203125, -0.3911590576171875, -0.36407470703125, -0.3369903564453125, -0.309906005859375, -0.2828216552734375, -0.2557373046875, -0.2286529541015625, -0.201568603515625, -0.1744842529296875, -0.14739990234375, -0.1203155517578125, -0.093231201171875, -0.0661468505859375, -0.0390625, -0.0119781494140625, 0.015106201171875, 0.0421905517578125, 0.06927490234375, 0.0963592529296875, 0.123443603515625, 0.1505279541015625, 0.1776123046875, 0.2046966552734375, 0.231781005859375, 0.2588653564453125, 0.28594970703125, 0.3130340576171875, 0.340118408203125, 0.3672027587890625, 0.394287109375, 0.4213714599609375, 0.448455810546875, 0.4755401611328125, 0.50262451171875, 0.5297088623046875, 0.556793212890625, 0.5838775634765625, 0.6109619140625, 0.6380462646484375, 0.665130615234375, 0.6922149658203125, 0.71929931640625, 0.7463836669921875, 0.773468017578125, 0.8005523681640625, 0.82763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 9.0, 8.0, 17.0, 63.0, 237.0, 1887.0, 1007727.0, 37827.0, 591.0, 115.0, 33.0, 16.0, 9.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.26165771484375, -3.1678466796875, -3.07403564453125, -2.980224609375, -2.88641357421875, -2.7926025390625, -2.69879150390625, -2.60498046875, -2.51116943359375, -2.4173583984375, -2.32354736328125, -2.229736328125, -2.13592529296875, -2.0421142578125, -1.94830322265625, -1.8544921875, -1.76068115234375, -1.6668701171875, -1.57305908203125, -1.479248046875, -1.38543701171875, -1.2916259765625, -1.19781494140625, -1.10400390625, -1.01019287109375, -0.9163818359375, -0.82257080078125, -0.728759765625, -0.63494873046875, -0.5411376953125, -0.44732666015625, -0.353515625, -0.25970458984375, -0.1658935546875, -0.07208251953125, 0.021728515625, 0.11553955078125, 0.2093505859375, 0.30316162109375, 0.39697265625, 0.49078369140625, 0.5845947265625, 0.67840576171875, 0.772216796875, 0.86602783203125, 0.9598388671875, 1.05364990234375, 1.1474609375, 1.24127197265625, 1.3350830078125, 1.42889404296875, 1.522705078125, 1.61651611328125, 1.7103271484375, 1.80413818359375, 1.89794921875, 1.99176025390625, 2.0855712890625, 2.17938232421875, 2.273193359375, 2.36700439453125, 2.4608154296875, 2.55462646484375, 2.6484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 10.0, 8.0, 14.0, 10.0, 14.0, 24.0, 31.0, 27.0, 32.0, 41.0, 49.0, 63.0, 100.0, 104.0, 91.0, 62.0, 53.0, 43.0, 33.0, 31.0, 27.0, 17.0, 18.0, 14.0, 17.0, 7.0, 8.0, 4.0, 4.0, 6.0, 10.0, 1.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010389089584350586, -0.00010051392018795013, -9.713694453239441e-05, -9.375996887683868e-05, -9.038299322128296e-05, -8.700601756572723e-05, -8.362904191017151e-05, -8.025206625461578e-05, -7.687509059906006e-05, -7.349811494350433e-05, -7.012113928794861e-05, -6.674416363239288e-05, -6.336718797683716e-05, -5.999021232128143e-05, -5.661323666572571e-05, -5.323626101016998e-05, -4.985928535461426e-05, -4.648230969905853e-05, -4.310533404350281e-05, -3.972835838794708e-05, -3.635138273239136e-05, -3.297440707683563e-05, -2.9597431421279907e-05, -2.6220455765724182e-05, -2.2843480110168457e-05, -1.9466504454612732e-05, -1.6089528799057007e-05, -1.2712553143501282e-05, -9.335577487945557e-06, -5.9586018323898315e-06, -2.5816261768341064e-06, 7.953494787216187e-07, 4.172325134277344e-06, 7.549300789833069e-06, 1.0926276445388794e-05, 1.4303252100944519e-05, 1.7680227756500244e-05, 2.105720341205597e-05, 2.4434179067611694e-05, 2.781115472316742e-05, 3.1188130378723145e-05, 3.456510603427887e-05, 3.7942081689834595e-05, 4.131905734539032e-05, 4.4696033000946045e-05, 4.807300865650177e-05, 5.1449984312057495e-05, 5.482695996761322e-05, 5.8203935623168945e-05, 6.158091127872467e-05, 6.49578869342804e-05, 6.833486258983612e-05, 7.171183824539185e-05, 7.508881390094757e-05, 7.84657895565033e-05, 8.184276521205902e-05, 8.521974086761475e-05, 8.859671652317047e-05, 9.19736921787262e-05, 9.535066783428192e-05, 9.872764348983765e-05, 0.00010210461914539337, 0.0001054815948009491, 0.00010885857045650482, 0.00011223554611206055]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 7.0, 5.0, 14.0, 18.0, 30.0, 54.0, 102.0, 209.0, 570.0, 2846.0, 56815.0, 956692.0, 28153.0, 2184.0, 479.0, 146.0, 83.0, 52.0, 34.0, 14.0, 12.0, 5.0, 8.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5068359375, -1.4630584716796875, -1.419281005859375, -1.3755035400390625, -1.33172607421875, -1.2879486083984375, -1.244171142578125, -1.2003936767578125, -1.1566162109375, -1.1128387451171875, -1.069061279296875, -1.0252838134765625, -0.98150634765625, -0.9377288818359375, -0.893951416015625, -0.8501739501953125, -0.806396484375, -0.7626190185546875, -0.718841552734375, -0.6750640869140625, -0.63128662109375, -0.5875091552734375, -0.543731689453125, -0.4999542236328125, -0.4561767578125, -0.4123992919921875, -0.368621826171875, -0.3248443603515625, -0.28106689453125, -0.2372894287109375, -0.193511962890625, -0.1497344970703125, -0.10595703125, -0.0621795654296875, -0.018402099609375, 0.0253753662109375, 0.06915283203125, 0.1129302978515625, 0.156707763671875, 0.2004852294921875, 0.2442626953125, 0.2880401611328125, 0.331817626953125, 0.3755950927734375, 0.41937255859375, 0.4631500244140625, 0.506927490234375, 0.5507049560546875, 0.594482421875, 0.6382598876953125, 0.682037353515625, 0.7258148193359375, 0.76959228515625, 0.8133697509765625, 0.857147216796875, 0.9009246826171875, 0.9447021484375, 0.9884796142578125, 1.032257080078125, 1.0760345458984375, 1.11981201171875, 1.1635894775390625, 1.207366943359375, 1.2511444091796875, 1.294921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 3.0, 12.0, 23.0, 39.0, 58.0, 91.0, 148.0, 173.0, 146.0, 119.0, 66.0, 53.0, 19.0, 12.0, 8.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8780593872070312, -0.8547515869140625, -0.8314437866210938, -0.808135986328125, -0.7848281860351562, -0.7615203857421875, -0.7382125854492188, -0.71490478515625, -0.6915969848632812, -0.6682891845703125, -0.6449813842773438, -0.621673583984375, -0.5983657836914062, -0.5750579833984375, -0.5517501831054688, -0.5284423828125, -0.5051345825195312, -0.4818267822265625, -0.45851898193359375, -0.435211181640625, -0.41190338134765625, -0.3885955810546875, -0.36528778076171875, -0.34197998046875, -0.31867218017578125, -0.2953643798828125, -0.27205657958984375, -0.248748779296875, -0.22544097900390625, -0.2021331787109375, -0.17882537841796875, -0.155517578125, -0.13220977783203125, -0.1089019775390625, -0.08559417724609375, -0.062286376953125, -0.03897857666015625, -0.0156707763671875, 0.00763702392578125, 0.03094482421875, 0.05425262451171875, 0.0775604248046875, 0.10086822509765625, 0.124176025390625, 0.14748382568359375, 0.1707916259765625, 0.19409942626953125, 0.2174072265625, 0.24071502685546875, 0.2640228271484375, 0.28733062744140625, 0.310638427734375, 0.33394622802734375, 0.3572540283203125, 0.38056182861328125, 0.40386962890625, 0.42717742919921875, 0.4504852294921875, 0.47379302978515625, 0.497100830078125, 0.5204086303710938, 0.5437164306640625, 0.5670242309570312, 0.59033203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 8.0, 43.0, 175.0, 460.0, 242.0, 53.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.250714302062988, -5.790975570678711, -5.331236839294434, -4.871498107910156, -4.411759376525879, -3.9520208835601807, -3.4922823905944824, -3.032543659210205, -2.5728049278259277, -2.1130661964416504, -1.6533275842666626, -1.1935889720916748, -0.7338502407073975, -0.2741115093231201, 0.18562698364257812, 0.6453657150268555, 1.1051044464111328, 1.5648431777954102, 2.0245819091796875, 2.4843204021453857, 2.944059133529663, 3.4037978649139404, 3.8635363578796387, 4.323275089263916, 4.783013820648193, 5.242752552032471, 5.702491283416748, 6.162229537963867, 6.6219682693481445, 7.081707000732422, 7.541445732116699, 8.001184463500977, 8.46092414855957, 8.920662879943848, 9.380401611328125, 9.840140342712402, 10.29987907409668, 10.759617805480957, 11.219356536865234, 11.679094314575195, 12.138833999633789, 12.598572731018066, 13.058311462402344, 13.518050193786621, 13.977788925170898, 14.437527656555176, 14.897266387939453, 15.357004165649414, 15.816742897033691, 16.27648162841797, 16.73621940612793, 17.195959091186523, 17.655696868896484, 18.115436553955078, 18.57517433166504, 19.034914016723633, 19.494651794433594, 19.954389572143555, 20.41412925720215, 20.87386703491211, 21.333606719970703, 21.793344497680664, 22.253084182739258, 22.71282196044922, 23.172561645507812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 14.0, 15.0, 14.0, 12.0, 9.0, 16.0, 23.0, 19.0, 24.0, 34.0, 25.0, 29.0, 32.0, 30.0, 41.0, 36.0, 37.0, 34.0, 32.0, 41.0, 36.0, 34.0, 34.0, 32.0, 27.0, 34.0, 40.0, 21.0, 17.0, 21.0, 21.0, 25.0, 15.0, 13.0, 15.0, 12.0, 12.0, 8.0, 3.0, 7.0, 6.0, 7.0, 2.0, 10.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-4.362107753753662, -4.222928047180176, -4.0837483406066895, -3.9445688724517822, -3.805389404296875, -3.6662096977233887, -3.5270299911499023, -3.387850284576416, -3.248670816421509, -3.1094911098480225, -2.9703116416931152, -2.831131935119629, -2.6919522285461426, -2.5527727603912354, -2.413593053817749, -2.274413585662842, -2.1352338790893555, -1.9960542917251587, -1.856874704360962, -1.7176949977874756, -1.5785154104232788, -1.439335823059082, -1.3001561164855957, -1.160976529121399, -1.0217969417572021, -0.8826173543930054, -0.7434377074241638, -0.6042580604553223, -0.4650784730911255, -0.3258988857269287, -0.18671923875808716, -0.047539591789245605, 0.09164047241210938, 0.23082008957862854, 0.3699997067451477, 0.5091793537139893, 0.648358941078186, 0.7875385284423828, 0.9267181754112244, 1.065897822380066, 1.2050774097442627, 1.3442569971084595, 1.4834365844726562, 1.6226162910461426, 1.7617958784103394, 1.9009754657745361, 2.0401551723480225, 2.1793346405029297, 2.318514347076416, 2.4576940536499023, 2.5968735218048096, 2.736053228378296, 2.875232696533203, 3.0144124031066895, 3.153592109680176, 3.292771816253662, 3.4319512844085693, 3.5711309909820557, 3.710310459136963, 3.849490165710449, 3.9886698722839355, 4.127849578857422, 4.26702880859375, 4.406208515167236, 4.545388221740723]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 12.0, 8.0, 14.0, 33.0, 47.0, 101.0, 245.0, 785.0, 3491.0, 627339.0, 3556846.0, 4123.0, 752.0, 263.0, 96.0, 47.0, 23.0, 15.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0390625, -4.88177490234375, -4.7244873046875, -4.56719970703125, -4.409912109375, -4.25262451171875, -4.0953369140625, -3.93804931640625, -3.78076171875, -3.62347412109375, -3.4661865234375, -3.30889892578125, -3.151611328125, -2.99432373046875, -2.8370361328125, -2.67974853515625, -2.5224609375, -2.36517333984375, -2.2078857421875, -2.05059814453125, -1.893310546875, -1.73602294921875, -1.5787353515625, -1.42144775390625, -1.26416015625, -1.10687255859375, -0.9495849609375, -0.79229736328125, -0.635009765625, -0.47772216796875, -0.3204345703125, -0.16314697265625, -0.005859375, 0.15142822265625, 0.3087158203125, 0.46600341796875, 0.623291015625, 0.78057861328125, 0.9378662109375, 1.09515380859375, 1.25244140625, 1.40972900390625, 1.5670166015625, 1.72430419921875, 1.881591796875, 2.03887939453125, 2.1961669921875, 2.35345458984375, 2.5107421875, 2.66802978515625, 2.8253173828125, 2.98260498046875, 3.139892578125, 3.29718017578125, 3.4544677734375, 3.61175537109375, 3.76904296875, 3.92633056640625, 4.0836181640625, 4.24090576171875, 4.398193359375, 4.55548095703125, 4.7127685546875, 4.87005615234375, 5.02734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 9.0, 18.0, 42.0, 68.0, 106.0, 142.0, 153.0, 177.0, 117.0, 77.0, 32.0, 21.0, 14.0, 8.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.410125732421875, -0.39715576171875, -0.384185791015625, -0.3712158203125, -0.358245849609375, -0.34527587890625, -0.332305908203125, -0.3193359375, -0.306365966796875, -0.29339599609375, -0.280426025390625, -0.2674560546875, -0.254486083984375, -0.24151611328125, -0.228546142578125, -0.215576171875, -0.202606201171875, -0.18963623046875, -0.176666259765625, -0.1636962890625, -0.150726318359375, -0.13775634765625, -0.124786376953125, -0.11181640625, -0.098846435546875, -0.08587646484375, -0.072906494140625, -0.0599365234375, -0.046966552734375, -0.03399658203125, -0.021026611328125, -0.008056640625, 0.004913330078125, 0.01788330078125, 0.030853271484375, 0.0438232421875, 0.056793212890625, 0.06976318359375, 0.082733154296875, 0.095703125, 0.108673095703125, 0.12164306640625, 0.134613037109375, 0.1475830078125, 0.160552978515625, 0.17352294921875, 0.186492919921875, 0.199462890625, 0.212432861328125, 0.22540283203125, 0.238372802734375, 0.2513427734375, 0.264312744140625, 0.27728271484375, 0.290252685546875, 0.30322265625, 0.316192626953125, 0.32916259765625, 0.342132568359375, 0.3551025390625, 0.368072509765625, 0.38104248046875, 0.394012451171875, 0.406982421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 19.0, 39.0, 71.0, 140.0, 251.0, 700.0, 2383.0, 15752.0, 2929551.0, 1229436.0, 12537.0, 2223.0, 648.0, 240.0, 121.0, 56.0, 29.0, 18.0, 9.0, 7.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.8598480224609375, -1.799774169921875, -1.7397003173828125, -1.67962646484375, -1.6195526123046875, -1.559478759765625, -1.4994049072265625, -1.4393310546875, -1.3792572021484375, -1.319183349609375, -1.2591094970703125, -1.19903564453125, -1.1389617919921875, -1.078887939453125, -1.0188140869140625, -0.958740234375, -0.8986663818359375, -0.838592529296875, -0.7785186767578125, -0.71844482421875, -0.6583709716796875, -0.598297119140625, -0.5382232666015625, -0.4781494140625, -0.4180755615234375, -0.358001708984375, -0.2979278564453125, -0.23785400390625, -0.1777801513671875, -0.117706298828125, -0.0576324462890625, 0.00244140625, 0.0625152587890625, 0.122589111328125, 0.1826629638671875, 0.24273681640625, 0.3028106689453125, 0.362884521484375, 0.4229583740234375, 0.4830322265625, 0.5431060791015625, 0.603179931640625, 0.6632537841796875, 0.72332763671875, 0.7834014892578125, 0.843475341796875, 0.9035491943359375, 0.963623046875, 1.0236968994140625, 1.083770751953125, 1.1438446044921875, 1.20391845703125, 1.2639923095703125, 1.324066162109375, 1.3841400146484375, 1.4442138671875, 1.5042877197265625, 1.564361572265625, 1.6244354248046875, 1.68450927734375, 1.7445831298828125, 1.804656982421875, 1.8647308349609375, 1.9248046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 16.0, 27.0, 37.0, 59.0, 139.0, 307.0, 1221.0, 1597.0, 365.0, 145.0, 53.0, 31.0, 15.0, 15.0, 8.0, 1.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.5244140625, -0.5119514465332031, -0.49948883056640625, -0.4870262145996094, -0.4745635986328125, -0.4621009826660156, -0.44963836669921875, -0.4371757507324219, -0.424713134765625, -0.4122505187988281, -0.39978790283203125, -0.3873252868652344, -0.3748626708984375, -0.3624000549316406, -0.34993743896484375, -0.3374748229980469, -0.32501220703125, -0.3125495910644531, -0.30008697509765625, -0.2876243591308594, -0.2751617431640625, -0.2626991271972656, -0.25023651123046875, -0.23777389526367188, -0.225311279296875, -0.21284866333007812, -0.20038604736328125, -0.18792343139648438, -0.1754608154296875, -0.16299819946289062, -0.15053558349609375, -0.13807296752929688, -0.1256103515625, -0.11314773559570312, -0.10068511962890625, -0.08822250366210938, -0.0757598876953125, -0.06329727172851562, -0.05083465576171875, -0.038372039794921875, -0.025909423828125, -0.013446807861328125, -0.00098419189453125, 0.011478424072265625, 0.0239410400390625, 0.036403656005859375, 0.04886627197265625, 0.061328887939453125, 0.07379150390625, 0.08625411987304688, 0.09871673583984375, 0.11117935180664062, 0.1236419677734375, 0.13610458374023438, 0.14856719970703125, 0.16102981567382812, 0.173492431640625, 0.18595504760742188, 0.19841766357421875, 0.21088027954101562, 0.2233428955078125, 0.23580551147460938, 0.24826812744140625, 0.2607307434082031, 0.273193359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 17.0, 120.0, 501.0, 311.0, 38.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7340316772460938, -2.6027283668518066, -2.4714248180389404, -2.3401215076446533, -2.208817958831787, -2.0775146484375, -1.946211338043213, -1.8149079084396362, -1.6836044788360596, -1.552301049232483, -1.4209976196289062, -1.2896943092346191, -1.1583908796310425, -1.0270874500274658, -0.8957840800285339, -0.764480710029602, -0.6331772804260254, -0.5018738508224487, -0.37057048082351685, -0.23926708102226257, -0.1079636812210083, 0.02333974838256836, 0.15464311838150024, 0.28594648838043213, 0.4172499179840088, 0.5485533475875854, 0.6798567175865173, 0.8111600875854492, 0.9424635171890259, 1.0737669467926025, 1.2050702571868896, 1.3363736867904663, 1.4676775932312012, 1.5989810228347778, 1.7302844524383545, 1.8615877628326416, 1.9928911924362183, 2.124194622039795, 2.255497932434082, 2.386801242828369, 2.5181047916412354, 2.6494081020355225, 2.7807116508483887, 2.912014961242676, 3.043318271636963, 3.174621820449829, 3.305925130844116, 3.4372286796569824, 3.5685319900512695, 3.6998353004455566, 3.831138849258423, 3.96244215965271, 4.093745708465576, 4.225049018859863, 4.35635232925415, 4.4876556396484375, 4.618959426879883, 4.75026273727417, 4.881566047668457, 5.012869834899902, 5.1441731452941895, 5.275476455688477, 5.406779766082764, 5.538083076477051, 5.669386386871338]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 9.0, 9.0, 7.0, 14.0, 20.0, 22.0, 21.0, 16.0, 28.0, 34.0, 36.0, 32.0, 45.0, 40.0, 38.0, 52.0, 51.0, 57.0, 42.0, 39.0, 41.0, 46.0, 41.0, 31.0, 41.0, 24.0, 16.0, 28.0, 25.0, 22.0, 15.0, 14.0, 8.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8381653428077698, -0.8101806044578552, -0.7821958661079407, -0.7542111277580261, -0.7262264490127563, -0.6982417106628418, -0.6702569723129272, -0.6422722339630127, -0.6142874956130981, -0.5863027572631836, -0.558318018913269, -0.5303332805633545, -0.5023485422134399, -0.4743638336658478, -0.4463791251182556, -0.41839438676834106, -0.3904096484184265, -0.36242491006851196, -0.3344401717185974, -0.30645546317100525, -0.2784707248210907, -0.25048598647117615, -0.2225012630224228, -0.19451653957366943, -0.16653180122375488, -0.13854706287384033, -0.11056233942508698, -0.08257760852575302, -0.05459287762641907, -0.026608139276504517, 0.0013765841722488403, 0.029361307621002197, 0.05734598636627197, 0.08533071726560593, 0.11331544816493988, 0.14130017161369324, 0.1692849099636078, 0.19726964831352234, 0.2252543717622757, 0.25323909521102905, 0.2812238335609436, 0.30920857191085815, 0.3371933102607727, 0.36517801880836487, 0.3931627571582794, 0.42114749550819397, 0.44913220405578613, 0.4771169424057007, 0.5051016807556152, 0.5330864191055298, 0.5610711574554443, 0.5890558958053589, 0.6170406341552734, 0.645025372505188, 0.6730100512504578, 0.7009947896003723, 0.7289795279502869, 0.7569642663002014, 0.784949004650116, 0.8129337430000305, 0.8409184217453003, 0.8689031600952148, 0.8968878984451294, 0.924872636795044, 0.9528573751449585]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 18.0, 10.0, 18.0, 26.0, 29.0, 49.0, 64.0, 70.0, 109.0, 139.0, 187.0, 290.0, 433.0, 585.0, 911.0, 1448.0, 2407.0, 5363.0, 15019.0, 63354.0, 337237.0, 474330.0, 108822.0, 22420.0, 6971.0, 3233.0, 1707.0, 943.0, 689.0, 472.0, 313.0, 243.0, 178.0, 115.0, 97.0, 73.0, 46.0, 27.0, 21.0, 20.0, 17.0, 9.0, 7.0, 8.0, 11.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.66748046875, -0.64605712890625, -0.6246337890625, -0.60321044921875, -0.581787109375, -0.56036376953125, -0.5389404296875, -0.51751708984375, -0.49609375, -0.47467041015625, -0.4532470703125, -0.43182373046875, -0.410400390625, -0.38897705078125, -0.3675537109375, -0.34613037109375, -0.32470703125, -0.30328369140625, -0.2818603515625, -0.26043701171875, -0.239013671875, -0.21759033203125, -0.1961669921875, -0.17474365234375, -0.1533203125, -0.13189697265625, -0.1104736328125, -0.08905029296875, -0.067626953125, -0.04620361328125, -0.0247802734375, -0.00335693359375, 0.01806640625, 0.03948974609375, 0.0609130859375, 0.08233642578125, 0.103759765625, 0.12518310546875, 0.1466064453125, 0.16802978515625, 0.189453125, 0.21087646484375, 0.2322998046875, 0.25372314453125, 0.275146484375, 0.29656982421875, 0.3179931640625, 0.33941650390625, 0.36083984375, 0.38226318359375, 0.4036865234375, 0.42510986328125, 0.446533203125, 0.46795654296875, 0.4893798828125, 0.51080322265625, 0.5322265625, 0.55364990234375, 0.5750732421875, 0.59649658203125, 0.617919921875, 0.63934326171875, 0.6607666015625, 0.68218994140625, 0.70361328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 8.0, 16.0, 33.0, 67.0, 86.0, 136.0, 158.0, 158.0, 125.0, 93.0, 46.0, 26.0, 14.0, 13.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406005859375, -0.39365386962890625, -0.3813018798828125, -0.36894989013671875, -0.356597900390625, -0.34424591064453125, -0.3318939208984375, -0.31954193115234375, -0.30718994140625, -0.29483795166015625, -0.2824859619140625, -0.27013397216796875, -0.257781982421875, -0.24542999267578125, -0.2330780029296875, -0.22072601318359375, -0.2083740234375, -0.19602203369140625, -0.1836700439453125, -0.17131805419921875, -0.158966064453125, -0.14661407470703125, -0.1342620849609375, -0.12191009521484375, -0.10955810546875, -0.09720611572265625, -0.0848541259765625, -0.07250213623046875, -0.060150146484375, -0.04779815673828125, -0.0354461669921875, -0.02309417724609375, -0.0107421875, 0.00160980224609375, 0.0139617919921875, 0.02631378173828125, 0.038665771484375, 0.05101776123046875, 0.0633697509765625, 0.07572174072265625, 0.08807373046875, 0.10042572021484375, 0.1127777099609375, 0.12512969970703125, 0.137481689453125, 0.14983367919921875, 0.1621856689453125, 0.17453765869140625, 0.1868896484375, 0.19924163818359375, 0.2115936279296875, 0.22394561767578125, 0.236297607421875, 0.24864959716796875, 0.2610015869140625, 0.27335357666015625, 0.28570556640625, 0.29805755615234375, 0.3104095458984375, 0.32276153564453125, 0.335113525390625, 0.34746551513671875, 0.3598175048828125, 0.37216949462890625, 0.384521484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 2.0, 9.0, 15.0, 11.0, 37.0, 47.0, 55.0, 86.0, 138.0, 201.0, 334.0, 632.0, 1326.0, 3342.0, 10467.0, 47344.0, 284081.0, 533787.0, 132841.0, 23519.0, 5993.0, 2128.0, 921.0, 488.0, 264.0, 177.0, 111.0, 59.0, 47.0, 28.0, 14.0, 12.0, 13.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.8169784545898438, -0.7916717529296875, -0.7663650512695312, -0.741058349609375, -0.7157516479492188, -0.6904449462890625, -0.6651382446289062, -0.63983154296875, -0.6145248413085938, -0.5892181396484375, -0.5639114379882812, -0.538604736328125, -0.5132980346679688, -0.4879913330078125, -0.46268463134765625, -0.4373779296875, -0.41207122802734375, -0.3867645263671875, -0.36145782470703125, -0.336151123046875, -0.31084442138671875, -0.2855377197265625, -0.26023101806640625, -0.23492431640625, -0.20961761474609375, -0.1843109130859375, -0.15900421142578125, -0.133697509765625, -0.10839080810546875, -0.0830841064453125, -0.05777740478515625, -0.032470703125, -0.00716400146484375, 0.0181427001953125, 0.04344940185546875, 0.068756103515625, 0.09406280517578125, 0.1193695068359375, 0.14467620849609375, 0.16998291015625, 0.19528961181640625, 0.2205963134765625, 0.24590301513671875, 0.271209716796875, 0.29651641845703125, 0.3218231201171875, 0.34712982177734375, 0.3724365234375, 0.39774322509765625, 0.4230499267578125, 0.44835662841796875, 0.473663330078125, 0.49897003173828125, 0.5242767333984375, 0.5495834350585938, 0.57489013671875, 0.6001968383789062, 0.6255035400390625, 0.6508102416992188, 0.676116943359375, 0.7014236450195312, 0.7267303466796875, 0.7520370483398438, 0.77734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 2.0, 7.0, 3.0, 11.0, 10.0, 8.0, 14.0, 13.0, 17.0, 23.0, 26.0, 28.0, 34.0, 39.0, 35.0, 46.0, 43.0, 54.0, 46.0, 53.0, 57.0, 55.0, 57.0, 40.0, 47.0, 42.0, 39.0, 20.0, 32.0, 15.0, 21.0, 9.0, 10.0, 13.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0244140625, -0.9941482543945312, -0.9638824462890625, -0.9336166381835938, -0.903350830078125, -0.8730850219726562, -0.8428192138671875, -0.8125534057617188, -0.78228759765625, -0.7520217895507812, -0.7217559814453125, -0.6914901733398438, -0.661224365234375, -0.6309585571289062, -0.6006927490234375, -0.5704269409179688, -0.5401611328125, -0.5098953247070312, -0.4796295166015625, -0.44936370849609375, -0.419097900390625, -0.38883209228515625, -0.3585662841796875, -0.32830047607421875, -0.29803466796875, -0.26776885986328125, -0.2375030517578125, -0.20723724365234375, -0.176971435546875, -0.14670562744140625, -0.1164398193359375, -0.08617401123046875, -0.055908203125, -0.02564239501953125, 0.0046234130859375, 0.03488922119140625, 0.065155029296875, 0.09542083740234375, 0.1256866455078125, 0.15595245361328125, 0.18621826171875, 0.21648406982421875, 0.2467498779296875, 0.27701568603515625, 0.307281494140625, 0.33754730224609375, 0.3678131103515625, 0.39807891845703125, 0.4283447265625, 0.45861053466796875, 0.4888763427734375, 0.5191421508789062, 0.549407958984375, 0.5796737670898438, 0.6099395751953125, 0.6402053833007812, 0.67047119140625, 0.7007369995117188, 0.7310028076171875, 0.7612686157226562, 0.791534423828125, 0.8218002319335938, 0.8520660400390625, 0.8823318481445312, 0.91259765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 7.0, 3.0, 7.0, 14.0, 26.0, 37.0, 71.0, 181.0, 478.0, 1733.0, 10944.0, 349541.0, 663329.0, 18716.0, 2443.0, 607.0, 210.0, 107.0, 43.0, 23.0, 17.0, 8.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5795135498046875, -0.560882568359375, -0.5422515869140625, -0.52362060546875, -0.5049896240234375, -0.486358642578125, -0.4677276611328125, -0.4490966796875, -0.4304656982421875, -0.411834716796875, -0.3932037353515625, -0.37457275390625, -0.3559417724609375, -0.337310791015625, -0.3186798095703125, -0.300048828125, -0.2814178466796875, -0.262786865234375, -0.2441558837890625, -0.22552490234375, -0.2068939208984375, -0.188262939453125, -0.1696319580078125, -0.1510009765625, -0.1323699951171875, -0.113739013671875, -0.0951080322265625, -0.07647705078125, -0.0578460693359375, -0.039215087890625, -0.0205841064453125, -0.001953125, 0.0166778564453125, 0.035308837890625, 0.0539398193359375, 0.07257080078125, 0.0912017822265625, 0.109832763671875, 0.1284637451171875, 0.1470947265625, 0.1657257080078125, 0.184356689453125, 0.2029876708984375, 0.22161865234375, 0.2402496337890625, 0.258880615234375, 0.2775115966796875, 0.296142578125, 0.3147735595703125, 0.333404541015625, 0.3520355224609375, 0.37066650390625, 0.3892974853515625, 0.407928466796875, 0.4265594482421875, 0.4451904296875, 0.4638214111328125, 0.482452392578125, 0.5010833740234375, 0.51971435546875, 0.5383453369140625, 0.556976318359375, 0.5756072998046875, 0.59423828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 15.0, 15.0, 11.0, 21.0, 12.0, 13.0, 21.0, 27.0, 28.0, 32.0, 47.0, 34.0, 46.0, 70.0, 71.0, 84.0, 70.0, 55.0, 32.0, 34.0, 29.0, 24.0, 28.0, 20.0, 26.0, 17.0, 24.0, 14.0, 5.0, 9.0, 10.0, 6.0, 8.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.5367431640625e-05, -9.241234511137009e-05, -8.945725858211517e-05, -8.650217205286026e-05, -8.354708552360535e-05, -8.059199899435043e-05, -7.763691246509552e-05, -7.46818259358406e-05, -7.17267394065857e-05, -6.877165287733078e-05, -6.581656634807587e-05, -6.286147981882095e-05, -5.990639328956604e-05, -5.695130676031113e-05, -5.399622023105621e-05, -5.10411337018013e-05, -4.808604717254639e-05, -4.5130960643291473e-05, -4.217587411403656e-05, -3.922078758478165e-05, -3.6265701055526733e-05, -3.331061452627182e-05, -3.0355527997016907e-05, -2.7400441467761993e-05, -2.444535493850708e-05, -2.1490268409252167e-05, -1.8535181879997253e-05, -1.558009535074234e-05, -1.2625008821487427e-05, -9.669922292232513e-06, -6.7148357629776e-06, -3.7597492337226868e-06, -8.046627044677734e-07, 2.15042382478714e-06, 5.105510354042053e-06, 8.060596883296967e-06, 1.101568341255188e-05, 1.3970769941806793e-05, 1.6925856471061707e-05, 1.988094300031662e-05, 2.2836029529571533e-05, 2.5791116058826447e-05, 2.874620258808136e-05, 3.170128911733627e-05, 3.4656375646591187e-05, 3.76114621758461e-05, 4.056654870510101e-05, 4.3521635234355927e-05, 4.647672176361084e-05, 4.943180829286575e-05, 5.2386894822120667e-05, 5.534198135137558e-05, 5.829706788063049e-05, 6.12521544098854e-05, 6.420724093914032e-05, 6.716232746839523e-05, 7.011741399765015e-05, 7.307250052690506e-05, 7.602758705615997e-05, 7.898267358541489e-05, 8.19377601146698e-05, 8.489284664392471e-05, 8.784793317317963e-05, 9.080301970243454e-05, 9.375810623168945e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 15.0, 20.0, 24.0, 37.0, 65.0, 143.0, 283.0, 737.0, 2463.0, 16176.0, 407649.0, 593332.0, 22898.0, 3169.0, 850.0, 331.0, 173.0, 65.0, 40.0, 27.0, 19.0, 4.0, 11.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.556640625, -0.5403022766113281, -0.5239639282226562, -0.5076255798339844, -0.4912872314453125, -0.4749488830566406, -0.45861053466796875, -0.4422721862792969, -0.425933837890625, -0.4095954895019531, -0.39325714111328125, -0.3769187927246094, -0.3605804443359375, -0.3442420959472656, -0.32790374755859375, -0.3115653991699219, -0.29522705078125, -0.2788887023925781, -0.26255035400390625, -0.24621200561523438, -0.2298736572265625, -0.21353530883789062, -0.19719696044921875, -0.18085861206054688, -0.164520263671875, -0.14818191528320312, -0.13184356689453125, -0.11550521850585938, -0.0991668701171875, -0.08282852172851562, -0.06649017333984375, -0.050151824951171875, -0.0338134765625, -0.017475128173828125, -0.00113677978515625, 0.015201568603515625, 0.0315399169921875, 0.047878265380859375, 0.06421661376953125, 0.08055496215820312, 0.096893310546875, 0.11323165893554688, 0.12957000732421875, 0.14590835571289062, 0.1622467041015625, 0.17858505249023438, 0.19492340087890625, 0.21126174926757812, 0.22760009765625, 0.24393844604492188, 0.26027679443359375, 0.2766151428222656, 0.2929534912109375, 0.3092918395996094, 0.32563018798828125, 0.3419685363769531, 0.358306884765625, 0.3746452331542969, 0.39098358154296875, 0.4073219299316406, 0.4236602783203125, 0.4399986267089844, 0.45633697509765625, 0.4726753234863281, 0.489013671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 1.0, 6.0, 6.0, 10.0, 13.0, 6.0, 18.0, 20.0, 19.0, 41.0, 53.0, 56.0, 76.0, 108.0, 107.0, 80.0, 79.0, 69.0, 58.0, 48.0, 34.0, 20.0, 16.0, 7.0, 10.0, 10.0, 3.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.278961181640625, -0.26983642578125, -0.260711669921875, -0.2515869140625, -0.242462158203125, -0.23333740234375, -0.224212646484375, -0.215087890625, -0.205963134765625, -0.19683837890625, -0.187713623046875, -0.1785888671875, -0.169464111328125, -0.16033935546875, -0.151214599609375, -0.14208984375, -0.132965087890625, -0.12384033203125, -0.114715576171875, -0.1055908203125, -0.096466064453125, -0.08734130859375, -0.078216552734375, -0.069091796875, -0.059967041015625, -0.05084228515625, -0.041717529296875, -0.0325927734375, -0.023468017578125, -0.01434326171875, -0.005218505859375, 0.00390625, 0.013031005859375, 0.02215576171875, 0.031280517578125, 0.0404052734375, 0.049530029296875, 0.05865478515625, 0.067779541015625, 0.076904296875, 0.086029052734375, 0.09515380859375, 0.104278564453125, 0.1134033203125, 0.122528076171875, 0.13165283203125, 0.140777587890625, 0.14990234375, 0.159027099609375, 0.16815185546875, 0.177276611328125, 0.1864013671875, 0.195526123046875, 0.20465087890625, 0.213775634765625, 0.222900390625, 0.232025146484375, 0.24114990234375, 0.250274658203125, 0.2593994140625, 0.268524169921875, 0.27764892578125, 0.286773681640625, 0.2958984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 39.0, 110.0, 271.0, 360.0, 145.0, 41.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75207805633545, -10.463418960571289, -10.174758911132812, -9.886098861694336, -9.597439765930176, -9.308780670166016, -9.020120620727539, -8.731460571289062, -8.442801475524902, -8.154142379760742, -7.865482330322266, -7.576822757720947, -7.288163185119629, -6.9995036125183105, -6.710844039916992, -6.422184467315674, -6.1335248947143555, -5.844865322113037, -5.556205749511719, -5.2675461769104, -4.978886604309082, -4.690227031707764, -4.401567459106445, -4.112907886505127, -3.8242483139038086, -3.5355887413024902, -3.246929168701172, -2.9582695960998535, -2.669610023498535, -2.380950450897217, -2.0922908782958984, -1.80363130569458, -1.5149707794189453, -1.226311206817627, -0.9376516342163086, -0.6489920616149902, -0.3603324890136719, -0.07167291641235352, 0.21698665618896484, 0.5056462287902832, 0.7943058013916016, 1.08296537399292, 1.3716249465942383, 1.6602845191955566, 1.948944091796875, 2.2376036643981934, 2.5262632369995117, 2.81492280960083, 3.1035823822021484, 3.392241954803467, 3.680901527404785, 3.9695611000061035, 4.258220672607422, 4.54688024520874, 4.835539817810059, 5.124199390411377, 5.412858963012695, 5.701518535614014, 5.990178108215332, 6.27883768081665, 6.567497253417969, 6.856156826019287, 7.1448163986206055, 7.433475971221924, 7.722135543823242]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 0.0, 7.0, 1.0, 12.0, 13.0, 25.0, 14.0, 37.0, 29.0, 40.0, 49.0, 43.0, 46.0, 59.0, 60.0, 61.0, 78.0, 48.0, 68.0, 54.0, 39.0, 47.0, 36.0, 31.0, 21.0, 20.0, 21.0, 12.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0081915855407715, -6.807882308959961, -6.60757303237915, -6.40726375579834, -6.2069549560546875, -6.006645202636719, -5.806336402893066, -5.606027126312256, -5.405717849731445, -5.205408573150635, -5.005099296569824, -4.804790019989014, -4.604480743408203, -4.404171943664551, -4.20386266708374, -4.00355339050293, -3.803244113922119, -3.6029348373413086, -3.402625560760498, -3.2023165225982666, -3.002007246017456, -2.8016979694366455, -2.601388931274414, -2.4010796546936035, -2.200770378112793, -2.0004611015319824, -1.8001519441604614, -1.5998427867889404, -1.3995335102081299, -1.1992242336273193, -0.9989150762557983, -0.7986059188842773, -0.5982961654663086, -0.3979869484901428, -0.19767773151397705, 0.0026314854621887207, 0.2029407024383545, 0.40324997901916504, 0.603559136390686, 0.803868293762207, 1.0041775703430176, 1.2044868469238281, 1.4047960042953491, 1.6051051616668701, 1.8054144382476807, 2.005723714828491, 2.2060327529907227, 2.406342029571533, 2.6066513061523438, 2.8069605827331543, 3.007269859313965, 3.2075788974761963, 3.407888174057007, 3.6081974506378174, 3.808506488800049, 4.008815765380859, 4.20912504196167, 4.4094343185424805, 4.609743595123291, 4.810052871704102, 5.010361671447754, 5.210671424865723, 5.410980224609375, 5.6112895011901855, 5.811598777770996]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 4.0, 14.0, 16.0, 32.0, 71.0, 105.0, 197.0, 468.0, 1432.0, 7794.0, 501032.0, 3669040.0, 11183.0, 1792.0, 580.0, 236.0, 116.0, 46.0, 44.0, 26.0, 14.0, 11.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2734375, -2.210418701171875, -2.14739990234375, -2.084381103515625, -2.0213623046875, -1.958343505859375, -1.89532470703125, -1.832305908203125, -1.769287109375, -1.706268310546875, -1.64324951171875, -1.580230712890625, -1.5172119140625, -1.454193115234375, -1.39117431640625, -1.328155517578125, -1.26513671875, -1.202117919921875, -1.13909912109375, -1.076080322265625, -1.0130615234375, -0.950042724609375, -0.88702392578125, -0.824005126953125, -0.760986328125, -0.697967529296875, -0.63494873046875, -0.571929931640625, -0.5089111328125, -0.445892333984375, -0.38287353515625, -0.319854736328125, -0.2568359375, -0.193817138671875, -0.13079833984375, -0.067779541015625, -0.0047607421875, 0.058258056640625, 0.12127685546875, 0.184295654296875, 0.247314453125, 0.310333251953125, 0.37335205078125, 0.436370849609375, 0.4993896484375, 0.562408447265625, 0.62542724609375, 0.688446044921875, 0.75146484375, 0.814483642578125, 0.87750244140625, 0.940521240234375, 1.0035400390625, 1.066558837890625, 1.12957763671875, 1.192596435546875, 1.255615234375, 1.318634033203125, 1.38165283203125, 1.444671630859375, 1.5076904296875, 1.570709228515625, 1.63372802734375, 1.696746826171875, 1.759765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 18.0, 31.0, 37.0, 67.0, 108.0, 133.0, 134.0, 113.0, 107.0, 88.0, 58.0, 36.0, 19.0, 9.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.408447265625, -0.3962898254394531, -0.38413238525390625, -0.3719749450683594, -0.3598175048828125, -0.3476600646972656, -0.33550262451171875, -0.3233451843261719, -0.311187744140625, -0.2990303039550781, -0.28687286376953125, -0.2747154235839844, -0.2625579833984375, -0.2504005432128906, -0.23824310302734375, -0.22608566284179688, -0.21392822265625, -0.20177078247070312, -0.18961334228515625, -0.17745590209960938, -0.1652984619140625, -0.15314102172851562, -0.14098358154296875, -0.12882614135742188, -0.116668701171875, -0.10451126098632812, -0.09235382080078125, -0.08019638061523438, -0.0680389404296875, -0.055881500244140625, -0.04372406005859375, -0.031566619873046875, -0.0194091796875, -0.007251739501953125, 0.00490570068359375, 0.017063140869140625, 0.0292205810546875, 0.041378021240234375, 0.05353546142578125, 0.06569290161132812, 0.077850341796875, 0.09000778198242188, 0.10216522216796875, 0.11432266235351562, 0.1264801025390625, 0.13863754272460938, 0.15079498291015625, 0.16295242309570312, 0.17510986328125, 0.18726730346679688, 0.19942474365234375, 0.21158218383789062, 0.2237396240234375, 0.23589706420898438, 0.24805450439453125, 0.2602119445800781, 0.272369384765625, 0.2845268249511719, 0.29668426513671875, 0.3088417053222656, 0.3209991455078125, 0.3331565856933594, 0.34531402587890625, 0.3574714660644531, 0.36962890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 7.0, 15.0, 24.0, 44.0, 71.0, 175.0, 467.0, 1512.0, 8648.0, 222850.0, 3922987.0, 32827.0, 3212.0, 812.0, 329.0, 138.0, 73.0, 41.0, 17.0, 12.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4511871337890625, -1.411163330078125, -1.3711395263671875, -1.33111572265625, -1.2910919189453125, -1.251068115234375, -1.2110443115234375, -1.1710205078125, -1.1309967041015625, -1.090972900390625, -1.0509490966796875, -1.01092529296875, -0.9709014892578125, -0.930877685546875, -0.8908538818359375, -0.850830078125, -0.8108062744140625, -0.770782470703125, -0.7307586669921875, -0.69073486328125, -0.6507110595703125, -0.610687255859375, -0.5706634521484375, -0.5306396484375, -0.4906158447265625, -0.450592041015625, -0.4105682373046875, -0.37054443359375, -0.3305206298828125, -0.290496826171875, -0.2504730224609375, -0.21044921875, -0.1704254150390625, -0.130401611328125, -0.0903778076171875, -0.05035400390625, -0.0103302001953125, 0.029693603515625, 0.0697174072265625, 0.1097412109375, 0.1497650146484375, 0.189788818359375, 0.2298126220703125, 0.26983642578125, 0.3098602294921875, 0.349884033203125, 0.3899078369140625, 0.429931640625, 0.4699554443359375, 0.509979248046875, 0.5500030517578125, 0.59002685546875, 0.6300506591796875, 0.670074462890625, 0.7100982666015625, 0.7501220703125, 0.7901458740234375, 0.830169677734375, 0.8701934814453125, 0.91021728515625, 0.9502410888671875, 0.990264892578125, 1.0302886962890625, 1.0703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 23.0, 32.0, 39.0, 59.0, 120.0, 278.0, 909.0, 1663.0, 497.0, 182.0, 76.0, 52.0, 32.0, 29.0, 11.0, 12.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.220703125, -0.21364402770996094, -0.20658493041992188, -0.1995258331298828, -0.19246673583984375, -0.1854076385498047, -0.17834854125976562, -0.17128944396972656, -0.1642303466796875, -0.15717124938964844, -0.15011215209960938, -0.1430530548095703, -0.13599395751953125, -0.1289348602294922, -0.12187576293945312, -0.11481666564941406, -0.107757568359375, -0.10069847106933594, -0.09363937377929688, -0.08658027648925781, -0.07952117919921875, -0.07246208190917969, -0.06540298461914062, -0.05834388732910156, -0.0512847900390625, -0.04422569274902344, -0.037166595458984375, -0.030107498168945312, -0.02304840087890625, -0.015989303588867188, -0.008930206298828125, -0.0018711090087890625, 0.00518798828125, 0.012247085571289062, 0.019306182861328125, 0.026365280151367188, 0.03342437744140625, 0.04048347473144531, 0.047542572021484375, 0.05460166931152344, 0.0616607666015625, 0.06871986389160156, 0.07577896118164062, 0.08283805847167969, 0.08989715576171875, 0.09695625305175781, 0.10401535034179688, 0.11107444763183594, 0.118133544921875, 0.12519264221191406, 0.13225173950195312, 0.1393108367919922, 0.14636993408203125, 0.1534290313720703, 0.16048812866210938, 0.16754722595214844, 0.1746063232421875, 0.18166542053222656, 0.18872451782226562, 0.1957836151123047, 0.20284271240234375, 0.2099018096923828, 0.21696090698242188, 0.22402000427246094, 0.2310791015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 45.0, 79.0, 181.0, 298.0, 216.0, 113.0, 39.0, 16.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3465769290924072, -2.29524827003479, -2.243919610977173, -2.1925911903381348, -2.1412625312805176, -2.0899338722229004, -2.038605213165283, -1.9872766733169556, -1.935948133468628, -1.8846194744110107, -1.833290934562683, -1.781962275505066, -1.7306337356567383, -1.679305076599121, -1.627976417541504, -1.5766478776931763, -1.525319218635559, -1.473990559577942, -1.4226620197296143, -1.371333360671997, -1.3200048208236694, -1.2686761617660522, -1.2173476219177246, -1.1660189628601074, -1.1146903038024902, -1.063361644744873, -1.0120331048965454, -0.9607044458389282, -0.9093759059906006, -0.8580472469329834, -0.806718647480011, -0.7553900480270386, -0.7040615081787109, -0.6527329087257385, -0.6014043092727661, -0.5500756502151489, -0.4987470805644989, -0.4474184811115265, -0.3960898518562317, -0.3447612524032593, -0.29343265295028687, -0.24210405349731445, -0.19077543914318085, -0.13944682478904724, -0.08811822533607483, -0.03678962588310242, 0.014539003372192383, 0.0658676028251648, 0.11719620227813721, 0.16852480173110962, 0.21985341608524323, 0.27118203043937683, 0.32251062989234924, 0.37383922934532166, 0.42516785860061646, 0.47649645805358887, 0.5278250575065613, 0.5791536569595337, 0.6304822564125061, 0.6818108558654785, 0.7331395149230957, 0.7844680547714233, 0.8357967138290405, 0.8871253132820129, 0.9384539127349854]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 6.0, 12.0, 11.0, 14.0, 15.0, 21.0, 21.0, 33.0, 22.0, 35.0, 29.0, 37.0, 37.0, 38.0, 33.0, 48.0, 40.0, 43.0, 40.0, 46.0, 57.0, 41.0, 45.0, 32.0, 43.0, 30.0, 31.0, 32.0, 9.0, 13.0, 12.0, 13.0, 14.0, 16.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5483723878860474, -0.5289035439491272, -0.509434700012207, -0.48996591567993164, -0.4704970717430115, -0.4510282278060913, -0.43155941367149353, -0.41209059953689575, -0.3926217555999756, -0.3731529116630554, -0.35368409752845764, -0.33421528339385986, -0.3147464394569397, -0.29527759552001953, -0.27580878138542175, -0.256339967250824, -0.2368711233139038, -0.21740229427814484, -0.19793346524238586, -0.1784646362066269, -0.15899580717086792, -0.13952697813510895, -0.12005814909934998, -0.100589320063591, -0.08112049102783203, -0.06165166199207306, -0.04218283295631409, -0.022714003920555115, -0.0032451748847961426, 0.01622365415096283, 0.0356924831867218, 0.055161312222480774, 0.07463014125823975, 0.09409897029399872, 0.11356779932975769, 0.13303662836551666, 0.15250545740127563, 0.1719742864370346, 0.19144311547279358, 0.21091194450855255, 0.23038077354431152, 0.2498496025800705, 0.26931843161582947, 0.28878724575042725, 0.3082560896873474, 0.3277249336242676, 0.34719374775886536, 0.36666256189346313, 0.3861314058303833, 0.40560024976730347, 0.42506906390190125, 0.444537878036499, 0.4640067219734192, 0.48347556591033936, 0.5029443502426147, 0.5224131941795349, 0.5418820381164551, 0.5613508820533752, 0.5808197259902954, 0.6002885103225708, 0.619757354259491, 0.6392261981964111, 0.6586949825286865, 0.6781638264656067, 0.6976326704025269]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 9.0, 5.0, 8.0, 20.0, 30.0, 37.0, 70.0, 98.0, 162.0, 297.0, 497.0, 883.0, 1722.0, 3889.0, 12622.0, 73001.0, 509498.0, 380811.0, 48743.0, 9650.0, 3213.0, 1476.0, 729.0, 429.0, 243.0, 138.0, 93.0, 57.0, 52.0, 31.0, 10.0, 10.0, 2.0, 2.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.912109375, -0.8843841552734375, -0.856658935546875, -0.8289337158203125, -0.80120849609375, -0.7734832763671875, -0.745758056640625, -0.7180328369140625, -0.6903076171875, -0.6625823974609375, -0.634857177734375, -0.6071319580078125, -0.57940673828125, -0.5516815185546875, -0.523956298828125, -0.4962310791015625, -0.468505859375, -0.4407806396484375, -0.413055419921875, -0.3853302001953125, -0.35760498046875, -0.3298797607421875, -0.302154541015625, -0.2744293212890625, -0.2467041015625, -0.2189788818359375, -0.191253662109375, -0.1635284423828125, -0.13580322265625, -0.1080780029296875, -0.080352783203125, -0.0526275634765625, -0.02490234375, 0.0028228759765625, 0.030548095703125, 0.0582733154296875, 0.08599853515625, 0.1137237548828125, 0.141448974609375, 0.1691741943359375, 0.1968994140625, 0.2246246337890625, 0.252349853515625, 0.2800750732421875, 0.30780029296875, 0.3355255126953125, 0.363250732421875, 0.3909759521484375, 0.418701171875, 0.4464263916015625, 0.474151611328125, 0.5018768310546875, 0.52960205078125, 0.5573272705078125, 0.585052490234375, 0.6127777099609375, 0.6405029296875, 0.6682281494140625, 0.695953369140625, 0.7236785888671875, 0.75140380859375, 0.7791290283203125, 0.806854248046875, 0.8345794677734375, 0.8623046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 20.0, 30.0, 42.0, 61.0, 96.0, 121.0, 121.0, 126.0, 98.0, 103.0, 68.0, 35.0, 26.0, 13.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391845703125, -0.3802680969238281, -0.36869049072265625, -0.3571128845214844, -0.3455352783203125, -0.3339576721191406, -0.32238006591796875, -0.3108024597167969, -0.299224853515625, -0.2876472473144531, -0.27606964111328125, -0.2644920349121094, -0.2529144287109375, -0.24133682250976562, -0.22975921630859375, -0.21818161010742188, -0.20660400390625, -0.19502639770507812, -0.18344879150390625, -0.17187118530273438, -0.1602935791015625, -0.14871597290039062, -0.13713836669921875, -0.12556076049804688, -0.113983154296875, -0.10240554809570312, -0.09082794189453125, -0.07925033569335938, -0.0676727294921875, -0.056095123291015625, -0.04451751708984375, -0.032939910888671875, -0.0213623046875, -0.009784698486328125, 0.00179290771484375, 0.013370513916015625, 0.0249481201171875, 0.036525726318359375, 0.04810333251953125, 0.059680938720703125, 0.071258544921875, 0.08283615112304688, 0.09441375732421875, 0.10599136352539062, 0.1175689697265625, 0.12914657592773438, 0.14072418212890625, 0.15230178833007812, 0.16387939453125, 0.17545700073242188, 0.18703460693359375, 0.19861221313476562, 0.2101898193359375, 0.22176742553710938, 0.23334503173828125, 0.24492263793945312, 0.256500244140625, 0.2680778503417969, 0.27965545654296875, 0.2912330627441406, 0.3028106689453125, 0.3143882751464844, 0.32596588134765625, 0.3375434875488281, 0.34912109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 17.0, 17.0, 17.0, 22.0, 21.0, 46.0, 43.0, 70.0, 115.0, 141.0, 274.0, 449.0, 713.0, 1322.0, 2877.0, 8187.0, 32421.0, 154921.0, 462101.0, 294623.0, 65991.0, 14960.0, 4725.0, 1898.0, 959.0, 526.0, 305.0, 214.0, 142.0, 105.0, 74.0, 45.0, 43.0, 29.0, 36.0, 18.0, 20.0, 12.0, 4.0, 7.0, 1.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.59765625, -0.5782089233398438, -0.5587615966796875, -0.5393142700195312, -0.519866943359375, -0.5004196166992188, -0.4809722900390625, -0.46152496337890625, -0.44207763671875, -0.42263031005859375, -0.4031829833984375, -0.38373565673828125, -0.364288330078125, -0.34484100341796875, -0.3253936767578125, -0.30594635009765625, -0.2864990234375, -0.26705169677734375, -0.2476043701171875, -0.22815704345703125, -0.208709716796875, -0.18926239013671875, -0.1698150634765625, -0.15036773681640625, -0.13092041015625, -0.11147308349609375, -0.0920257568359375, -0.07257843017578125, -0.053131103515625, -0.03368377685546875, -0.0142364501953125, 0.00521087646484375, 0.024658203125, 0.04410552978515625, 0.0635528564453125, 0.08300018310546875, 0.102447509765625, 0.12189483642578125, 0.1413421630859375, 0.16078948974609375, 0.18023681640625, 0.19968414306640625, 0.2191314697265625, 0.23857879638671875, 0.258026123046875, 0.27747344970703125, 0.2969207763671875, 0.31636810302734375, 0.3358154296875, 0.35526275634765625, 0.3747100830078125, 0.39415740966796875, 0.413604736328125, 0.43305206298828125, 0.4524993896484375, 0.47194671630859375, 0.49139404296875, 0.5108413696289062, 0.5302886962890625, 0.5497360229492188, 0.569183349609375, 0.5886306762695312, 0.6080780029296875, 0.6275253295898438, 0.64697265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 15.0, 9.0, 17.0, 16.0, 14.0, 29.0, 22.0, 35.0, 38.0, 41.0, 42.0, 40.0, 41.0, 55.0, 46.0, 43.0, 54.0, 61.0, 37.0, 42.0, 36.0, 31.0, 31.0, 27.0, 23.0, 22.0, 23.0, 19.0, 11.0, 7.0, 10.0, 6.0, 9.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.92431640625, -0.8982162475585938, -0.8721160888671875, -0.8460159301757812, -0.819915771484375, -0.7938156127929688, -0.7677154541015625, -0.7416152954101562, -0.71551513671875, -0.6894149780273438, -0.6633148193359375, -0.6372146606445312, -0.611114501953125, -0.5850143432617188, -0.5589141845703125, -0.5328140258789062, -0.5067138671875, -0.48061370849609375, -0.4545135498046875, -0.42841339111328125, -0.402313232421875, -0.37621307373046875, -0.3501129150390625, -0.32401275634765625, -0.29791259765625, -0.27181243896484375, -0.2457122802734375, -0.21961212158203125, -0.193511962890625, -0.16741180419921875, -0.1413116455078125, -0.11521148681640625, -0.089111328125, -0.06301116943359375, -0.0369110107421875, -0.01081085205078125, 0.015289306640625, 0.04138946533203125, 0.0674896240234375, 0.09358978271484375, 0.11968994140625, 0.14579010009765625, 0.1718902587890625, 0.19799041748046875, 0.224090576171875, 0.25019073486328125, 0.2762908935546875, 0.30239105224609375, 0.3284912109375, 0.35459136962890625, 0.3806915283203125, 0.40679168701171875, 0.432891845703125, 0.45899200439453125, 0.4850921630859375, 0.5111923217773438, 0.53729248046875, 0.5633926391601562, 0.5894927978515625, 0.6155929565429688, 0.641693115234375, 0.6677932739257812, 0.6938934326171875, 0.7199935913085938, 0.74609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 14.0, 42.0, 78.0, 203.0, 704.0, 3281.0, 49440.0, 838634.0, 148046.0, 6512.0, 1064.0, 312.0, 107.0, 42.0, 24.0, 16.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4648551940917969, -0.45143890380859375, -0.4380226135253906, -0.4246063232421875, -0.4111900329589844, -0.39777374267578125, -0.3843574523925781, -0.370941162109375, -0.3575248718261719, -0.34410858154296875, -0.3306922912597656, -0.3172760009765625, -0.3038597106933594, -0.29044342041015625, -0.2770271301269531, -0.26361083984375, -0.2501945495605469, -0.23677825927734375, -0.22336196899414062, -0.2099456787109375, -0.19652938842773438, -0.18311309814453125, -0.16969680786132812, -0.156280517578125, -0.14286422729492188, -0.12944793701171875, -0.11603164672851562, -0.1026153564453125, -0.08919906616210938, -0.07578277587890625, -0.062366485595703125, -0.0489501953125, -0.035533905029296875, -0.02211761474609375, -0.008701324462890625, 0.0047149658203125, 0.018131256103515625, 0.03154754638671875, 0.044963836669921875, 0.058380126953125, 0.07179641723632812, 0.08521270751953125, 0.09862899780273438, 0.1120452880859375, 0.12546157836914062, 0.13887786865234375, 0.15229415893554688, 0.16571044921875, 0.17912673950195312, 0.19254302978515625, 0.20595932006835938, 0.2193756103515625, 0.23279190063476562, 0.24620819091796875, 0.2596244812011719, 0.273040771484375, 0.2864570617675781, 0.29987335205078125, 0.3132896423339844, 0.3267059326171875, 0.3401222229003906, 0.35353851318359375, 0.3669548034667969, 0.38037109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 3.0, 10.0, 7.0, 8.0, 17.0, 13.0, 17.0, 19.0, 28.0, 28.0, 40.0, 49.0, 53.0, 76.0, 92.0, 102.0, 74.0, 75.0, 36.0, 49.0, 26.0, 18.0, 23.0, 26.0, 21.0, 16.0, 20.0, 12.0, 8.0, 6.0, 5.0, 1.0, 3.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011044740676879883, -0.00010711606591939926, -0.0001037847250699997, -0.00010045338422060013, -9.712204337120056e-05, -9.3790702521801e-05, -9.045936167240143e-05, -8.712802082300186e-05, -8.37966799736023e-05, -8.046533912420273e-05, -7.713399827480316e-05, -7.38026574254036e-05, -7.047131657600403e-05, -6.713997572660446e-05, -6.38086348772049e-05, -6.047729402780533e-05, -5.714595317840576e-05, -5.3814612329006195e-05, -5.048327147960663e-05, -4.715193063020706e-05, -4.3820589780807495e-05, -4.048924893140793e-05, -3.715790808200836e-05, -3.3826567232608795e-05, -3.049522638320923e-05, -2.7163885533809662e-05, -2.3832544684410095e-05, -2.050120383501053e-05, -1.7169862985610962e-05, -1.3838522136211395e-05, -1.0507181286811829e-05, -7.175840437412262e-06, -3.844499588012695e-06, -5.131587386131287e-07, 2.818182110786438e-06, 6.149522960186005e-06, 9.480863809585571e-06, 1.2812204658985138e-05, 1.6143545508384705e-05, 1.947488635778427e-05, 2.2806227207183838e-05, 2.6137568056583405e-05, 2.946890890598297e-05, 3.280024975538254e-05, 3.6131590604782104e-05, 3.946293145418167e-05, 4.279427230358124e-05, 4.6125613152980804e-05, 4.945695400238037e-05, 5.278829485177994e-05, 5.6119635701179504e-05, 5.945097655057907e-05, 6.278231739997864e-05, 6.61136582493782e-05, 6.944499909877777e-05, 7.277633994817734e-05, 7.61076807975769e-05, 7.943902164697647e-05, 8.277036249637604e-05, 8.61017033457756e-05, 8.943304419517517e-05, 9.276438504457474e-05, 9.60957258939743e-05, 9.942706674337387e-05, 0.00010275840759277344]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 6.0, 7.0, 11.0, 11.0, 25.0, 25.0, 32.0, 39.0, 58.0, 96.0, 128.0, 263.0, 372.0, 694.0, 1446.0, 3596.0, 11731.0, 55765.0, 347754.0, 501780.0, 97612.0, 17935.0, 5090.0, 1882.0, 924.0, 448.0, 269.0, 162.0, 109.0, 77.0, 56.0, 35.0, 24.0, 23.0, 17.0, 11.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.177734375, -0.17142105102539062, -0.16510772705078125, -0.15879440307617188, -0.1524810791015625, -0.14616775512695312, -0.13985443115234375, -0.13354110717773438, -0.127227783203125, -0.12091445922851562, -0.11460113525390625, -0.10828781127929688, -0.1019744873046875, -0.09566116333007812, -0.08934783935546875, -0.08303451538085938, -0.07672119140625, -0.07040786743164062, -0.06409454345703125, -0.057781219482421875, -0.0514678955078125, -0.045154571533203125, -0.03884124755859375, -0.032527923583984375, -0.026214599609375, -0.019901275634765625, -0.01358795166015625, -0.007274627685546875, -0.0009613037109375, 0.005352020263671875, 0.01166534423828125, 0.017978668212890625, 0.0242919921875, 0.030605316162109375, 0.03691864013671875, 0.043231964111328125, 0.0495452880859375, 0.055858612060546875, 0.06217193603515625, 0.06848526000976562, 0.074798583984375, 0.08111190795898438, 0.08742523193359375, 0.09373855590820312, 0.1000518798828125, 0.10636520385742188, 0.11267852783203125, 0.11899185180664062, 0.12530517578125, 0.13161849975585938, 0.13793182373046875, 0.14424514770507812, 0.1505584716796875, 0.15687179565429688, 0.16318511962890625, 0.16949844360351562, 0.175811767578125, 0.18212509155273438, 0.18843841552734375, 0.19475173950195312, 0.2010650634765625, 0.20737838745117188, 0.21369171142578125, 0.22000503540039062, 0.226318359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 10.0, 11.0, 21.0, 18.0, 30.0, 37.0, 46.0, 53.0, 54.0, 70.0, 89.0, 84.0, 68.0, 61.0, 69.0, 67.0, 50.0, 31.0, 30.0, 23.0, 16.0, 9.0, 13.0, 8.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.11945533752441406, -0.11330032348632812, -0.10714530944824219, -0.10099029541015625, -0.09483528137207031, -0.08868026733398438, -0.08252525329589844, -0.0763702392578125, -0.07021522521972656, -0.06406021118164062, -0.05790519714355469, -0.05175018310546875, -0.04559516906738281, -0.039440155029296875, -0.03328514099121094, -0.027130126953125, -0.020975112915039062, -0.014820098876953125, -0.008665084838867188, -0.00251007080078125, 0.0036449432373046875, 0.009799957275390625, 0.015954971313476562, 0.0221099853515625, 0.028264999389648438, 0.034420013427734375, 0.04057502746582031, 0.04673004150390625, 0.05288505554199219, 0.059040069580078125, 0.06519508361816406, 0.07135009765625, 0.07750511169433594, 0.08366012573242188, 0.08981513977050781, 0.09597015380859375, 0.10212516784667969, 0.10828018188476562, 0.11443519592285156, 0.1205902099609375, 0.12674522399902344, 0.13290023803710938, 0.1390552520751953, 0.14521026611328125, 0.1513652801513672, 0.15752029418945312, 0.16367530822753906, 0.169830322265625, 0.17598533630371094, 0.18214035034179688, 0.1882953643798828, 0.19445037841796875, 0.2006053924560547, 0.20676040649414062, 0.21291542053222656, 0.2190704345703125, 0.22522544860839844, 0.23138046264648438, 0.2375354766845703, 0.24369049072265625, 0.2498455047607422, 0.2560005187988281, 0.26215553283691406, 0.268310546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 20.0, 27.0, 86.0, 177.0, 259.0, 223.0, 105.0, 52.0, 26.0, 10.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.575613975524902, -5.3596601486206055, -5.143706321716309, -4.927752494812012, -4.711798667907715, -4.495844841003418, -4.279891014099121, -4.063937187194824, -3.8479833602905273, -3.6320295333862305, -3.4160757064819336, -3.2001218795776367, -2.98416805267334, -2.768214225769043, -2.552260398864746, -2.336306571960449, -2.1203525066375732, -1.9043986797332764, -1.6884448528289795, -1.4724910259246826, -1.2565371990203857, -1.0405832529067993, -0.8246294260025024, -0.6086755990982056, -0.3927217721939087, -0.17676793038845062, 0.039185911417007446, 0.2551397681236267, 0.4710935950279236, 0.6870474815368652, 0.9030013084411621, 1.118955135345459, 1.3349089622497559, 1.5508627891540527, 1.7668166160583496, 1.9827704429626465, 2.1987242698669434, 2.4146780967712402, 2.630631923675537, 2.846585750579834, 3.062539577484131, 3.2784934043884277, 3.4944472312927246, 3.7104010581970215, 3.9263548851013184, 4.142308712005615, 4.358262538909912, 4.574216365814209, 4.790170669555664, 5.006124496459961, 5.222078323364258, 5.438032150268555, 5.653985977172852, 5.869939804077148, 6.085893630981445, 6.301847457885742, 6.517801284790039, 6.733755111694336, 6.949708938598633, 7.16566276550293, 7.381616592407227, 7.597570419311523, 7.81352424621582, 8.029478073120117, 8.245431900024414]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 10.0, 13.0, 15.0, 12.0, 21.0, 21.0, 24.0, 31.0, 42.0, 43.0, 44.0, 49.0, 39.0, 48.0, 39.0, 48.0, 64.0, 49.0, 31.0, 36.0, 36.0, 35.0, 29.0, 33.0, 29.0, 31.0, 18.0, 10.0, 15.0, 10.0, 12.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.656693935394287, -4.512688636779785, -4.368682861328125, -4.224677562713623, -4.080672264099121, -3.936666488647461, -3.792661190032959, -3.648655652999878, -3.504650115966797, -3.360644578933716, -3.216639280319214, -3.072633743286133, -2.9286282062530518, -2.7846226692199707, -2.6406173706054688, -2.4966118335723877, -2.3526065349578857, -2.2086009979248047, -2.0645956993103027, -1.9205901622772217, -1.7765846252441406, -1.6325792074203491, -1.4885737895965576, -1.3445682525634766, -1.200562834739685, -1.0565574169158936, -0.9125518798828125, -0.768546462059021, -0.6245409846305847, -0.48053550720214844, -0.33653008937835693, -0.19252455234527588, -0.048519134521484375, 0.09548632800579071, 0.2394917905330658, 0.3834972381591797, 0.527502715587616, 0.6715081930160522, 0.8155136108398438, 0.9595191478729248, 1.1035245656967163, 1.2475299835205078, 1.3915355205535889, 1.5355409383773804, 1.6795463562011719, 1.823551893234253, 1.9675573110580444, 2.111562728881836, 2.255568265914917, 2.399573802947998, 2.5435791015625, 2.687584638595581, 2.831590175628662, 2.975595474243164, 3.119601011276245, 3.263606548309326, 3.407611846923828, 3.551617383956909, 3.695622682571411, 3.839628219604492, 3.9836337566375732, 4.127639293670654, 4.271644592285156, 4.415650367736816, 4.559655666351318]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 11.0, 15.0, 18.0, 20.0, 28.0, 35.0, 64.0, 124.0, 205.0, 377.0, 753.0, 1700.0, 5205.0, 27560.0, 1897580.0, 2224042.0, 27734.0, 5435.0, 1790.0, 742.0, 355.0, 188.0, 89.0, 61.0, 43.0, 28.0, 17.0, 15.0, 3.0, 5.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4658203125, -1.4227142333984375, -1.379608154296875, -1.3365020751953125, -1.29339599609375, -1.2502899169921875, -1.207183837890625, -1.1640777587890625, -1.1209716796875, -1.0778656005859375, -1.034759521484375, -0.9916534423828125, -0.94854736328125, -0.9054412841796875, -0.862335205078125, -0.8192291259765625, -0.776123046875, -0.7330169677734375, -0.689910888671875, -0.6468048095703125, -0.60369873046875, -0.5605926513671875, -0.517486572265625, -0.4743804931640625, -0.4312744140625, -0.3881683349609375, -0.345062255859375, -0.3019561767578125, -0.25885009765625, -0.2157440185546875, -0.172637939453125, -0.1295318603515625, -0.08642578125, -0.0433197021484375, -0.000213623046875, 0.0428924560546875, 0.08599853515625, 0.1291046142578125, 0.172210693359375, 0.2153167724609375, 0.2584228515625, 0.3015289306640625, 0.344635009765625, 0.3877410888671875, 0.43084716796875, 0.4739532470703125, 0.517059326171875, 0.5601654052734375, 0.603271484375, 0.6463775634765625, 0.689483642578125, 0.7325897216796875, 0.77569580078125, 0.8188018798828125, 0.861907958984375, 0.9050140380859375, 0.9481201171875, 0.9912261962890625, 1.034332275390625, 1.0774383544921875, 1.12054443359375, 1.1636505126953125, 1.206756591796875, 1.2498626708984375, 1.29296875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 6.0, 8.0, 16.0, 26.0, 26.0, 50.0, 75.0, 106.0, 116.0, 116.0, 114.0, 91.0, 75.0, 80.0, 35.0, 23.0, 16.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.3856163024902344, -0.37377166748046875, -0.3619270324707031, -0.3500823974609375, -0.3382377624511719, -0.32639312744140625, -0.3145484924316406, -0.302703857421875, -0.2908592224121094, -0.27901458740234375, -0.2671699523925781, -0.2553253173828125, -0.24348068237304688, -0.23163604736328125, -0.21979141235351562, -0.20794677734375, -0.19610214233398438, -0.18425750732421875, -0.17241287231445312, -0.1605682373046875, -0.14872360229492188, -0.13687896728515625, -0.12503433227539062, -0.113189697265625, -0.10134506225585938, -0.08950042724609375, -0.07765579223632812, -0.0658111572265625, -0.053966522216796875, -0.04212188720703125, -0.030277252197265625, -0.0184326171875, -0.006587982177734375, 0.00525665283203125, 0.017101287841796875, 0.0289459228515625, 0.040790557861328125, 0.05263519287109375, 0.06447982788085938, 0.076324462890625, 0.08816909790039062, 0.10001373291015625, 0.11185836791992188, 0.1237030029296875, 0.13554763793945312, 0.14739227294921875, 0.15923690795898438, 0.17108154296875, 0.18292617797851562, 0.19477081298828125, 0.20661544799804688, 0.2184600830078125, 0.23030471801757812, 0.24214935302734375, 0.2539939880371094, 0.265838623046875, 0.2776832580566406, 0.28952789306640625, 0.3013725280761719, 0.3132171630859375, 0.3250617980957031, 0.33690643310546875, 0.3487510681152344, 0.360595703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 6.0, 9.0, 9.0, 25.0, 29.0, 46.0, 64.0, 124.0, 224.0, 518.0, 1350.0, 4839.0, 29201.0, 912911.0, 3182606.0, 51711.0, 7270.0, 1963.0, 706.0, 299.0, 140.0, 72.0, 37.0, 42.0, 19.0, 14.0, 11.0, 10.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.880859375, -0.8516082763671875, -0.822357177734375, -0.7931060791015625, -0.76385498046875, -0.7346038818359375, -0.705352783203125, -0.6761016845703125, -0.6468505859375, -0.6175994873046875, -0.588348388671875, -0.5590972900390625, -0.52984619140625, -0.5005950927734375, -0.471343994140625, -0.4420928955078125, -0.412841796875, -0.3835906982421875, -0.354339599609375, -0.3250885009765625, -0.29583740234375, -0.2665863037109375, -0.237335205078125, -0.2080841064453125, -0.1788330078125, -0.1495819091796875, -0.120330810546875, -0.0910797119140625, -0.06182861328125, -0.0325775146484375, -0.003326416015625, 0.0259246826171875, 0.05517578125, 0.0844268798828125, 0.113677978515625, 0.1429290771484375, 0.17218017578125, 0.2014312744140625, 0.230682373046875, 0.2599334716796875, 0.2891845703125, 0.3184356689453125, 0.347686767578125, 0.3769378662109375, 0.40618896484375, 0.4354400634765625, 0.464691162109375, 0.4939422607421875, 0.523193359375, 0.5524444580078125, 0.581695556640625, 0.6109466552734375, 0.64019775390625, 0.6694488525390625, 0.698699951171875, 0.7279510498046875, 0.7572021484375, 0.7864532470703125, 0.815704345703125, 0.8449554443359375, 0.87420654296875, 0.9034576416015625, 0.932708740234375, 0.9619598388671875, 0.9912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 5.0, 21.0, 27.0, 39.0, 74.0, 137.0, 298.0, 923.0, 1612.0, 483.0, 177.0, 104.0, 55.0, 39.0, 23.0, 11.0, 15.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378173828125, -0.36566925048828125, -0.3531646728515625, -0.34066009521484375, -0.328155517578125, -0.31565093994140625, -0.3031463623046875, -0.29064178466796875, -0.27813720703125, -0.26563262939453125, -0.2531280517578125, -0.24062347412109375, -0.228118896484375, -0.21561431884765625, -0.2031097412109375, -0.19060516357421875, -0.1781005859375, -0.16559600830078125, -0.1530914306640625, -0.14058685302734375, -0.128082275390625, -0.11557769775390625, -0.1030731201171875, -0.09056854248046875, -0.07806396484375, -0.06555938720703125, -0.0530548095703125, -0.04055023193359375, -0.028045654296875, -0.01554107666015625, -0.0030364990234375, 0.00946807861328125, 0.02197265625, 0.03447723388671875, 0.0469818115234375, 0.05948638916015625, 0.071990966796875, 0.08449554443359375, 0.0970001220703125, 0.10950469970703125, 0.12200927734375, 0.13451385498046875, 0.1470184326171875, 0.15952301025390625, 0.172027587890625, 0.18453216552734375, 0.1970367431640625, 0.20954132080078125, 0.2220458984375, 0.23455047607421875, 0.2470550537109375, 0.25955963134765625, 0.272064208984375, 0.28456878662109375, 0.2970733642578125, 0.30957794189453125, 0.32208251953125, 0.33458709716796875, 0.3470916748046875, 0.35959625244140625, 0.372100830078125, 0.38460540771484375, 0.3971099853515625, 0.40961456298828125, 0.422119140625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 10.0, 18.0, 80.0, 129.0, 219.0, 235.0, 174.0, 85.0, 30.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7030043601989746, -1.6262515783309937, -1.5494986772537231, -1.4727458953857422, -1.3959929943084717, -1.3192402124404907, -1.2424874305725098, -1.1657345294952393, -1.0889816284179688, -1.0122288465499878, -0.9354759454727173, -0.8587231636047363, -0.7819702625274658, -0.7052174806594849, -0.6284646391868591, -0.5517117977142334, -0.47495901584625244, -0.3982061743736267, -0.321453332901001, -0.24470052123069763, -0.1679476797580719, -0.09119483828544617, -0.014442026615142822, 0.06231081485748291, 0.13906365633010864, 0.21581649780273438, 0.2925693392753601, 0.36932215094566345, 0.4460749924182892, 0.5228278636932373, 0.5995806455612183, 0.676333487033844, 0.7530863285064697, 0.8298391699790955, 0.9065920114517212, 0.9833447933197021, 1.0600976943969727, 1.1368504762649536, 1.2136032581329346, 1.290356159210205, 1.3671090602874756, 1.4438618421554565, 1.520614743232727, 1.597367525100708, 1.6741204261779785, 1.7508732080459595, 1.8276259899139404, 1.904378890991211, 1.981131672859192, 2.057884454727173, 2.1346373558044434, 2.211390256881714, 2.2881429195404053, 2.364895820617676, 2.4416487216949463, 2.518401622772217, 2.595154285430908, 2.6719071865081787, 2.74865984916687, 2.8254127502441406, 2.902165651321411, 2.9789185523986816, 3.055671215057373, 3.1324241161346436, 3.209177017211914]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 7.0, 14.0, 24.0, 27.0, 46.0, 38.0, 41.0, 43.0, 67.0, 59.0, 75.0, 70.0, 73.0, 65.0, 59.0, 63.0, 60.0, 30.0, 36.0, 26.0, 26.0, 11.0, 15.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.881627082824707, -1.8319774866104126, -1.7823278903961182, -1.7326782941818237, -1.6830286979675293, -1.6333791017532349, -1.5837295055389404, -1.534079909324646, -1.4844303131103516, -1.4347807168960571, -1.3851311206817627, -1.3354815244674683, -1.2858319282531738, -1.2361823320388794, -1.186532735824585, -1.1368831396102905, -1.087233543395996, -1.0375839471817017, -0.9879343509674072, -0.9382847547531128, -0.8886351585388184, -0.8389855623245239, -0.7893359661102295, -0.7396863698959351, -0.6900368928909302, -0.6403872966766357, -0.5907377004623413, -0.5410881042480469, -0.49143850803375244, -0.441788911819458, -0.39213934540748596, -0.34248974919319153, -0.2928401231765747, -0.24319052696228027, -0.19354093074798584, -0.1438913494348526, -0.09424175322055817, -0.04459215700626373, 0.005057424306869507, 0.05470702052116394, 0.10435661673545837, 0.1540062129497528, 0.20365580916404724, 0.2533053755760193, 0.3029549717903137, 0.35260456800460815, 0.4022541642189026, 0.451903760433197, 0.5015533566474915, 0.5512029528617859, 0.6008525490760803, 0.6505021452903748, 0.7001517415046692, 0.7498013377189636, 0.7994508743286133, 0.8491004705429077, 0.8987500667572021, 0.9483996629714966, 0.998049259185791, 1.0476988554000854, 1.0973484516143799, 1.1469980478286743, 1.1966476440429688, 1.2462972402572632, 1.2959468364715576]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 6.0, 6.0, 14.0, 25.0, 33.0, 74.0, 100.0, 214.0, 347.0, 728.0, 1361.0, 3182.0, 11057.0, 75068.0, 637980.0, 280081.0, 28118.0, 5913.0, 2123.0, 989.0, 493.0, 278.0, 118.0, 98.0, 52.0, 32.0, 19.0, 14.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.2119140625, -1.176025390625, -1.14013671875, -1.104248046875, -1.068359375, -1.032470703125, -0.99658203125, -0.960693359375, -0.9248046875, -0.888916015625, -0.85302734375, -0.817138671875, -0.78125, -0.745361328125, -0.70947265625, -0.673583984375, -0.6376953125, -0.601806640625, -0.56591796875, -0.530029296875, -0.494140625, -0.458251953125, -0.42236328125, -0.386474609375, -0.3505859375, -0.314697265625, -0.27880859375, -0.242919921875, -0.20703125, -0.171142578125, -0.13525390625, -0.099365234375, -0.0634765625, -0.027587890625, 0.00830078125, 0.044189453125, 0.080078125, 0.115966796875, 0.15185546875, 0.187744140625, 0.2236328125, 0.259521484375, 0.29541015625, 0.331298828125, 0.3671875, 0.403076171875, 0.43896484375, 0.474853515625, 0.5107421875, 0.546630859375, 0.58251953125, 0.618408203125, 0.654296875, 0.690185546875, 0.72607421875, 0.761962890625, 0.7978515625, 0.833740234375, 0.86962890625, 0.905517578125, 0.94140625, 0.977294921875, 1.01318359375, 1.049072265625, 1.0849609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 15.0, 26.0, 29.0, 53.0, 85.0, 94.0, 113.0, 113.0, 109.0, 91.0, 79.0, 63.0, 46.0, 29.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.3745841979980469, -0.36342620849609375, -0.3522682189941406, -0.3411102294921875, -0.3299522399902344, -0.31879425048828125, -0.3076362609863281, -0.296478271484375, -0.2853202819824219, -0.27416229248046875, -0.2630043029785156, -0.2518463134765625, -0.24068832397460938, -0.22953033447265625, -0.21837234497070312, -0.20721435546875, -0.19605636596679688, -0.18489837646484375, -0.17374038696289062, -0.1625823974609375, -0.15142440795898438, -0.14026641845703125, -0.12910842895507812, -0.117950439453125, -0.10679244995117188, -0.09563446044921875, -0.08447647094726562, -0.0733184814453125, -0.062160491943359375, -0.05100250244140625, -0.039844512939453125, -0.0286865234375, -0.017528533935546875, -0.00637054443359375, 0.004787445068359375, 0.0159454345703125, 0.027103424072265625, 0.03826141357421875, 0.049419403076171875, 0.060577392578125, 0.07173538208007812, 0.08289337158203125, 0.09405136108398438, 0.1052093505859375, 0.11636734008789062, 0.12752532958984375, 0.13868331909179688, 0.14984130859375, 0.16099929809570312, 0.17215728759765625, 0.18331527709960938, 0.1944732666015625, 0.20563125610351562, 0.21678924560546875, 0.22794723510742188, 0.239105224609375, 0.2502632141113281, 0.26142120361328125, 0.2725791931152344, 0.2837371826171875, 0.2948951721191406, 0.30605316162109375, 0.3172111511230469, 0.328369140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 5.0, 13.0, 28.0, 17.0, 44.0, 39.0, 70.0, 96.0, 120.0, 200.0, 350.0, 586.0, 1109.0, 2257.0, 5521.0, 15926.0, 59911.0, 232534.0, 450470.0, 204579.0, 51487.0, 14255.0, 4718.0, 1867.0, 851.0, 489.0, 311.0, 199.0, 128.0, 91.0, 66.0, 51.0, 33.0, 35.0, 19.0, 16.0, 12.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.48876953125, -0.4709625244140625, -0.453155517578125, -0.4353485107421875, -0.41754150390625, -0.3997344970703125, -0.381927490234375, -0.3641204833984375, -0.3463134765625, -0.3285064697265625, -0.310699462890625, -0.2928924560546875, -0.27508544921875, -0.2572784423828125, -0.239471435546875, -0.2216644287109375, -0.203857421875, -0.1860504150390625, -0.168243408203125, -0.1504364013671875, -0.13262939453125, -0.1148223876953125, -0.097015380859375, -0.0792083740234375, -0.0614013671875, -0.0435943603515625, -0.025787353515625, -0.0079803466796875, 0.00982666015625, 0.0276336669921875, 0.045440673828125, 0.0632476806640625, 0.0810546875, 0.0988616943359375, 0.116668701171875, 0.1344757080078125, 0.15228271484375, 0.1700897216796875, 0.187896728515625, 0.2057037353515625, 0.2235107421875, 0.2413177490234375, 0.259124755859375, 0.2769317626953125, 0.29473876953125, 0.3125457763671875, 0.330352783203125, 0.3481597900390625, 0.365966796875, 0.3837738037109375, 0.401580810546875, 0.4193878173828125, 0.43719482421875, 0.4550018310546875, 0.472808837890625, 0.4906158447265625, 0.5084228515625, 0.5262298583984375, 0.544036865234375, 0.5618438720703125, 0.57965087890625, 0.5974578857421875, 0.615264892578125, 0.6330718994140625, 0.65087890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 9.0, 14.0, 17.0, 21.0, 21.0, 21.0, 34.0, 31.0, 31.0, 34.0, 49.0, 42.0, 34.0, 41.0, 48.0, 39.0, 44.0, 40.0, 47.0, 43.0, 43.0, 33.0, 36.0, 35.0, 27.0, 24.0, 29.0, 21.0, 5.0, 8.0, 16.0, 9.0, 11.0, 7.0, 6.0, 3.0, 10.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.603363037109375, -0.57684326171875, -0.550323486328125, -0.5238037109375, -0.497283935546875, -0.47076416015625, -0.444244384765625, -0.417724609375, -0.391204833984375, -0.36468505859375, -0.338165283203125, -0.3116455078125, -0.285125732421875, -0.25860595703125, -0.232086181640625, -0.20556640625, -0.179046630859375, -0.15252685546875, -0.126007080078125, -0.0994873046875, -0.072967529296875, -0.04644775390625, -0.019927978515625, 0.006591796875, 0.033111572265625, 0.05963134765625, 0.086151123046875, 0.1126708984375, 0.139190673828125, 0.16571044921875, 0.192230224609375, 0.21875, 0.245269775390625, 0.27178955078125, 0.298309326171875, 0.3248291015625, 0.351348876953125, 0.37786865234375, 0.404388427734375, 0.430908203125, 0.457427978515625, 0.48394775390625, 0.510467529296875, 0.5369873046875, 0.563507080078125, 0.59002685546875, 0.616546630859375, 0.64306640625, 0.669586181640625, 0.69610595703125, 0.722625732421875, 0.7491455078125, 0.775665283203125, 0.80218505859375, 0.828704833984375, 0.855224609375, 0.881744384765625, 0.90826416015625, 0.934783935546875, 0.9613037109375, 0.987823486328125, 1.01434326171875, 1.040863037109375, 1.0673828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 5.0, 3.0, 2.0, 10.0, 14.0, 20.0, 34.0, 64.0, 100.0, 242.0, 560.0, 1719.0, 9706.0, 205023.0, 798473.0, 27634.0, 3360.0, 909.0, 320.0, 151.0, 81.0, 37.0, 24.0, 19.0, 11.0, 12.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66259765625, -0.6443023681640625, -0.626007080078125, -0.6077117919921875, -0.58941650390625, -0.5711212158203125, -0.552825927734375, -0.5345306396484375, -0.5162353515625, -0.4979400634765625, -0.479644775390625, -0.4613494873046875, -0.44305419921875, -0.4247589111328125, -0.406463623046875, -0.3881683349609375, -0.369873046875, -0.3515777587890625, -0.333282470703125, -0.3149871826171875, -0.29669189453125, -0.2783966064453125, -0.260101318359375, -0.2418060302734375, -0.2235107421875, -0.2052154541015625, -0.186920166015625, -0.1686248779296875, -0.15032958984375, -0.1320343017578125, -0.113739013671875, -0.0954437255859375, -0.0771484375, -0.0588531494140625, -0.040557861328125, -0.0222625732421875, -0.00396728515625, 0.0143280029296875, 0.032623291015625, 0.0509185791015625, 0.0692138671875, 0.0875091552734375, 0.105804443359375, 0.1240997314453125, 0.14239501953125, 0.1606903076171875, 0.178985595703125, 0.1972808837890625, 0.215576171875, 0.2338714599609375, 0.252166748046875, 0.2704620361328125, 0.28875732421875, 0.3070526123046875, 0.325347900390625, 0.3436431884765625, 0.3619384765625, 0.3802337646484375, 0.398529052734375, 0.4168243408203125, 0.43511962890625, 0.4534149169921875, 0.471710205078125, 0.4900054931640625, 0.50830078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 8.0, 9.0, 12.0, 13.0, 24.0, 27.0, 25.0, 42.0, 50.0, 82.0, 147.0, 140.0, 114.0, 90.0, 59.0, 29.0, 28.0, 22.0, 15.0, 11.0, 13.0, 8.0, 6.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.00021386146545410156, -0.00020913872867822647, -0.00020441599190235138, -0.0001996932551264763, -0.0001949705183506012, -0.0001902477815747261, -0.000185525044798851, -0.00018080230802297592, -0.00017607957124710083, -0.00017135683447122574, -0.00016663409769535065, -0.00016191136091947556, -0.00015718862414360046, -0.00015246588736772537, -0.00014774315059185028, -0.0001430204138159752, -0.0001382976770401001, -0.000133574940264225, -0.00012885220348834991, -0.00012412946671247482, -0.00011940672993659973, -0.00011468399316072464, -0.00010996125638484955, -0.00010523851960897446, -0.00010051578283309937, -9.579304605722427e-05, -9.107030928134918e-05, -8.634757250547409e-05, -8.1624835729599e-05, -7.690209895372391e-05, -7.217936217784882e-05, -6.745662540197372e-05, -6.273388862609863e-05, -5.801115185022354e-05, -5.328841507434845e-05, -4.856567829847336e-05, -4.3842941522598267e-05, -3.9120204746723175e-05, -3.4397467970848083e-05, -2.9674731194972992e-05, -2.49519944190979e-05, -2.022925764322281e-05, -1.5506520867347717e-05, -1.0783784091472626e-05, -6.061047315597534e-06, -1.3383105397224426e-06, 3.384426236152649e-06, 8.10716301202774e-06, 1.2829899787902832e-05, 1.7552636563777924e-05, 2.2275373339653015e-05, 2.6998110115528107e-05, 3.17208468914032e-05, 3.644358366727829e-05, 4.116632044315338e-05, 4.588905721902847e-05, 5.0611793994903564e-05, 5.5334530770778656e-05, 6.005726754665375e-05, 6.478000432252884e-05, 6.950274109840393e-05, 7.422547787427902e-05, 7.894821465015411e-05, 8.36709514260292e-05, 8.83936882019043e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 9.0, 16.0, 26.0, 31.0, 45.0, 76.0, 139.0, 274.0, 574.0, 1211.0, 2729.0, 8112.0, 39358.0, 536395.0, 415831.0, 31911.0, 6919.0, 2518.0, 1115.0, 536.0, 286.0, 143.0, 88.0, 62.0, 29.0, 22.0, 19.0, 13.0, 8.0, 13.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.38671875, -0.3749809265136719, -0.36324310302734375, -0.3515052795410156, -0.3397674560546875, -0.3280296325683594, -0.31629180908203125, -0.3045539855957031, -0.292816162109375, -0.2810783386230469, -0.26934051513671875, -0.2576026916503906, -0.2458648681640625, -0.23412704467773438, -0.22238922119140625, -0.21065139770507812, -0.19891357421875, -0.18717575073242188, -0.17543792724609375, -0.16370010375976562, -0.1519622802734375, -0.14022445678710938, -0.12848663330078125, -0.11674880981445312, -0.105010986328125, -0.09327316284179688, -0.08153533935546875, -0.06979751586914062, -0.0580596923828125, -0.046321868896484375, -0.03458404541015625, -0.022846221923828125, -0.0111083984375, 0.000629425048828125, 0.01236724853515625, 0.024105072021484375, 0.0358428955078125, 0.047580718994140625, 0.05931854248046875, 0.07105636596679688, 0.082794189453125, 0.09453201293945312, 0.10626983642578125, 0.11800765991210938, 0.1297454833984375, 0.14148330688476562, 0.15322113037109375, 0.16495895385742188, 0.17669677734375, 0.18843460083007812, 0.20017242431640625, 0.21191024780273438, 0.2236480712890625, 0.23538589477539062, 0.24712371826171875, 0.2588615417480469, 0.270599365234375, 0.2823371887207031, 0.29407501220703125, 0.3058128356933594, 0.3175506591796875, 0.3292884826660156, 0.34102630615234375, 0.3527641296386719, 0.364501953125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 14.0, 21.0, 29.0, 43.0, 76.0, 117.0, 160.0, 183.0, 120.0, 81.0, 51.0, 24.0, 19.0, 13.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.456298828125, -0.442901611328125, -0.42950439453125, -0.416107177734375, -0.4027099609375, -0.389312744140625, -0.37591552734375, -0.362518310546875, -0.34912109375, -0.335723876953125, -0.32232666015625, -0.308929443359375, -0.2955322265625, -0.282135009765625, -0.26873779296875, -0.255340576171875, -0.241943359375, -0.228546142578125, -0.21514892578125, -0.201751708984375, -0.1883544921875, -0.174957275390625, -0.16156005859375, -0.148162841796875, -0.134765625, -0.121368408203125, -0.10797119140625, -0.094573974609375, -0.0811767578125, -0.067779541015625, -0.05438232421875, -0.040985107421875, -0.027587890625, -0.014190673828125, -0.00079345703125, 0.012603759765625, 0.0260009765625, 0.039398193359375, 0.05279541015625, 0.066192626953125, 0.07958984375, 0.092987060546875, 0.10638427734375, 0.119781494140625, 0.1331787109375, 0.146575927734375, 0.15997314453125, 0.173370361328125, 0.186767578125, 0.200164794921875, 0.21356201171875, 0.226959228515625, 0.2403564453125, 0.253753662109375, 0.26715087890625, 0.280548095703125, 0.2939453125, 0.307342529296875, 0.32073974609375, 0.334136962890625, 0.3475341796875, 0.360931396484375, 0.37432861328125, 0.387725830078125, 0.401123046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 11.0, 36.0, 107.0, 252.0, 327.0, 175.0, 59.0, 24.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.590028762817383, -14.299755096435547, -14.009482383728027, -13.719208717346191, -13.428936004638672, -13.138662338256836, -12.848388671875, -12.558115005493164, -12.267842292785645, -11.977568626403809, -11.687295913696289, -11.397022247314453, -11.106748580932617, -10.816475868225098, -10.526202201843262, -10.235929489135742, -9.945655822753906, -9.65538215637207, -9.36510944366455, -9.074835777282715, -8.784563064575195, -8.49428939819336, -8.204015731811523, -7.913742542266846, -7.623469352722168, -7.33319616317749, -7.0429229736328125, -6.752649307250977, -6.462376117706299, -6.172102928161621, -5.881829261779785, -5.591556072235107, -5.301283359527588, -5.01101016998291, -4.720736503601074, -4.4304633140563965, -4.140190124511719, -3.849916934967041, -3.559643507003784, -3.2693700790405273, -2.9790968894958496, -2.688823699951172, -2.398550271987915, -2.108276844024658, -1.8180036544799805, -1.5277303457260132, -1.237457036972046, -0.9471836090087891, -0.6569104194641113, -0.36663711071014404, -0.07636380195617676, 0.21390950679779053, 0.5041828155517578, 0.7944561243057251, 1.0847294330596924, 1.3750028610229492, 1.665276050567627, 1.9555493593215942, 2.2458226680755615, 2.5360960960388184, 2.826369285583496, 3.116642475128174, 3.4069159030914307, 3.6971893310546875, 3.9874625205993652]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 8.0, 3.0, 9.0, 9.0, 7.0, 10.0, 13.0, 11.0, 16.0, 25.0, 23.0, 30.0, 37.0, 42.0, 35.0, 39.0, 46.0, 54.0, 63.0, 43.0, 51.0, 49.0, 44.0, 34.0, 41.0, 44.0, 39.0, 37.0, 30.0, 19.0, 16.0, 20.0, 10.0, 13.0, 5.0, 12.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.251791000366211, -4.087995529174805, -3.9242000579833984, -3.760404586791992, -3.596609115600586, -3.4328136444091797, -3.2690181732177734, -3.105222702026367, -2.941427230834961, -2.7776317596435547, -2.6138362884521484, -2.450040817260742, -2.286245346069336, -2.1224498748779297, -1.9586544036865234, -1.7948589324951172, -1.631063461303711, -1.4672679901123047, -1.3034725189208984, -1.1396770477294922, -0.9758815765380859, -0.8120861053466797, -0.6482906341552734, -0.4844951629638672, -0.32069969177246094, -0.1569042205810547, 0.0068912506103515625, 0.1706867218017578, 0.33448219299316406, 0.4982776641845703, 0.6620731353759766, 0.8258686065673828, 0.9896636009216309, 1.153459072113037, 1.3172545433044434, 1.4810500144958496, 1.6448454856872559, 1.808640956878662, 1.9724364280700684, 2.1362318992614746, 2.300027370452881, 2.463822841644287, 2.6276183128356934, 2.7914137840270996, 2.955209255218506, 3.119004726409912, 3.2828001976013184, 3.4465956687927246, 3.610391139984131, 3.774186611175537, 3.9379820823669434, 4.10177755355835, 4.265573024749756, 4.429368495941162, 4.593163967132568, 4.756959438323975, 4.920754909515381, 5.084550380706787, 5.248345851898193, 5.4121413230896, 5.575936794281006, 5.739732265472412, 5.903527736663818, 6.067323207855225, 6.231118679046631]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 19.0, 27.0, 53.0, 106.0, 202.0, 452.0, 1147.0, 4930.0, 47540.0, 4052913.0, 77941.0, 6461.0, 1483.0, 509.0, 235.0, 102.0, 48.0, 39.0, 27.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.241119384765625, -1.19610595703125, -1.151092529296875, -1.1060791015625, -1.061065673828125, -1.01605224609375, -0.971038818359375, -0.926025390625, -0.881011962890625, -0.83599853515625, -0.790985107421875, -0.7459716796875, -0.700958251953125, -0.65594482421875, -0.610931396484375, -0.56591796875, -0.520904541015625, -0.47589111328125, -0.430877685546875, -0.3858642578125, -0.340850830078125, -0.29583740234375, -0.250823974609375, -0.205810546875, -0.160797119140625, -0.11578369140625, -0.070770263671875, -0.0257568359375, 0.019256591796875, 0.06427001953125, 0.109283447265625, 0.154296875, 0.199310302734375, 0.24432373046875, 0.289337158203125, 0.3343505859375, 0.379364013671875, 0.42437744140625, 0.469390869140625, 0.514404296875, 0.559417724609375, 0.60443115234375, 0.649444580078125, 0.6944580078125, 0.739471435546875, 0.78448486328125, 0.829498291015625, 0.87451171875, 0.919525146484375, 0.96453857421875, 1.009552001953125, 1.0545654296875, 1.099578857421875, 1.14459228515625, 1.189605712890625, 1.234619140625, 1.279632568359375, 1.32464599609375, 1.369659423828125, 1.4146728515625, 1.459686279296875, 1.50469970703125, 1.549713134765625, 1.5947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 14.0, 20.0, 33.0, 51.0, 66.0, 76.0, 98.0, 108.0, 125.0, 96.0, 85.0, 75.0, 47.0, 31.0, 16.0, 19.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42138671875, -0.40933990478515625, -0.3972930908203125, -0.38524627685546875, -0.373199462890625, -0.36115264892578125, -0.3491058349609375, -0.33705902099609375, -0.32501220703125, -0.31296539306640625, -0.3009185791015625, -0.28887176513671875, -0.276824951171875, -0.26477813720703125, -0.2527313232421875, -0.24068450927734375, -0.2286376953125, -0.21659088134765625, -0.2045440673828125, -0.19249725341796875, -0.180450439453125, -0.16840362548828125, -0.1563568115234375, -0.14430999755859375, -0.13226318359375, -0.12021636962890625, -0.1081695556640625, -0.09612274169921875, -0.084075927734375, -0.07202911376953125, -0.0599822998046875, -0.04793548583984375, -0.035888671875, -0.02384185791015625, -0.0117950439453125, 0.00025177001953125, 0.012298583984375, 0.02434539794921875, 0.0363922119140625, 0.04843902587890625, 0.06048583984375, 0.07253265380859375, 0.0845794677734375, 0.09662628173828125, 0.108673095703125, 0.12071990966796875, 0.1327667236328125, 0.14481353759765625, 0.1568603515625, 0.16890716552734375, 0.1809539794921875, 0.19300079345703125, 0.205047607421875, 0.21709442138671875, 0.2291412353515625, 0.24118804931640625, 0.25323486328125, 0.26528167724609375, 0.2773284912109375, 0.28937530517578125, 0.301422119140625, 0.31346893310546875, 0.3255157470703125, 0.33756256103515625, 0.349609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 5.0, 6.0, 6.0, 9.0, 21.0, 51.0, 110.0, 311.0, 1021.0, 4545.0, 36470.0, 3410455.0, 717112.0, 20175.0, 2845.0, 706.0, 251.0, 84.0, 40.0, 17.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.8216476440429688, -0.7931976318359375, -0.7647476196289062, -0.736297607421875, -0.7078475952148438, -0.6793975830078125, -0.6509475708007812, -0.62249755859375, -0.5940475463867188, -0.5655975341796875, -0.5371475219726562, -0.508697509765625, -0.48024749755859375, -0.4517974853515625, -0.42334747314453125, -0.3948974609375, -0.36644744873046875, -0.3379974365234375, -0.30954742431640625, -0.281097412109375, -0.25264739990234375, -0.2241973876953125, -0.19574737548828125, -0.16729736328125, -0.13884735107421875, -0.1103973388671875, -0.08194732666015625, -0.053497314453125, -0.02504730224609375, 0.0034027099609375, 0.03185272216796875, 0.060302734375, 0.08875274658203125, 0.1172027587890625, 0.14565277099609375, 0.174102783203125, 0.20255279541015625, 0.2310028076171875, 0.25945281982421875, 0.28790283203125, 0.31635284423828125, 0.3448028564453125, 0.37325286865234375, 0.401702880859375, 0.43015289306640625, 0.4586029052734375, 0.48705291748046875, 0.5155029296875, 0.5439529418945312, 0.5724029541015625, 0.6008529663085938, 0.629302978515625, 0.6577529907226562, 0.6862030029296875, 0.7146530151367188, 0.74310302734375, 0.7715530395507812, 0.8000030517578125, 0.8284530639648438, 0.856903076171875, 0.8853530883789062, 0.9138031005859375, 0.9422531127929688, 0.970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 10.0, 4.0, 12.0, 14.0, 14.0, 23.0, 39.0, 66.0, 107.0, 241.0, 635.0, 1602.0, 701.0, 225.0, 152.0, 78.0, 40.0, 25.0, 20.0, 10.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2164306640625, -0.20934486389160156, -0.20225906372070312, -0.1951732635498047, -0.18808746337890625, -0.1810016632080078, -0.17391586303710938, -0.16683006286621094, -0.1597442626953125, -0.15265846252441406, -0.14557266235351562, -0.1384868621826172, -0.13140106201171875, -0.12431526184082031, -0.11722946166992188, -0.11014366149902344, -0.103057861328125, -0.09597206115722656, -0.08888626098632812, -0.08180046081542969, -0.07471466064453125, -0.06762886047363281, -0.060543060302734375, -0.05345726013183594, -0.0463714599609375, -0.03928565979003906, -0.032199859619140625, -0.025114059448242188, -0.01802825927734375, -0.010942459106445312, -0.003856658935546875, 0.0032291412353515625, 0.01031494140625, 0.017400741577148438, 0.024486541748046875, 0.03157234191894531, 0.03865814208984375, 0.04574394226074219, 0.052829742431640625, 0.05991554260253906, 0.0670013427734375, 0.07408714294433594, 0.08117294311523438, 0.08825874328613281, 0.09534454345703125, 0.10243034362792969, 0.10951614379882812, 0.11660194396972656, 0.123687744140625, 0.13077354431152344, 0.13785934448242188, 0.1449451446533203, 0.15203094482421875, 0.1591167449951172, 0.16620254516601562, 0.17328834533691406, 0.1803741455078125, 0.18745994567871094, 0.19454574584960938, 0.2016315460205078, 0.20871734619140625, 0.2158031463623047, 0.22288894653320312, 0.22997474670410156, 0.237060546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 21.0, 37.0, 50.0, 63.0, 136.0, 146.0, 133.0, 124.0, 112.0, 64.0, 46.0, 21.0, 19.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.381451964378357, -1.3496801853179932, -1.317908525466919, -1.2861367464065552, -1.2543649673461914, -1.2225933074951172, -1.1908215284347534, -1.1590497493743896, -1.1272780895233154, -1.0955063104629517, -1.0637346506118774, -1.0319628715515137, -1.00019109249115, -0.9684193730354309, -0.9366476535797119, -0.9048758745193481, -0.8731040954589844, -0.8413323760032654, -0.8095605969429016, -0.7777888774871826, -0.7460170984268188, -0.7142453789710999, -0.6824736595153809, -0.6507018804550171, -0.6189301609992981, -0.5871584415435791, -0.5553866624832153, -0.5236149430274963, -0.49184319376945496, -0.4600714445114136, -0.4282997250556946, -0.3965279757976532, -0.36475610733032227, -0.3329843580722809, -0.3012126088142395, -0.2694408893585205, -0.23766914010047913, -0.20589739084243774, -0.17412565648555756, -0.14235392212867737, -0.11058217287063599, -0.0788104310631752, -0.047038689255714417, -0.015266947448253632, 0.016504794359207153, 0.048276543617248535, 0.08004827797412872, 0.11182001233100891, 0.1435917615890503, 0.17536351084709167, 0.20713524520397186, 0.23890697956085205, 0.27067872881889343, 0.3024504780769348, 0.3342221975326538, 0.3659939467906952, 0.3977656960487366, 0.42953744530677795, 0.46130919456481934, 0.49308091402053833, 0.5248526334762573, 0.5566244125366211, 0.5883961319923401, 0.6201678514480591, 0.6519396305084229]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 12.0, 7.0, 12.0, 16.0, 20.0, 25.0, 22.0, 20.0, 25.0, 29.0, 45.0, 39.0, 44.0, 51.0, 55.0, 44.0, 55.0, 36.0, 46.0, 52.0, 54.0, 39.0, 30.0, 39.0, 27.0, 41.0, 24.0, 20.0, 23.0, 4.0, 14.0, 5.0, 9.0, 4.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.779086172580719, -0.756797730922699, -0.734509289264679, -0.7122209072113037, -0.6899324655532837, -0.6676440238952637, -0.6453555822372437, -0.6230671405792236, -0.6007787585258484, -0.5784903168678284, -0.5562018752098083, -0.5339134931564331, -0.5116250514984131, -0.48933660984039307, -0.46704816818237305, -0.4447597563266754, -0.4224713146686554, -0.4001828730106354, -0.37789446115493774, -0.3556060194969177, -0.3333176076412201, -0.3110291659832001, -0.28874075412750244, -0.2664523124694824, -0.2441638857126236, -0.22187545895576477, -0.19958703219890594, -0.17729860544204712, -0.1550101637840271, -0.13272175192832947, -0.11043331027030945, -0.08814488351345062, -0.0658564567565918, -0.04356802999973297, -0.021279599517583847, 0.001008830964565277, 0.023297257721424103, 0.04558568447828293, 0.06787411868572235, 0.09016254544258118, 0.11245097219944, 0.13473939895629883, 0.15702782571315765, 0.17931625247001648, 0.2016046941280365, 0.22389310598373413, 0.24618154764175415, 0.26846998929977417, 0.2907584011554718, 0.3130468428134918, 0.33533525466918945, 0.3576236963272095, 0.3799121081829071, 0.4022005498409271, 0.42448896169662476, 0.4467774033546448, 0.4690658450126648, 0.4913542866706848, 0.5136427283287048, 0.5359311103820801, 0.5582195520401001, 0.5805079936981201, 0.6027964353561401, 0.6250848770141602, 0.6473732590675354]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 5.0, 15.0, 7.0, 16.0, 25.0, 34.0, 56.0, 101.0, 111.0, 179.0, 258.0, 390.0, 633.0, 1156.0, 1957.0, 3846.0, 9135.0, 27503.0, 102653.0, 355616.0, 380472.0, 114800.0, 30303.0, 10144.0, 4063.0, 2048.0, 1101.0, 645.0, 420.0, 274.0, 164.0, 112.0, 86.0, 54.0, 52.0, 33.0, 18.0, 19.0, 12.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62353515625, -0.6034469604492188, -0.5833587646484375, -0.5632705688476562, -0.543182373046875, -0.5230941772460938, -0.5030059814453125, -0.48291778564453125, -0.46282958984375, -0.44274139404296875, -0.4226531982421875, -0.40256500244140625, -0.382476806640625, -0.36238861083984375, -0.3423004150390625, -0.32221221923828125, -0.3021240234375, -0.28203582763671875, -0.2619476318359375, -0.24185943603515625, -0.221771240234375, -0.20168304443359375, -0.1815948486328125, -0.16150665283203125, -0.14141845703125, -0.12133026123046875, -0.1012420654296875, -0.08115386962890625, -0.061065673828125, -0.04097747802734375, -0.0208892822265625, -0.00080108642578125, 0.019287109375, 0.03937530517578125, 0.0594635009765625, 0.07955169677734375, 0.099639892578125, 0.11972808837890625, 0.1398162841796875, 0.15990447998046875, 0.17999267578125, 0.20008087158203125, 0.2201690673828125, 0.24025726318359375, 0.260345458984375, 0.28043365478515625, 0.3005218505859375, 0.32061004638671875, 0.3406982421875, 0.36078643798828125, 0.3808746337890625, 0.40096282958984375, 0.421051025390625, 0.44113922119140625, 0.4612274169921875, 0.48131561279296875, 0.50140380859375, 0.5214920043945312, 0.5415802001953125, 0.5616683959960938, 0.581756591796875, 0.6018447875976562, 0.6219329833984375, 0.6420211791992188, 0.662109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 5.0, 7.0, 15.0, 22.0, 40.0, 55.0, 56.0, 82.0, 90.0, 115.0, 113.0, 94.0, 93.0, 66.0, 47.0, 35.0, 18.0, 19.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4068183898925781, -0.39517974853515625, -0.3835411071777344, -0.3719024658203125, -0.3602638244628906, -0.34862518310546875, -0.3369865417480469, -0.325347900390625, -0.3137092590332031, -0.30207061767578125, -0.2904319763183594, -0.2787933349609375, -0.2671546936035156, -0.25551605224609375, -0.24387741088867188, -0.23223876953125, -0.22060012817382812, -0.20896148681640625, -0.19732284545898438, -0.1856842041015625, -0.17404556274414062, -0.16240692138671875, -0.15076828002929688, -0.139129638671875, -0.12749099731445312, -0.11585235595703125, -0.10421371459960938, -0.0925750732421875, -0.08093643188476562, -0.06929779052734375, -0.057659149169921875, -0.0460205078125, -0.034381866455078125, -0.02274322509765625, -0.011104583740234375, 0.0005340576171875, 0.012172698974609375, 0.02381134033203125, 0.035449981689453125, 0.047088623046875, 0.058727264404296875, 0.07036590576171875, 0.08200454711914062, 0.0936431884765625, 0.10528182983398438, 0.11692047119140625, 0.12855911254882812, 0.14019775390625, 0.15183639526367188, 0.16347503662109375, 0.17511367797851562, 0.1867523193359375, 0.19839096069335938, 0.21002960205078125, 0.22166824340820312, 0.233306884765625, 0.24494552612304688, 0.25658416748046875, 0.2682228088378906, 0.2798614501953125, 0.2915000915527344, 0.30313873291015625, 0.3147773742675781, 0.326416015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 22.0, 14.0, 36.0, 51.0, 60.0, 101.0, 136.0, 190.0, 243.0, 427.0, 688.0, 1300.0, 2970.0, 7952.0, 25825.0, 93860.0, 304194.0, 397565.0, 151154.0, 41194.0, 12192.0, 4180.0, 1786.0, 870.0, 484.0, 289.0, 202.0, 146.0, 110.0, 84.0, 45.0, 31.0, 24.0, 17.0, 21.0, 13.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.548828125, -0.5317764282226562, -0.5147247314453125, -0.49767303466796875, -0.480621337890625, -0.46356964111328125, -0.4465179443359375, -0.42946624755859375, -0.41241455078125, -0.39536285400390625, -0.3783111572265625, -0.36125946044921875, -0.344207763671875, -0.32715606689453125, -0.3101043701171875, -0.29305267333984375, -0.2760009765625, -0.25894927978515625, -0.2418975830078125, -0.22484588623046875, -0.207794189453125, -0.19074249267578125, -0.1736907958984375, -0.15663909912109375, -0.13958740234375, -0.12253570556640625, -0.1054840087890625, -0.08843231201171875, -0.071380615234375, -0.05432891845703125, -0.0372772216796875, -0.02022552490234375, -0.003173828125, 0.01387786865234375, 0.0309295654296875, 0.04798126220703125, 0.065032958984375, 0.08208465576171875, 0.0991363525390625, 0.11618804931640625, 0.13323974609375, 0.15029144287109375, 0.1673431396484375, 0.18439483642578125, 0.201446533203125, 0.21849822998046875, 0.2355499267578125, 0.25260162353515625, 0.2696533203125, 0.28670501708984375, 0.3037567138671875, 0.32080841064453125, 0.337860107421875, 0.35491180419921875, 0.3719635009765625, 0.38901519775390625, 0.40606689453125, 0.42311859130859375, 0.4401702880859375, 0.45722198486328125, 0.474273681640625, 0.49132537841796875, 0.5083770751953125, 0.5254287719726562, 0.54248046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 8.0, 12.0, 14.0, 9.0, 17.0, 26.0, 28.0, 20.0, 26.0, 37.0, 35.0, 38.0, 38.0, 36.0, 48.0, 38.0, 38.0, 43.0, 43.0, 49.0, 42.0, 45.0, 26.0, 33.0, 27.0, 24.0, 28.0, 26.0, 20.0, 21.0, 15.0, 6.0, 19.0, 6.0, 5.0, 8.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75244140625, -0.725799560546875, -0.69915771484375, -0.672515869140625, -0.6458740234375, -0.619232177734375, -0.59259033203125, -0.565948486328125, -0.539306640625, -0.512664794921875, -0.48602294921875, -0.459381103515625, -0.4327392578125, -0.406097412109375, -0.37945556640625, -0.352813720703125, -0.326171875, -0.299530029296875, -0.27288818359375, -0.246246337890625, -0.2196044921875, -0.192962646484375, -0.16632080078125, -0.139678955078125, -0.113037109375, -0.086395263671875, -0.05975341796875, -0.033111572265625, -0.0064697265625, 0.020172119140625, 0.04681396484375, 0.073455810546875, 0.10009765625, 0.126739501953125, 0.15338134765625, 0.180023193359375, 0.2066650390625, 0.233306884765625, 0.25994873046875, 0.286590576171875, 0.313232421875, 0.339874267578125, 0.36651611328125, 0.393157958984375, 0.4197998046875, 0.446441650390625, 0.47308349609375, 0.499725341796875, 0.5263671875, 0.553009033203125, 0.57965087890625, 0.606292724609375, 0.6329345703125, 0.659576416015625, 0.68621826171875, 0.712860107421875, 0.739501953125, 0.766143798828125, 0.79278564453125, 0.819427490234375, 0.8460693359375, 0.872711181640625, 0.89935302734375, 0.925994873046875, 0.95263671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 17.0, 26.0, 22.0, 41.0, 74.0, 133.0, 197.0, 451.0, 966.0, 2279.0, 6424.0, 22278.0, 118461.0, 541908.0, 290317.0, 47189.0, 11110.0, 3763.0, 1522.0, 626.0, 301.0, 166.0, 105.0, 46.0, 33.0, 26.0, 20.0, 7.0, 6.0, 12.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.304443359375, -0.29637718200683594, -0.2883110046386719, -0.2802448272705078, -0.27217864990234375, -0.2641124725341797, -0.2560462951660156, -0.24798011779785156, -0.2399139404296875, -0.23184776306152344, -0.22378158569335938, -0.2157154083251953, -0.20764923095703125, -0.1995830535888672, -0.19151687622070312, -0.18345069885253906, -0.175384521484375, -0.16731834411621094, -0.15925216674804688, -0.1511859893798828, -0.14311981201171875, -0.1350536346435547, -0.12698745727539062, -0.11892127990722656, -0.1108551025390625, -0.10278892517089844, -0.09472274780273438, -0.08665657043457031, -0.07859039306640625, -0.07052421569824219, -0.062458038330078125, -0.05439186096191406, -0.04632568359375, -0.03825950622558594, -0.030193328857421875, -0.022127151489257812, -0.01406097412109375, -0.0059947967529296875, 0.002071380615234375, 0.010137557983398438, 0.0182037353515625, 0.026269912719726562, 0.034336090087890625, 0.04240226745605469, 0.05046844482421875, 0.05853462219238281, 0.06660079956054688, 0.07466697692871094, 0.082733154296875, 0.09079933166503906, 0.09886550903320312, 0.10693168640136719, 0.11499786376953125, 0.12306404113769531, 0.13113021850585938, 0.13919639587402344, 0.1472625732421875, 0.15532875061035156, 0.16339492797851562, 0.1714611053466797, 0.17952728271484375, 0.1875934600830078, 0.19565963745117188, 0.20372581481933594, 0.2117919921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 21.0, 20.0, 23.0, 32.0, 40.0, 35.0, 48.0, 74.0, 101.0, 131.0, 124.0, 74.0, 59.0, 43.0, 34.0, 27.0, 24.0, 24.0, 17.0, 7.0, 6.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.863210678100586e-05, -8.411053568124771e-05, -7.958896458148956e-05, -7.506739348173141e-05, -7.054582238197327e-05, -6.602425128221512e-05, -6.150268018245697e-05, -5.698110908269882e-05, -5.2459537982940674e-05, -4.7937966883182526e-05, -4.341639578342438e-05, -3.889482468366623e-05, -3.437325358390808e-05, -2.9851682484149933e-05, -2.5330111384391785e-05, -2.0808540284633636e-05, -1.6286969184875488e-05, -1.176539808511734e-05, -7.243826985359192e-06, -2.7222558856010437e-06, 1.7993152141571045e-06, 6.320886313915253e-06, 1.0842457413673401e-05, 1.536402851343155e-05, 1.9885599613189697e-05, 2.4407170712947845e-05, 2.8928741812705994e-05, 3.345031291246414e-05, 3.797188401222229e-05, 4.249345511198044e-05, 4.7015026211738586e-05, 5.1536597311496735e-05, 5.605816841125488e-05, 6.057973951101303e-05, 6.510131061077118e-05, 6.962288171052933e-05, 7.414445281028748e-05, 7.866602391004562e-05, 8.318759500980377e-05, 8.770916610956192e-05, 9.223073720932007e-05, 9.675230830907822e-05, 0.00010127387940883636, 0.00010579545050859451, 0.00011031702160835266, 0.00011483859270811081, 0.00011936016380786896, 0.0001238817349076271, 0.00012840330600738525, 0.0001329248771071434, 0.00013744644820690155, 0.0001419680193066597, 0.00014648959040641785, 0.000151011161506176, 0.00015553273260593414, 0.0001600543037056923, 0.00016457587480545044, 0.0001690974459052086, 0.00017361901700496674, 0.00017814058810472488, 0.00018266215920448303, 0.00018718373030424118, 0.00019170530140399933, 0.00019622687250375748, 0.00020074844360351562]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 16.0, 24.0, 16.0, 34.0, 35.0, 70.0, 128.0, 208.0, 399.0, 762.0, 2021.0, 5983.0, 23229.0, 136483.0, 639459.0, 197477.0, 30628.0, 7281.0, 2355.0, 915.0, 395.0, 230.0, 145.0, 75.0, 48.0, 33.0, 21.0, 26.0, 9.0, 9.0, 11.0, 8.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2624168395996094, -0.25383758544921875, -0.24525833129882812, -0.2366790771484375, -0.22809982299804688, -0.21952056884765625, -0.21094131469726562, -0.202362060546875, -0.19378280639648438, -0.18520355224609375, -0.17662429809570312, -0.1680450439453125, -0.15946578979492188, -0.15088653564453125, -0.14230728149414062, -0.13372802734375, -0.12514877319335938, -0.11656951904296875, -0.10799026489257812, -0.0994110107421875, -0.09083175659179688, -0.08225250244140625, -0.07367324829101562, -0.065093994140625, -0.056514739990234375, -0.04793548583984375, -0.039356231689453125, -0.0307769775390625, -0.022197723388671875, -0.01361846923828125, -0.005039215087890625, 0.0035400390625, 0.012119293212890625, 0.02069854736328125, 0.029277801513671875, 0.0378570556640625, 0.046436309814453125, 0.05501556396484375, 0.06359481811523438, 0.072174072265625, 0.08075332641601562, 0.08933258056640625, 0.09791183471679688, 0.1064910888671875, 0.11507034301757812, 0.12364959716796875, 0.13222885131835938, 0.14080810546875, 0.14938735961914062, 0.15796661376953125, 0.16654586791992188, 0.1751251220703125, 0.18370437622070312, 0.19228363037109375, 0.20086288452148438, 0.209442138671875, 0.21802139282226562, 0.22660064697265625, 0.23517990112304688, 0.2437591552734375, 0.2523384094238281, 0.26091766357421875, 0.2694969177246094, 0.278076171875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 3.0, 7.0, 5.0, 19.0, 14.0, 21.0, 19.0, 28.0, 28.0, 43.0, 56.0, 51.0, 72.0, 74.0, 66.0, 70.0, 73.0, 81.0, 51.0, 43.0, 20.0, 35.0, 18.0, 16.0, 12.0, 11.0, 9.0, 8.0, 2.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.16108322143554688, -0.15480804443359375, -0.14853286743164062, -0.1422576904296875, -0.13598251342773438, -0.12970733642578125, -0.12343215942382812, -0.117156982421875, -0.11088180541992188, -0.10460662841796875, -0.09833145141601562, -0.0920562744140625, -0.08578109741210938, -0.07950592041015625, -0.07323074340820312, -0.06695556640625, -0.060680389404296875, -0.05440521240234375, -0.048130035400390625, -0.0418548583984375, -0.035579681396484375, -0.02930450439453125, -0.023029327392578125, -0.016754150390625, -0.010478973388671875, -0.00420379638671875, 0.002071380615234375, 0.0083465576171875, 0.014621734619140625, 0.02089691162109375, 0.027172088623046875, 0.033447265625, 0.039722442626953125, 0.04599761962890625, 0.052272796630859375, 0.0585479736328125, 0.06482315063476562, 0.07109832763671875, 0.07737350463867188, 0.083648681640625, 0.08992385864257812, 0.09619903564453125, 0.10247421264648438, 0.1087493896484375, 0.11502456665039062, 0.12129974365234375, 0.12757492065429688, 0.13385009765625, 0.14012527465820312, 0.14640045166015625, 0.15267562866210938, 0.1589508056640625, 0.16522598266601562, 0.17150115966796875, 0.17777633666992188, 0.184051513671875, 0.19032669067382812, 0.19660186767578125, 0.20287704467773438, 0.2091522216796875, 0.21542739868164062, 0.22170257568359375, 0.22797775268554688, 0.2342529296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 10.0, 27.0, 62.0, 113.0, 228.0, 270.0, 150.0, 70.0, 38.0, 15.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.998574256896973, -8.744024276733398, -8.489473342895508, -8.234923362731934, -7.980372905731201, -7.725822448730469, -7.4712724685668945, -7.216722011566162, -6.96217155456543, -6.707621097564697, -6.453070640563965, -6.198520660400391, -5.943970203399658, -5.689419746398926, -5.434869766235352, -5.180319309234619, -4.925768852233887, -4.671218395233154, -4.416667938232422, -4.162117958068848, -3.9075675010681152, -3.653017044067383, -3.3984668254852295, -3.143916606903076, -2.8893661499023438, -2.6348156929016113, -2.380265474319458, -2.1257152557373047, -1.8711647987365723, -1.6166144609451294, -1.3620641231536865, -1.1075137853622437, -0.852963924407959, -0.5984135866165161, -0.34386324882507324, -0.08931291103363037, 0.1652374267578125, 0.41978776454925537, 0.6743381023406982, 0.9288884401321411, 1.183438777923584, 1.4379891157150269, 1.6925394535064697, 1.9470897912979126, 2.2016401290893555, 2.456190586090088, 2.710740804672241, 2.9652910232543945, 3.219841480255127, 3.4743919372558594, 3.7289421558380127, 3.983492374420166, 4.238042831420898, 4.492593288421631, 4.747143745422363, 5.0016937255859375, 5.25624418258667, 5.510794639587402, 5.765344619750977, 6.019895076751709, 6.274445533752441, 6.528995990753174, 6.783546447753906, 7.0380964279174805, 7.292646884918213]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 0.0, 3.0, 3.0, 8.0, 8.0, 13.0, 13.0, 18.0, 10.0, 19.0, 17.0, 29.0, 21.0, 28.0, 30.0, 31.0, 44.0, 26.0, 30.0, 58.0, 42.0, 33.0, 41.0, 48.0, 39.0, 37.0, 31.0, 40.0, 25.0, 34.0, 26.0, 23.0, 35.0, 21.0, 26.0, 19.0, 14.0, 9.0, 14.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.910027027130127, -4.753077507019043, -4.596127510070801, -4.439177989959717, -4.282228469848633, -4.125278949737549, -3.9683289527893066, -3.8113794326782227, -3.6544299125671387, -3.4974801540374756, -3.3405306339263916, -3.1835808753967285, -3.0266313552856445, -2.8696815967559814, -2.7127318382263184, -2.5557823181152344, -2.3988325595855713, -2.241882801055908, -2.084933280944824, -1.9279835224151611, -1.7710340023040771, -1.614084243774414, -1.4571346044540405, -1.300184965133667, -1.1432353258132935, -0.9862856864929199, -0.8293360471725464, -0.6723863482475281, -0.5154367089271545, -0.358487069606781, -0.2015373706817627, -0.04458773136138916, 0.11236190795898438, 0.2693115472793579, 0.42626121640205383, 0.5832108855247498, 0.7401605248451233, 0.8971101641654968, 1.0540598630905151, 1.2110095024108887, 1.3679591417312622, 1.5249087810516357, 1.6818584203720093, 1.8388080596923828, 1.995757818222046, 2.15270733833313, 2.309657096862793, 2.466606616973877, 2.62355637550354, 2.780506134033203, 2.937455654144287, 3.09440541267395, 3.251354932785034, 3.4083046913146973, 3.5652542114257812, 3.7222039699554443, 3.8791537284851074, 4.036103248596191, 4.193053245544434, 4.350002765655518, 4.506952285766602, 4.6639018058776855, 4.820851802825928, 4.977801322937012, 5.134750843048096]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 3.0, 3.0, 11.0, 11.0, 14.0, 26.0, 34.0, 29.0, 77.0, 113.0, 147.0, 258.0, 454.0, 876.0, 1870.0, 4896.0, 15929.0, 94407.0, 3765749.0, 270563.0, 26962.0, 6916.0, 2476.0, 1112.0, 563.0, 259.0, 175.0, 105.0, 79.0, 55.0, 33.0, 24.0, 14.0, 9.0, 9.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.93896484375, -0.9118881225585938, -0.8848114013671875, -0.8577346801757812, -0.830657958984375, -0.8035812377929688, -0.7765045166015625, -0.7494277954101562, -0.72235107421875, -0.6952743530273438, -0.6681976318359375, -0.6411209106445312, -0.614044189453125, -0.5869674682617188, -0.5598907470703125, -0.5328140258789062, -0.5057373046875, -0.47866058349609375, -0.4515838623046875, -0.42450714111328125, -0.397430419921875, -0.37035369873046875, -0.3432769775390625, -0.31620025634765625, -0.28912353515625, -0.26204681396484375, -0.2349700927734375, -0.20789337158203125, -0.180816650390625, -0.15373992919921875, -0.1266632080078125, -0.09958648681640625, -0.072509765625, -0.04543304443359375, -0.0183563232421875, 0.00872039794921875, 0.035797119140625, 0.06287384033203125, 0.0899505615234375, 0.11702728271484375, 0.14410400390625, 0.17118072509765625, 0.1982574462890625, 0.22533416748046875, 0.252410888671875, 0.27948760986328125, 0.3065643310546875, 0.33364105224609375, 0.3607177734375, 0.38779449462890625, 0.4148712158203125, 0.44194793701171875, 0.469024658203125, 0.49610137939453125, 0.5231781005859375, 0.5502548217773438, 0.57733154296875, 0.6044082641601562, 0.6314849853515625, 0.6585617065429688, 0.685638427734375, 0.7127151489257812, 0.7397918701171875, 0.7668685913085938, 0.7939453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 16.0, 20.0, 25.0, 48.0, 62.0, 64.0, 92.0, 94.0, 75.0, 111.0, 87.0, 69.0, 81.0, 37.0, 31.0, 30.0, 13.0, 6.0, 9.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443603515625, -0.4311180114746094, -0.41863250732421875, -0.4061470031738281, -0.3936614990234375, -0.3811759948730469, -0.36869049072265625, -0.3562049865722656, -0.343719482421875, -0.3312339782714844, -0.31874847412109375, -0.3062629699707031, -0.2937774658203125, -0.2812919616699219, -0.26880645751953125, -0.2563209533691406, -0.24383544921875, -0.23134994506835938, -0.21886444091796875, -0.20637893676757812, -0.1938934326171875, -0.18140792846679688, -0.16892242431640625, -0.15643692016601562, -0.143951416015625, -0.13146591186523438, -0.11898040771484375, -0.10649490356445312, -0.0940093994140625, -0.08152389526367188, -0.06903839111328125, -0.056552886962890625, -0.0440673828125, -0.031581878662109375, -0.01909637451171875, -0.006610870361328125, 0.0058746337890625, 0.018360137939453125, 0.03084564208984375, 0.043331146240234375, 0.055816650390625, 0.06830215454101562, 0.08078765869140625, 0.09327316284179688, 0.1057586669921875, 0.11824417114257812, 0.13072967529296875, 0.14321517944335938, 0.15570068359375, 0.16818618774414062, 0.18067169189453125, 0.19315719604492188, 0.2056427001953125, 0.21812820434570312, 0.23061370849609375, 0.24309921264648438, 0.255584716796875, 0.2680702209472656, 0.28055572509765625, 0.2930412292480469, 0.3055267333984375, 0.3180122375488281, 0.33049774169921875, 0.3429832458496094, 0.35546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 11.0, 32.0, 81.0, 256.0, 776.0, 3455.0, 35933.0, 3924463.0, 218055.0, 8765.0, 1654.0, 524.0, 149.0, 59.0, 19.0, 18.0, 3.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1497955322265625, -1.111114501953125, -1.0724334716796875, -1.03375244140625, -0.9950714111328125, -0.956390380859375, -0.9177093505859375, -0.8790283203125, -0.8403472900390625, -0.801666259765625, -0.7629852294921875, -0.72430419921875, -0.6856231689453125, -0.646942138671875, -0.6082611083984375, -0.569580078125, -0.5308990478515625, -0.492218017578125, -0.4535369873046875, -0.41485595703125, -0.3761749267578125, -0.337493896484375, -0.2988128662109375, -0.2601318359375, -0.2214508056640625, -0.182769775390625, -0.1440887451171875, -0.10540771484375, -0.0667266845703125, -0.028045654296875, 0.0106353759765625, 0.04931640625, 0.0879974365234375, 0.126678466796875, 0.1653594970703125, 0.20404052734375, 0.2427215576171875, 0.281402587890625, 0.3200836181640625, 0.3587646484375, 0.3974456787109375, 0.436126708984375, 0.4748077392578125, 0.51348876953125, 0.5521697998046875, 0.590850830078125, 0.6295318603515625, 0.668212890625, 0.7068939208984375, 0.745574951171875, 0.7842559814453125, 0.82293701171875, 0.8616180419921875, 0.900299072265625, 0.9389801025390625, 0.9776611328125, 1.0163421630859375, 1.055023193359375, 1.0937042236328125, 1.13238525390625, 1.1710662841796875, 1.209747314453125, 1.2484283447265625, 1.287109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 3.0, 8.0, 14.0, 18.0, 37.0, 42.0, 78.0, 150.0, 457.0, 1600.0, 1011.0, 305.0, 118.0, 79.0, 37.0, 26.0, 21.0, 21.0, 10.0, 5.0, 4.0, 9.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.297607421875, -0.2869110107421875, -0.276214599609375, -0.2655181884765625, -0.25482177734375, -0.2441253662109375, -0.233428955078125, -0.2227325439453125, -0.2120361328125, -0.2013397216796875, -0.190643310546875, -0.1799468994140625, -0.16925048828125, -0.1585540771484375, -0.147857666015625, -0.1371612548828125, -0.12646484375, -0.1157684326171875, -0.105072021484375, -0.0943756103515625, -0.08367919921875, -0.0729827880859375, -0.062286376953125, -0.0515899658203125, -0.0408935546875, -0.0301971435546875, -0.019500732421875, -0.0088043212890625, 0.00189208984375, 0.0125885009765625, 0.023284912109375, 0.0339813232421875, 0.044677734375, 0.0553741455078125, 0.066070556640625, 0.0767669677734375, 0.08746337890625, 0.0981597900390625, 0.108856201171875, 0.1195526123046875, 0.1302490234375, 0.1409454345703125, 0.151641845703125, 0.1623382568359375, 0.17303466796875, 0.1837310791015625, 0.194427490234375, 0.2051239013671875, 0.2158203125, 0.2265167236328125, 0.237213134765625, 0.2479095458984375, 0.25860595703125, 0.2693023681640625, 0.279998779296875, 0.2906951904296875, 0.3013916015625, 0.3120880126953125, 0.322784423828125, 0.3334808349609375, 0.34417724609375, 0.3548736572265625, 0.365570068359375, 0.3762664794921875, 0.386962890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 10.0, 98.0, 364.0, 378.0, 127.0, 20.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3329033851623535, -1.1986160278320312, -1.0643285512924194, -0.9300411343574524, -0.7957537174224854, -0.6614663004875183, -0.5271788835525513, -0.39289146661758423, -0.2586040496826172, -0.12431663274765015, 0.009970784187316895, 0.14425820112228394, 0.278545618057251, 0.412833034992218, 0.5471204519271851, 0.6814078688621521, 0.8156952857971191, 0.9499827027320862, 1.0842701196670532, 1.218557596206665, 1.3528449535369873, 1.4871323108673096, 1.6214197874069214, 1.7557072639465332, 1.8899946212768555, 2.0242819786071777, 2.1585693359375, 2.2928569316864014, 2.4271442890167236, 2.561431646347046, 2.6957192420959473, 2.8300065994262695, 2.96429443359375, 3.0985817909240723, 3.2328691482543945, 3.367156744003296, 3.501444101333618, 3.6357314586639404, 3.770019054412842, 3.904306411743164, 4.038593769073486, 4.172881126403809, 4.307168483734131, 4.441455841064453, 4.575743675231934, 4.710031032562256, 4.844318389892578, 4.9786057472229, 5.112893104553223, 5.247180461883545, 5.381467819213867, 5.5157551765441895, 5.650042533874512, 5.784330368041992, 5.9186177253723145, 6.052905082702637, 6.187192440032959, 6.321479797363281, 6.4557671546936035, 6.590054512023926, 6.724342346191406, 6.8586297035217285, 6.992917060852051, 7.127204418182373, 7.261491775512695]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 11.0, 1.0, 15.0, 12.0, 20.0, 21.0, 27.0, 31.0, 33.0, 41.0, 51.0, 39.0, 52.0, 66.0, 80.0, 51.0, 53.0, 55.0, 60.0, 59.0, 46.0, 37.0, 35.0, 27.0, 19.0, 14.0, 14.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5803892612457275, -1.5391221046447754, -1.4978550672531128, -1.4565880298614502, -1.415320873260498, -1.374053716659546, -1.3327866792678833, -1.2915196418762207, -1.2502524852752686, -1.2089853286743164, -1.1677182912826538, -1.1264512538909912, -1.085184097290039, -1.043916940689087, -1.0026499032974243, -0.9613828063011169, -0.9201157093048096, -0.8788486123085022, -0.8375815153121948, -0.7963144183158875, -0.7550473213195801, -0.7137802243232727, -0.6725131273269653, -0.631246030330658, -0.5899789333343506, -0.5487118363380432, -0.5074447393417358, -0.46617764234542847, -0.4249105453491211, -0.3836434483528137, -0.34237635135650635, -0.301109254360199, -0.25984203815460205, -0.21857494115829468, -0.1773078441619873, -0.13604074716567993, -0.09477365016937256, -0.053506553173065186, -0.012239456176757812, 0.02902764081954956, 0.07029473781585693, 0.1115618348121643, 0.15282893180847168, 0.19409602880477905, 0.23536312580108643, 0.2766302227973938, 0.31789731979370117, 0.35916441679000854, 0.4004315137863159, 0.4416986107826233, 0.48296570777893066, 0.524232804775238, 0.5654999017715454, 0.6067669987678528, 0.6480340957641602, 0.6893011927604675, 0.7305682897567749, 0.7718353867530823, 0.8131024837493896, 0.854369580745697, 0.8956366777420044, 0.9369037747383118, 0.9781708717346191, 1.0194380283355713, 1.0607050657272339]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 4.0, 4.0, 9.0, 6.0, 7.0, 8.0, 23.0, 26.0, 27.0, 54.0, 78.0, 115.0, 208.0, 331.0, 558.0, 1006.0, 2231.0, 5225.0, 17180.0, 79217.0, 507642.0, 357564.0, 55463.0, 13124.0, 4387.0, 1874.0, 923.0, 493.0, 274.0, 168.0, 107.0, 66.0, 45.0, 35.0, 14.0, 15.0, 10.0, 6.0, 5.0, 11.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.94189453125, -0.9149017333984375, -0.887908935546875, -0.8609161376953125, -0.83392333984375, -0.8069305419921875, -0.779937744140625, -0.7529449462890625, -0.7259521484375, -0.6989593505859375, -0.671966552734375, -0.6449737548828125, -0.61798095703125, -0.5909881591796875, -0.563995361328125, -0.5370025634765625, -0.510009765625, -0.4830169677734375, -0.456024169921875, -0.4290313720703125, -0.40203857421875, -0.3750457763671875, -0.348052978515625, -0.3210601806640625, -0.2940673828125, -0.2670745849609375, -0.240081787109375, -0.2130889892578125, -0.18609619140625, -0.1591033935546875, -0.132110595703125, -0.1051177978515625, -0.078125, -0.0511322021484375, -0.024139404296875, 0.0028533935546875, 0.02984619140625, 0.0568389892578125, 0.083831787109375, 0.1108245849609375, 0.1378173828125, 0.1648101806640625, 0.191802978515625, 0.2187957763671875, 0.24578857421875, 0.2727813720703125, 0.299774169921875, 0.3267669677734375, 0.353759765625, 0.3807525634765625, 0.407745361328125, 0.4347381591796875, 0.46173095703125, 0.4887237548828125, 0.515716552734375, 0.5427093505859375, 0.5697021484375, 0.5966949462890625, 0.623687744140625, 0.6506805419921875, 0.67767333984375, 0.7046661376953125, 0.731658935546875, 0.7586517333984375, 0.78564453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 10.0, 19.0, 26.0, 33.0, 46.0, 63.0, 86.0, 96.0, 89.0, 73.0, 102.0, 87.0, 72.0, 53.0, 43.0, 31.0, 27.0, 6.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.4179344177246094, -0.40569305419921875, -0.3934516906738281, -0.3812103271484375, -0.3689689636230469, -0.35672760009765625, -0.3444862365722656, -0.332244873046875, -0.3200035095214844, -0.30776214599609375, -0.2955207824707031, -0.2832794189453125, -0.2710380554199219, -0.25879669189453125, -0.24655532836914062, -0.23431396484375, -0.22207260131835938, -0.20983123779296875, -0.19758987426757812, -0.1853485107421875, -0.17310714721679688, -0.16086578369140625, -0.14862442016601562, -0.136383056640625, -0.12414169311523438, -0.11190032958984375, -0.09965896606445312, -0.0874176025390625, -0.07517623901367188, -0.06293487548828125, -0.050693511962890625, -0.0384521484375, -0.026210784912109375, -0.01396942138671875, -0.001728057861328125, 0.0105133056640625, 0.022754669189453125, 0.03499603271484375, 0.047237396240234375, 0.059478759765625, 0.07172012329101562, 0.08396148681640625, 0.09620285034179688, 0.1084442138671875, 0.12068557739257812, 0.13292694091796875, 0.14516830444335938, 0.15740966796875, 0.16965103149414062, 0.18189239501953125, 0.19413375854492188, 0.2063751220703125, 0.21861648559570312, 0.23085784912109375, 0.24309921264648438, 0.255340576171875, 0.2675819396972656, 0.27982330322265625, 0.2920646667480469, 0.3043060302734375, 0.3165473937988281, 0.32878875732421875, 0.3410301208496094, 0.353271484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 5.0, 5.0, 14.0, 17.0, 17.0, 21.0, 23.0, 33.0, 59.0, 76.0, 108.0, 163.0, 248.0, 551.0, 1309.0, 3607.0, 15611.0, 116072.0, 714794.0, 167551.0, 20876.0, 4481.0, 1395.0, 622.0, 300.0, 173.0, 100.0, 71.0, 53.0, 30.0, 32.0, 40.0, 25.0, 14.0, 9.0, 10.0, 11.0, 7.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.05859375, -1.028839111328125, -0.99908447265625, -0.969329833984375, -0.9395751953125, -0.909820556640625, -0.88006591796875, -0.850311279296875, -0.820556640625, -0.790802001953125, -0.76104736328125, -0.731292724609375, -0.7015380859375, -0.671783447265625, -0.64202880859375, -0.612274169921875, -0.58251953125, -0.552764892578125, -0.52301025390625, -0.493255615234375, -0.4635009765625, -0.433746337890625, -0.40399169921875, -0.374237060546875, -0.344482421875, -0.314727783203125, -0.28497314453125, -0.255218505859375, -0.2254638671875, -0.195709228515625, -0.16595458984375, -0.136199951171875, -0.1064453125, -0.076690673828125, -0.04693603515625, -0.017181396484375, 0.0125732421875, 0.042327880859375, 0.07208251953125, 0.101837158203125, 0.131591796875, 0.161346435546875, 0.19110107421875, 0.220855712890625, 0.2506103515625, 0.280364990234375, 0.31011962890625, 0.339874267578125, 0.36962890625, 0.399383544921875, 0.42913818359375, 0.458892822265625, 0.4886474609375, 0.518402099609375, 0.54815673828125, 0.577911376953125, 0.607666015625, 0.637420654296875, 0.66717529296875, 0.696929931640625, 0.7266845703125, 0.756439208984375, 0.78619384765625, 0.815948486328125, 0.845703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 7.0, 7.0, 19.0, 11.0, 15.0, 13.0, 21.0, 23.0, 32.0, 45.0, 49.0, 42.0, 56.0, 48.0, 57.0, 49.0, 62.0, 51.0, 73.0, 47.0, 42.0, 47.0, 32.0, 29.0, 23.0, 14.0, 19.0, 7.0, 8.0, 8.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2265625, -1.1919403076171875, -1.157318115234375, -1.1226959228515625, -1.08807373046875, -1.0534515380859375, -1.018829345703125, -0.9842071533203125, -0.9495849609375, -0.9149627685546875, -0.880340576171875, -0.8457183837890625, -0.81109619140625, -0.7764739990234375, -0.741851806640625, -0.7072296142578125, -0.672607421875, -0.6379852294921875, -0.603363037109375, -0.5687408447265625, -0.53411865234375, -0.4994964599609375, -0.464874267578125, -0.4302520751953125, -0.3956298828125, -0.3610076904296875, -0.326385498046875, -0.2917633056640625, -0.25714111328125, -0.2225189208984375, -0.187896728515625, -0.1532745361328125, -0.11865234375, -0.0840301513671875, -0.049407958984375, -0.0147857666015625, 0.01983642578125, 0.0544586181640625, 0.089080810546875, 0.1237030029296875, 0.1583251953125, 0.1929473876953125, 0.227569580078125, 0.2621917724609375, 0.29681396484375, 0.3314361572265625, 0.366058349609375, 0.4006805419921875, 0.435302734375, 0.4699249267578125, 0.504547119140625, 0.5391693115234375, 0.57379150390625, 0.6084136962890625, 0.643035888671875, 0.6776580810546875, 0.7122802734375, 0.7469024658203125, 0.781524658203125, 0.8161468505859375, 0.85076904296875, 0.8853912353515625, 0.920013427734375, 0.9546356201171875, 0.9892578125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 8.0, 12.0, 21.0, 15.0, 31.0, 46.0, 92.0, 174.0, 259.0, 542.0, 1338.0, 4021.0, 16535.0, 99089.0, 736906.0, 158257.0, 22764.0, 5303.0, 1739.0, 651.0, 295.0, 165.0, 110.0, 61.0, 39.0, 23.0, 11.0, 8.0, 7.0, 3.0, 9.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.264404296875, -0.2557640075683594, -0.24712371826171875, -0.23848342895507812, -0.2298431396484375, -0.22120285034179688, -0.21256256103515625, -0.20392227172851562, -0.195281982421875, -0.18664169311523438, -0.17800140380859375, -0.16936111450195312, -0.1607208251953125, -0.15208053588867188, -0.14344024658203125, -0.13479995727539062, -0.12615966796875, -0.11751937866210938, -0.10887908935546875, -0.10023880004882812, -0.0915985107421875, -0.08295822143554688, -0.07431793212890625, -0.06567764282226562, -0.057037353515625, -0.048397064208984375, -0.03975677490234375, -0.031116485595703125, -0.0224761962890625, -0.013835906982421875, -0.00519561767578125, 0.003444671630859375, 0.0120849609375, 0.020725250244140625, 0.02936553955078125, 0.038005828857421875, 0.0466461181640625, 0.055286407470703125, 0.06392669677734375, 0.07256698608398438, 0.081207275390625, 0.08984756469726562, 0.09848785400390625, 0.10712814331054688, 0.1157684326171875, 0.12440872192382812, 0.13304901123046875, 0.14168930053710938, 0.15032958984375, 0.15896987915039062, 0.16761016845703125, 0.17625045776367188, 0.1848907470703125, 0.19353103637695312, 0.20217132568359375, 0.21081161499023438, 0.219451904296875, 0.22809219360351562, 0.23673248291015625, 0.24537277221679688, 0.2540130615234375, 0.2626533508300781, 0.27129364013671875, 0.2799339294433594, 0.28857421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 12.0, 9.0, 19.0, 24.0, 40.0, 46.0, 102.0, 195.0, 217.0, 127.0, 77.0, 49.0, 28.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011241436004638672, -0.0001062583178281784, -0.00010010227560997009, -9.394623339176178e-05, -8.779019117355347e-05, -8.163414895534515e-05, -7.547810673713684e-05, -6.932206451892853e-05, -6.316602230072021e-05, -5.70099800825119e-05, -5.085393786430359e-05, -4.4697895646095276e-05, -3.854185342788696e-05, -3.238581120967865e-05, -2.6229768991470337e-05, -2.0073726773262024e-05, -1.3917684555053711e-05, -7.761642336845398e-06, -1.605600118637085e-06, 4.550442099571228e-06, 1.0706484317779541e-05, 1.6862526535987854e-05, 2.3018568754196167e-05, 2.917461097240448e-05, 3.533065319061279e-05, 4.1486695408821106e-05, 4.764273762702942e-05, 5.379877984523773e-05, 5.9954822063446045e-05, 6.611086428165436e-05, 7.226690649986267e-05, 7.842294871807098e-05, 8.45789909362793e-05, 9.073503315448761e-05, 9.689107537269592e-05, 0.00010304711759090424, 0.00010920315980911255, 0.00011535920202732086, 0.00012151524424552917, 0.0001276712864637375, 0.0001338273286819458, 0.00013998337090015411, 0.00014613941311836243, 0.00015229545533657074, 0.00015845149755477905, 0.00016460753977298737, 0.00017076358199119568, 0.000176919624209404, 0.0001830756664276123, 0.00018923170864582062, 0.00019538775086402893, 0.00020154379308223724, 0.00020769983530044556, 0.00021385587751865387, 0.00022001191973686218, 0.0002261679619550705, 0.0002323240041732788, 0.00023848004639148712, 0.00024463608860969543, 0.00025079213082790375, 0.00025694817304611206, 0.0002631042152643204, 0.0002692602574825287, 0.000275416299700737, 0.0002815723419189453]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 16.0, 16.0, 17.0, 33.0, 59.0, 71.0, 129.0, 263.0, 532.0, 1358.0, 5245.0, 29760.0, 398062.0, 565679.0, 38365.0, 6165.0, 1553.0, 537.0, 251.0, 130.0, 108.0, 43.0, 35.0, 31.0, 18.0, 11.0, 10.0, 11.0, 5.0, 5.0, 1.0, 7.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.2957305908203125, -0.285552978515625, -0.2753753662109375, -0.26519775390625, -0.2550201416015625, -0.244842529296875, -0.2346649169921875, -0.2244873046875, -0.2143096923828125, -0.204132080078125, -0.1939544677734375, -0.18377685546875, -0.1735992431640625, -0.163421630859375, -0.1532440185546875, -0.14306640625, -0.1328887939453125, -0.122711181640625, -0.1125335693359375, -0.10235595703125, -0.0921783447265625, -0.082000732421875, -0.0718231201171875, -0.0616455078125, -0.0514678955078125, -0.041290283203125, -0.0311126708984375, -0.02093505859375, -0.0107574462890625, -0.000579833984375, 0.0095977783203125, 0.019775390625, 0.0299530029296875, 0.040130615234375, 0.0503082275390625, 0.06048583984375, 0.0706634521484375, 0.080841064453125, 0.0910186767578125, 0.1011962890625, 0.1113739013671875, 0.121551513671875, 0.1317291259765625, 0.14190673828125, 0.1520843505859375, 0.162261962890625, 0.1724395751953125, 0.1826171875, 0.1927947998046875, 0.202972412109375, 0.2131500244140625, 0.22332763671875, 0.2335052490234375, 0.243682861328125, 0.2538604736328125, 0.2640380859375, 0.2742156982421875, 0.284393310546875, 0.2945709228515625, 0.30474853515625, 0.3149261474609375, 0.325103759765625, 0.3352813720703125, 0.345458984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 19.0, 29.0, 36.0, 36.0, 81.0, 95.0, 109.0, 114.0, 85.0, 85.0, 62.0, 48.0, 35.0, 21.0, 18.0, 15.0, 14.0, 12.0, 8.0, 2.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2567253112792969, -0.24929046630859375, -0.24185562133789062, -0.2344207763671875, -0.22698593139648438, -0.21955108642578125, -0.21211624145507812, -0.204681396484375, -0.19724655151367188, -0.18981170654296875, -0.18237686157226562, -0.1749420166015625, -0.16750717163085938, -0.16007232666015625, -0.15263748168945312, -0.14520263671875, -0.13776779174804688, -0.13033294677734375, -0.12289810180664062, -0.1154632568359375, -0.10802841186523438, -0.10059356689453125, -0.09315872192382812, -0.085723876953125, -0.07828903198242188, -0.07085418701171875, -0.06341934204101562, -0.0559844970703125, -0.048549652099609375, -0.04111480712890625, -0.033679962158203125, -0.0262451171875, -0.018810272216796875, -0.01137542724609375, -0.003940582275390625, 0.0034942626953125, 0.010929107666015625, 0.01836395263671875, 0.025798797607421875, 0.033233642578125, 0.040668487548828125, 0.04810333251953125, 0.055538177490234375, 0.0629730224609375, 0.07040786743164062, 0.07784271240234375, 0.08527755737304688, 0.09271240234375, 0.10014724731445312, 0.10758209228515625, 0.11501693725585938, 0.1224517822265625, 0.12988662719726562, 0.13732147216796875, 0.14475631713867188, 0.152191162109375, 0.15962600708007812, 0.16706085205078125, 0.17449569702148438, 0.1819305419921875, 0.18936538696289062, 0.19680023193359375, 0.20423507690429688, 0.211669921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 11.0, 31.0, 116.0, 354.0, 336.0, 118.0, 19.0, 15.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.554365158081055, -9.172805786132812, -8.791247367858887, -8.409687995910645, -8.028129577636719, -7.646570205688477, -7.265010833740234, -6.88345193862915, -6.501893043518066, -6.120334148406982, -5.738775253295898, -5.357215881347656, -4.975656986236572, -4.594098091125488, -4.212538719177246, -3.830979824066162, -3.449420928955078, -3.067862033843994, -2.686302900314331, -2.304743766784668, -1.923184871673584, -1.5416258573532104, -1.160066843032837, -0.7785077095031738, -0.39694881439208984, -0.015389800071716309, 0.3661692142486572, 0.7477282285690308, 1.1292872428894043, 1.5108462572097778, 1.8924052715301514, 2.2739644050598145, 2.6555233001708984, 3.0370821952819824, 3.4186413288116455, 3.8002004623413086, 4.181759357452393, 4.563318252563477, 4.944877624511719, 5.326436519622803, 5.707995414733887, 6.089554309844971, 6.471113204956055, 6.852672576904297, 7.234231472015381, 7.615790367126465, 7.997349739074707, 8.378908157348633, 8.760467529296875, 9.142026901245117, 9.523585319519043, 9.905144691467285, 10.286703109741211, 10.668262481689453, 11.049821853637695, 11.431381225585938, 11.812939643859863, 12.194499015808105, 12.576057434082031, 12.957616806030273, 13.339176177978516, 13.720734596252441, 14.102293968200684, 14.48385238647461, 14.865411758422852]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 6.0, 13.0, 5.0, 8.0, 17.0, 23.0, 20.0, 28.0, 29.0, 33.0, 43.0, 42.0, 47.0, 42.0, 43.0, 53.0, 56.0, 38.0, 40.0, 60.0, 35.0, 36.0, 40.0, 33.0, 40.0, 29.0, 29.0, 18.0, 16.0, 18.0, 12.0, 16.0, 4.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.960765838623047, -4.781157493591309, -4.60154914855957, -4.421940803527832, -4.242332458496094, -4.0627241134643555, -3.883115530014038, -3.7035071849823, -3.5238988399505615, -3.3442904949188232, -3.164682149887085, -2.9850735664367676, -2.8054652214050293, -2.625856876373291, -2.4462485313415527, -2.2666401863098145, -2.087031841278076, -1.907423496246338, -1.7278151512145996, -1.5482066869735718, -1.3685983419418335, -1.1889899969100952, -1.0093815326690674, -0.8297731876373291, -0.6501648426055908, -0.47055646777153015, -0.2909480929374695, -0.11133968830108643, 0.06826865673065186, 0.24787700176239014, 0.42748546600341797, 0.6070938110351562, 0.7867021560668945, 0.9663105010986328, 1.145918846130371, 1.325527310371399, 1.5051356554031372, 1.6847440004348755, 1.8643524646759033, 2.0439608097076416, 2.22356915473938, 2.403177499771118, 2.5827858448028564, 2.762394428253174, 2.942002773284912, 3.1216111183166504, 3.3012194633483887, 3.480827808380127, 3.6604361534118652, 3.8400444984436035, 4.019652843475342, 4.19926118850708, 4.378869533538818, 4.558477878570557, 4.738086700439453, 4.917695045471191, 5.09730339050293, 5.276911735534668, 5.456520080566406, 5.6361284255981445, 5.815736770629883, 5.995345115661621, 6.174953460693359, 6.354561805725098, 6.534170150756836]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 2.0, 6.0, 12.0, 10.0, 20.0, 23.0, 36.0, 43.0, 93.0, 137.0, 256.0, 438.0, 960.0, 2325.0, 6745.0, 26895.0, 429309.0, 3662089.0, 49056.0, 10031.0, 3214.0, 1208.0, 604.0, 288.0, 174.0, 109.0, 59.0, 43.0, 24.0, 22.0, 16.0, 5.0, 8.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0257110595703125, -0.994781494140625, -0.9638519287109375, -0.93292236328125, -0.9019927978515625, -0.871063232421875, -0.8401336669921875, -0.8092041015625, -0.7782745361328125, -0.747344970703125, -0.7164154052734375, -0.68548583984375, -0.6545562744140625, -0.623626708984375, -0.5926971435546875, -0.561767578125, -0.5308380126953125, -0.499908447265625, -0.4689788818359375, -0.43804931640625, -0.4071197509765625, -0.376190185546875, -0.3452606201171875, -0.3143310546875, -0.2834014892578125, -0.252471923828125, -0.2215423583984375, -0.19061279296875, -0.1596832275390625, -0.128753662109375, -0.0978240966796875, -0.06689453125, -0.0359649658203125, -0.005035400390625, 0.0258941650390625, 0.05682373046875, 0.0877532958984375, 0.118682861328125, 0.1496124267578125, 0.1805419921875, 0.2114715576171875, 0.242401123046875, 0.2733306884765625, 0.30426025390625, 0.3351898193359375, 0.366119384765625, 0.3970489501953125, 0.427978515625, 0.4589080810546875, 0.489837646484375, 0.5207672119140625, 0.55169677734375, 0.5826263427734375, 0.613555908203125, 0.6444854736328125, 0.6754150390625, 0.7063446044921875, 0.737274169921875, 0.7682037353515625, 0.79913330078125, 0.8300628662109375, 0.860992431640625, 0.8919219970703125, 0.9228515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 15.0, 19.0, 26.0, 38.0, 40.0, 50.0, 67.0, 70.0, 91.0, 81.0, 84.0, 83.0, 73.0, 58.0, 61.0, 40.0, 33.0, 24.0, 17.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.488037109375, -0.4754600524902344, -0.46288299560546875, -0.4503059387207031, -0.4377288818359375, -0.4251518249511719, -0.41257476806640625, -0.3999977111816406, -0.387420654296875, -0.3748435974121094, -0.36226654052734375, -0.3496894836425781, -0.3371124267578125, -0.3245353698730469, -0.31195831298828125, -0.2993812561035156, -0.28680419921875, -0.2742271423339844, -0.26165008544921875, -0.24907302856445312, -0.2364959716796875, -0.22391891479492188, -0.21134185791015625, -0.19876480102539062, -0.186187744140625, -0.17361068725585938, -0.16103363037109375, -0.14845657348632812, -0.1358795166015625, -0.12330245971679688, -0.11072540283203125, -0.09814834594726562, -0.0855712890625, -0.07299423217773438, -0.06041717529296875, -0.047840118408203125, -0.0352630615234375, -0.022686004638671875, -0.01010894775390625, 0.002468109130859375, 0.015045166015625, 0.027622222900390625, 0.04019927978515625, 0.052776336669921875, 0.0653533935546875, 0.07793045043945312, 0.09050750732421875, 0.10308456420898438, 0.11566162109375, 0.12823867797851562, 0.14081573486328125, 0.15339279174804688, 0.1659698486328125, 0.17854690551757812, 0.19112396240234375, 0.20370101928710938, 0.216278076171875, 0.22885513305664062, 0.24143218994140625, 0.2540092468261719, 0.2665863037109375, 0.2791633605957031, 0.29174041748046875, 0.3043174743652344, 0.31689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 16.0, 24.0, 45.0, 101.0, 207.0, 524.0, 1814.0, 6868.0, 39653.0, 3283027.0, 826250.0, 28073.0, 5415.0, 1460.0, 474.0, 147.0, 72.0, 39.0, 25.0, 14.0, 6.0, 6.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0], "bins": [-1.314453125, -1.285186767578125, -1.25592041015625, -1.226654052734375, -1.1973876953125, -1.168121337890625, -1.13885498046875, -1.109588623046875, -1.080322265625, -1.051055908203125, -1.02178955078125, -0.992523193359375, -0.9632568359375, -0.933990478515625, -0.90472412109375, -0.875457763671875, -0.84619140625, -0.816925048828125, -0.78765869140625, -0.758392333984375, -0.7291259765625, -0.699859619140625, -0.67059326171875, -0.641326904296875, -0.612060546875, -0.582794189453125, -0.55352783203125, -0.524261474609375, -0.4949951171875, -0.465728759765625, -0.43646240234375, -0.407196044921875, -0.3779296875, -0.348663330078125, -0.31939697265625, -0.290130615234375, -0.2608642578125, -0.231597900390625, -0.20233154296875, -0.173065185546875, -0.143798828125, -0.114532470703125, -0.08526611328125, -0.055999755859375, -0.0267333984375, 0.002532958984375, 0.03179931640625, 0.061065673828125, 0.09033203125, 0.119598388671875, 0.14886474609375, 0.178131103515625, 0.2073974609375, 0.236663818359375, 0.26593017578125, 0.295196533203125, 0.324462890625, 0.353729248046875, 0.38299560546875, 0.412261962890625, 0.4415283203125, 0.470794677734375, 0.50006103515625, 0.529327392578125, 0.55859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 13.0, 15.0, 23.0, 59.0, 84.0, 229.0, 926.0, 2060.0, 336.0, 112.0, 69.0, 39.0, 20.0, 12.0, 8.0, 16.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430419921875, -0.4191627502441406, -0.40790557861328125, -0.3966484069824219, -0.3853912353515625, -0.3741340637207031, -0.36287689208984375, -0.3516197204589844, -0.340362548828125, -0.3291053771972656, -0.31784820556640625, -0.3065910339355469, -0.2953338623046875, -0.2840766906738281, -0.27281951904296875, -0.2615623474121094, -0.25030517578125, -0.23904800415039062, -0.22779083251953125, -0.21653366088867188, -0.2052764892578125, -0.19401931762695312, -0.18276214599609375, -0.17150497436523438, -0.160247802734375, -0.14899063110351562, -0.13773345947265625, -0.12647628784179688, -0.1152191162109375, -0.10396194458007812, -0.09270477294921875, -0.08144760131835938, -0.0701904296875, -0.058933258056640625, -0.04767608642578125, -0.036418914794921875, -0.0251617431640625, -0.013904571533203125, -0.00264739990234375, 0.008609771728515625, 0.019866943359375, 0.031124114990234375, 0.04238128662109375, 0.053638458251953125, 0.0648956298828125, 0.07615280151367188, 0.08740997314453125, 0.09866714477539062, 0.10992431640625, 0.12118148803710938, 0.13243865966796875, 0.14369583129882812, 0.1549530029296875, 0.16621017456054688, 0.17746734619140625, 0.18872451782226562, 0.199981689453125, 0.21123886108398438, 0.22249603271484375, 0.23375320434570312, 0.2450103759765625, 0.2562675476074219, 0.26752471923828125, 0.2787818908691406, 0.2900390625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 9.0, 36.0, 187.0, 437.0, 275.0, 52.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.744811058044434, -5.624825954437256, -5.504840850830078, -5.3848557472229, -5.264870643615723, -5.144885063171387, -5.024900436401367, -4.904914855957031, -4.7849297523498535, -4.664944648742676, -4.544959545135498, -4.42497444152832, -4.304989337921143, -4.185004234313965, -4.065018653869629, -3.9450337886810303, -3.8250486850738525, -3.705063581466675, -3.585078477859497, -3.4650931358337402, -3.3451080322265625, -3.2251229286193848, -3.105137825012207, -2.9851527214050293, -2.8651676177978516, -2.745182514190674, -2.625197410583496, -2.5052123069763184, -2.3852269649505615, -2.265241861343384, -2.145256757736206, -2.0252716541290283, -1.9052865505218506, -1.7853014469146729, -1.6653162240982056, -1.5453311204910278, -1.4253458976745605, -1.3053607940673828, -1.185375690460205, -1.0653905868530273, -0.9454053640365601, -0.8254202008247375, -0.705435037612915, -0.5854499340057373, -0.4654647707939148, -0.3454796075820923, -0.22549450397491455, -0.10550934076309204, 0.014475822448730469, 0.13446097075939178, 0.2544461190700531, 0.3744312524795532, 0.49441641569137573, 0.6144015789031982, 0.734386682510376, 0.8543718457221985, 0.974357008934021, 1.0943421125411987, 1.214327335357666, 1.3343124389648438, 1.4542975425720215, 1.5742827653884888, 1.6942678689956665, 1.8142530918121338, 1.9342381954193115]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 9.0, 16.0, 23.0, 31.0, 33.0, 65.0, 58.0, 59.0, 75.0, 74.0, 79.0, 75.0, 70.0, 62.0, 46.0, 63.0, 38.0, 31.0, 29.0, 22.0, 15.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7874689102172852, -1.7381811141967773, -1.6888933181762695, -1.6396055221557617, -1.590317726135254, -1.5410298109054565, -1.4917420148849487, -1.442454218864441, -1.393166422843933, -1.3438786268234253, -1.2945908308029175, -1.2453030347824097, -1.1960151195526123, -1.1467273235321045, -1.0974395275115967, -1.0481517314910889, -0.998863935470581, -0.9495761394500732, -0.9002883434295654, -0.8510004878044128, -0.801712691783905, -0.7524248957633972, -0.7031370401382446, -0.6538492441177368, -0.604561448097229, -0.5552736520767212, -0.5059858560562134, -0.4566980004310608, -0.407410204410553, -0.35812240839004517, -0.30883458256721497, -0.25954675674438477, -0.2102588415145874, -0.1609710305929184, -0.11168321967124939, -0.06239540874958038, -0.013107597827911377, 0.03618021309375763, 0.08546802401542664, 0.13475584983825684, 0.18404364585876465, 0.23333145678043365, 0.28261926770210266, 0.33190709352493286, 0.3811948895454407, 0.4304826855659485, 0.4797705113887787, 0.5290583372116089, 0.5783461332321167, 0.6276339292526245, 0.6769217252731323, 0.7262095808982849, 0.7754973769187927, 0.8247851729393005, 0.8740730285644531, 0.9233608245849609, 0.9726486206054688, 1.0219364166259766, 1.0712242126464844, 1.1205120086669922, 1.1697998046875, 1.2190877199172974, 1.2683755159378052, 1.317663311958313, 1.3669511079788208]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 13.0, 15.0, 20.0, 52.0, 61.0, 115.0, 182.0, 296.0, 541.0, 1180.0, 3083.0, 11036.0, 55358.0, 389803.0, 493259.0, 73391.0, 13608.0, 3757.0, 1316.0, 613.0, 349.0, 191.0, 105.0, 73.0, 54.0, 24.0, 10.0, 12.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.109375, -1.0794525146484375, -1.049530029296875, -1.0196075439453125, -0.98968505859375, -0.9597625732421875, -0.929840087890625, -0.8999176025390625, -0.8699951171875, -0.8400726318359375, -0.810150146484375, -0.7802276611328125, -0.75030517578125, -0.7203826904296875, -0.690460205078125, -0.6605377197265625, -0.630615234375, -0.6006927490234375, -0.570770263671875, -0.5408477783203125, -0.51092529296875, -0.4810028076171875, -0.451080322265625, -0.4211578369140625, -0.3912353515625, -0.3613128662109375, -0.331390380859375, -0.3014678955078125, -0.27154541015625, -0.2416229248046875, -0.211700439453125, -0.1817779541015625, -0.15185546875, -0.1219329833984375, -0.092010498046875, -0.0620880126953125, -0.03216552734375, -0.0022430419921875, 0.027679443359375, 0.0576019287109375, 0.0875244140625, 0.1174468994140625, 0.147369384765625, 0.1772918701171875, 0.20721435546875, 0.2371368408203125, 0.267059326171875, 0.2969818115234375, 0.326904296875, 0.3568267822265625, 0.386749267578125, 0.4166717529296875, 0.44659423828125, 0.4765167236328125, 0.506439208984375, 0.5363616943359375, 0.5662841796875, 0.5962066650390625, 0.626129150390625, 0.6560516357421875, 0.68597412109375, 0.7158966064453125, 0.745819091796875, 0.7757415771484375, 0.8056640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 17.0, 21.0, 36.0, 40.0, 45.0, 56.0, 74.0, 81.0, 78.0, 81.0, 91.0, 75.0, 71.0, 53.0, 52.0, 41.0, 23.0, 18.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.468994140625, -0.4567413330078125, -0.444488525390625, -0.4322357177734375, -0.41998291015625, -0.4077301025390625, -0.395477294921875, -0.3832244873046875, -0.3709716796875, -0.3587188720703125, -0.346466064453125, -0.3342132568359375, -0.32196044921875, -0.3097076416015625, -0.297454833984375, -0.2852020263671875, -0.27294921875, -0.2606964111328125, -0.248443603515625, -0.2361907958984375, -0.22393798828125, -0.2116851806640625, -0.199432373046875, -0.1871795654296875, -0.1749267578125, -0.1626739501953125, -0.150421142578125, -0.1381683349609375, -0.12591552734375, -0.1136627197265625, -0.101409912109375, -0.0891571044921875, -0.076904296875, -0.0646514892578125, -0.052398681640625, -0.0401458740234375, -0.02789306640625, -0.0156402587890625, -0.003387451171875, 0.0088653564453125, 0.0211181640625, 0.0333709716796875, 0.045623779296875, 0.0578765869140625, 0.07012939453125, 0.0823822021484375, 0.094635009765625, 0.1068878173828125, 0.119140625, 0.1313934326171875, 0.143646240234375, 0.1558990478515625, 0.16815185546875, 0.1804046630859375, 0.192657470703125, 0.2049102783203125, 0.2171630859375, 0.2294158935546875, 0.241668701171875, 0.2539215087890625, 0.26617431640625, 0.2784271240234375, 0.290679931640625, 0.3029327392578125, 0.315185546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 6.0, 6.0, 6.0, 8.0, 11.0, 12.0, 19.0, 28.0, 24.0, 31.0, 37.0, 51.0, 52.0, 65.0, 89.0, 145.0, 249.0, 468.0, 1102.0, 3297.0, 11749.0, 57327.0, 372024.0, 498811.0, 80570.0, 15593.0, 3933.0, 1337.0, 566.0, 270.0, 165.0, 93.0, 92.0, 48.0, 64.0, 51.0, 21.0, 30.0, 22.0, 25.0, 13.0, 10.0, 7.0, 8.0, 7.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7802734375, -0.7551803588867188, -0.7300872802734375, -0.7049942016601562, -0.679901123046875, -0.6548080444335938, -0.6297149658203125, -0.6046218872070312, -0.57952880859375, -0.5544357299804688, -0.5293426513671875, -0.5042495727539062, -0.479156494140625, -0.45406341552734375, -0.4289703369140625, -0.40387725830078125, -0.3787841796875, -0.35369110107421875, -0.3285980224609375, -0.30350494384765625, -0.278411865234375, -0.25331878662109375, -0.2282257080078125, -0.20313262939453125, -0.17803955078125, -0.15294647216796875, -0.1278533935546875, -0.10276031494140625, -0.077667236328125, -0.05257415771484375, -0.0274810791015625, -0.00238800048828125, 0.022705078125, 0.04779815673828125, 0.0728912353515625, 0.09798431396484375, 0.123077392578125, 0.14817047119140625, 0.1732635498046875, 0.19835662841796875, 0.22344970703125, 0.24854278564453125, 0.2736358642578125, 0.29872894287109375, 0.323822021484375, 0.34891510009765625, 0.3740081787109375, 0.39910125732421875, 0.4241943359375, 0.44928741455078125, 0.4743804931640625, 0.49947357177734375, 0.524566650390625, 0.5496597290039062, 0.5747528076171875, 0.5998458862304688, 0.62493896484375, 0.6500320434570312, 0.6751251220703125, 0.7002182006835938, 0.725311279296875, 0.7504043579101562, 0.7754974365234375, 0.8005905151367188, 0.82568359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 4.0, 10.0, 8.0, 10.0, 14.0, 19.0, 26.0, 23.0, 32.0, 32.0, 33.0, 38.0, 49.0, 46.0, 57.0, 52.0, 52.0, 56.0, 46.0, 43.0, 38.0, 50.0, 45.0, 29.0, 30.0, 29.0, 19.0, 22.0, 16.0, 7.0, 4.0, 14.0, 4.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.044921875, -1.0123748779296875, -0.979827880859375, -0.9472808837890625, -0.91473388671875, -0.8821868896484375, -0.849639892578125, -0.8170928955078125, -0.7845458984375, -0.7519989013671875, -0.719451904296875, -0.6869049072265625, -0.65435791015625, -0.6218109130859375, -0.589263916015625, -0.5567169189453125, -0.524169921875, -0.4916229248046875, -0.459075927734375, -0.4265289306640625, -0.39398193359375, -0.3614349365234375, -0.328887939453125, -0.2963409423828125, -0.2637939453125, -0.2312469482421875, -0.198699951171875, -0.1661529541015625, -0.13360595703125, -0.1010589599609375, -0.068511962890625, -0.0359649658203125, -0.00341796875, 0.0291290283203125, 0.061676025390625, 0.0942230224609375, 0.12677001953125, 0.1593170166015625, 0.191864013671875, 0.2244110107421875, 0.2569580078125, 0.2895050048828125, 0.322052001953125, 0.3545989990234375, 0.38714599609375, 0.4196929931640625, 0.452239990234375, 0.4847869873046875, 0.517333984375, 0.5498809814453125, 0.582427978515625, 0.6149749755859375, 0.64752197265625, 0.6800689697265625, 0.712615966796875, 0.7451629638671875, 0.7777099609375, 0.8102569580078125, 0.842803955078125, 0.8753509521484375, 0.90789794921875, 0.9404449462890625, 0.972991943359375, 1.0055389404296875, 1.0380859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 8.0, 12.0, 25.0, 40.0, 50.0, 102.0, 195.0, 425.0, 1070.0, 3170.0, 13030.0, 84927.0, 734571.0, 180604.0, 22664.0, 4976.0, 1463.0, 569.0, 279.0, 147.0, 86.0, 49.0, 27.0, 16.0, 8.0, 7.0, 9.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.35107421875, -0.3417530059814453, -0.3324317932128906, -0.32311058044433594, -0.31378936767578125, -0.30446815490722656, -0.2951469421386719, -0.2858257293701172, -0.2765045166015625, -0.2671833038330078, -0.2578620910644531, -0.24854087829589844, -0.23921966552734375, -0.22989845275878906, -0.22057723999023438, -0.2112560272216797, -0.201934814453125, -0.1926136016845703, -0.18329238891601562, -0.17397117614746094, -0.16464996337890625, -0.15532875061035156, -0.14600753784179688, -0.1366863250732422, -0.1273651123046875, -0.11804389953613281, -0.10872268676757812, -0.09940147399902344, -0.09008026123046875, -0.08075904846191406, -0.07143783569335938, -0.06211662292480469, -0.05279541015625, -0.04347419738769531, -0.034152984619140625, -0.024831771850585938, -0.01551055908203125, -0.0061893463134765625, 0.003131866455078125, 0.012453079223632812, 0.0217742919921875, 0.031095504760742188, 0.040416717529296875, 0.04973793029785156, 0.05905914306640625, 0.06838035583496094, 0.07770156860351562, 0.08702278137207031, 0.096343994140625, 0.10566520690917969, 0.11498641967773438, 0.12430763244628906, 0.13362884521484375, 0.14295005798339844, 0.15227127075195312, 0.1615924835205078, 0.1709136962890625, 0.1802349090576172, 0.18955612182617188, 0.19887733459472656, 0.20819854736328125, 0.21751976013183594, 0.22684097290039062, 0.2361621856689453, 0.2454833984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 8.0, 6.0, 10.0, 14.0, 15.0, 13.0, 30.0, 37.0, 59.0, 118.0, 126.0, 158.0, 136.0, 68.0, 40.0, 27.0, 27.0, 13.0, 25.0, 8.0, 12.0, 2.0, 11.0, 8.0, 8.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011966470628976822, -0.00011582858860492706, -0.00011199247092008591, -0.00010815635323524475, -0.0001043202355504036, -0.00010048411786556244, -9.664800018072128e-05, -9.281188249588013e-05, -8.897576481103897e-05, -8.513964712619781e-05, -8.130352944135666e-05, -7.74674117565155e-05, -7.363129407167435e-05, -6.979517638683319e-05, -6.595905870199203e-05, -6.212294101715088e-05, -5.828682333230972e-05, -5.445070564746857e-05, -5.061458796262741e-05, -4.6778470277786255e-05, -4.29423525929451e-05, -3.910623490810394e-05, -3.527011722326279e-05, -3.143399953842163e-05, -2.7597881853580475e-05, -2.376176416873932e-05, -1.9925646483898163e-05, -1.6089528799057007e-05, -1.225341111421585e-05, -8.417293429374695e-06, -4.581175744533539e-06, -7.450580596923828e-07, 3.091059625148773e-06, 6.927177309989929e-06, 1.0763294994831085e-05, 1.4599412679672241e-05, 1.8435530364513397e-05, 2.2271648049354553e-05, 2.610776573419571e-05, 2.9943883419036865e-05, 3.378000110387802e-05, 3.761611878871918e-05, 4.145223647356033e-05, 4.528835415840149e-05, 4.9124471843242645e-05, 5.29605895280838e-05, 5.679670721292496e-05, 6.063282489776611e-05, 6.446894258260727e-05, 6.830506026744843e-05, 7.214117795228958e-05, 7.597729563713074e-05, 7.98134133219719e-05, 8.364953100681305e-05, 8.74856486916542e-05, 9.132176637649536e-05, 9.515788406133652e-05, 9.899400174617767e-05, 0.00010283011943101883, 0.00010666623711585999, 0.00011050235480070114, 0.0001143384724855423, 0.00011817459017038345, 0.00012201070785522461]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 9.0, 10.0, 10.0, 6.0, 25.0, 21.0, 45.0, 58.0, 87.0, 192.0, 550.0, 2452.0, 26021.0, 874809.0, 135892.0, 6673.0, 1065.0, 283.0, 136.0, 61.0, 54.0, 45.0, 20.0, 12.0, 11.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.578125, -0.5614814758300781, -0.5448379516601562, -0.5281944274902344, -0.5115509033203125, -0.4949073791503906, -0.47826385498046875, -0.4616203308105469, -0.444976806640625, -0.4283332824707031, -0.41168975830078125, -0.3950462341308594, -0.3784027099609375, -0.3617591857910156, -0.34511566162109375, -0.3284721374511719, -0.31182861328125, -0.2951850891113281, -0.27854156494140625, -0.2618980407714844, -0.2452545166015625, -0.22861099243164062, -0.21196746826171875, -0.19532394409179688, -0.178680419921875, -0.16203689575195312, -0.14539337158203125, -0.12874984741210938, -0.1121063232421875, -0.09546279907226562, -0.07881927490234375, -0.062175750732421875, -0.0455322265625, -0.028888702392578125, -0.01224517822265625, 0.004398345947265625, 0.0210418701171875, 0.037685394287109375, 0.05432891845703125, 0.07097244262695312, 0.087615966796875, 0.10425949096679688, 0.12090301513671875, 0.13754653930664062, 0.1541900634765625, 0.17083358764648438, 0.18747711181640625, 0.20412063598632812, 0.22076416015625, 0.23740768432617188, 0.25405120849609375, 0.2706947326660156, 0.2873382568359375, 0.3039817810058594, 0.32062530517578125, 0.3372688293457031, 0.353912353515625, 0.3705558776855469, 0.38719940185546875, 0.4038429260253906, 0.4204864501953125, 0.4371299743652344, 0.45377349853515625, 0.4704170227050781, 0.487060546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 10.0, 16.0, 27.0, 43.0, 87.0, 134.0, 207.0, 197.0, 106.0, 64.0, 42.0, 24.0, 16.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19677734375, -0.18143463134765625, -0.1660919189453125, -0.15074920654296875, -0.135406494140625, -0.12006378173828125, -0.1047210693359375, -0.08937835693359375, -0.07403564453125, -0.05869293212890625, -0.0433502197265625, -0.02800750732421875, -0.012664794921875, 0.00267791748046875, 0.0180206298828125, 0.03336334228515625, 0.0487060546875, 0.06404876708984375, 0.0793914794921875, 0.09473419189453125, 0.110076904296875, 0.12541961669921875, 0.1407623291015625, 0.15610504150390625, 0.17144775390625, 0.18679046630859375, 0.2021331787109375, 0.21747589111328125, 0.232818603515625, 0.24816131591796875, 0.2635040283203125, 0.27884674072265625, 0.294189453125, 0.30953216552734375, 0.3248748779296875, 0.34021759033203125, 0.355560302734375, 0.37090301513671875, 0.3862457275390625, 0.40158843994140625, 0.41693115234375, 0.43227386474609375, 0.4476165771484375, 0.46295928955078125, 0.478302001953125, 0.49364471435546875, 0.5089874267578125, 0.5243301391601562, 0.5396728515625, 0.5550155639648438, 0.5703582763671875, 0.5857009887695312, 0.601043701171875, 0.6163864135742188, 0.6317291259765625, 0.6470718383789062, 0.66241455078125, 0.6777572631835938, 0.6930999755859375, 0.7084426879882812, 0.723785400390625, 0.7391281127929688, 0.7544708251953125, 0.7698135375976562, 0.78515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 19.0, 43.0, 120.0, 212.0, 255.0, 183.0, 96.0, 44.0, 20.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625969886779785, -4.4003801345825195, -4.174789905548096, -3.94920015335083, -3.7236099243164062, -3.4980201721191406, -3.272430181503296, -3.046840190887451, -2.8212502002716064, -2.5956602096557617, -2.370070219039917, -2.1444802284240723, -1.918890357017517, -1.6933003664016724, -1.4677104949951172, -1.2421205043792725, -1.0165305137634277, -0.790940523147583, -0.5653505921363831, -0.3397606611251831, -0.11417067050933838, 0.11141932010650635, 0.3370091915130615, 0.5625991821289062, 0.788189172744751, 1.0137791633605957, 1.2393691539764404, 1.4649590253829956, 1.6905490159988403, 1.916139006614685, 2.1417288780212402, 2.367318868637085, 2.5929088592529297, 2.8184988498687744, 3.044088840484619, 3.2696785926818848, 3.4952688217163086, 3.720858573913574, 3.946448564529419, 4.172038555145264, 4.3976287841796875, 4.623218536376953, 4.848808765411377, 5.074398517608643, 5.299988746643066, 5.525578498840332, 5.751168251037598, 5.9767584800720215, 6.202348232269287, 6.427937984466553, 6.653528213500977, 6.879117965698242, 7.104708194732666, 7.330297946929932, 7.5558881759643555, 7.781477928161621, 8.007067680358887, 8.232657432556152, 8.458247184753418, 8.683837890625, 8.909427642822266, 9.135017395019531, 9.360607147216797, 9.586196899414062, 9.811787605285645]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 4.0, 5.0, 12.0, 8.0, 14.0, 16.0, 17.0, 21.0, 25.0, 28.0, 22.0, 23.0, 28.0, 27.0, 30.0, 43.0, 42.0, 45.0, 47.0, 42.0, 38.0, 42.0, 43.0, 36.0, 32.0, 31.0, 35.0, 41.0, 28.0, 31.0, 19.0, 18.0, 7.0, 19.0, 11.0, 13.0, 10.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.008632659912109, -3.873178005218506, -3.7377235889434814, -3.602268934249878, -3.4668145179748535, -3.33135986328125, -3.1959052085876465, -3.060450553894043, -2.9249961376190186, -2.789541482925415, -2.6540870666503906, -2.518632411956787, -2.3831777572631836, -2.247723340988159, -2.1122686862945557, -1.9768141508102417, -1.8413596153259277, -1.7059050798416138, -1.5704505443572998, -1.4349958896636963, -1.2995413541793823, -1.1640868186950684, -1.0286321640014648, -0.8931776285171509, -0.7577230930328369, -0.622268557548523, -0.4868139624595642, -0.35135939717292786, -0.2159048318862915, -0.08045029640197754, 0.0550042986869812, 0.19045889377593994, 0.3259134292602539, 0.46136799454689026, 0.5968225598335266, 0.7322771549224854, 0.8677316904067993, 1.0031862258911133, 1.1386408805847168, 1.2740954160690308, 1.4095499515533447, 1.5450044870376587, 1.6804590225219727, 1.8159136772155762, 1.9513682126998901, 2.086822748184204, 2.2222774028778076, 2.357731819152832, 2.4931864738464355, 2.628641128540039, 2.7640955448150635, 2.899550199508667, 3.0350046157836914, 3.170459270477295, 3.3059139251708984, 3.441368579864502, 3.5768229961395264, 3.71227765083313, 3.8477320671081543, 3.983186721801758, 4.118641376495361, 4.254096031188965, 4.38955020904541, 4.525004863739014, 4.660459518432617]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 3.0, 11.0, 9.0, 11.0, 20.0, 31.0, 44.0, 71.0, 110.0, 174.0, 290.0, 587.0, 1297.0, 3267.0, 10032.0, 49869.0, 3666985.0, 422226.0, 27793.0, 6938.0, 2337.0, 968.0, 475.0, 251.0, 168.0, 103.0, 78.0, 47.0, 28.0, 13.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3818359375, -1.3421783447265625, -1.302520751953125, -1.2628631591796875, -1.22320556640625, -1.1835479736328125, -1.143890380859375, -1.1042327880859375, -1.0645751953125, -1.0249176025390625, -0.985260009765625, -0.9456024169921875, -0.90594482421875, -0.8662872314453125, -0.826629638671875, -0.7869720458984375, -0.747314453125, -0.7076568603515625, -0.667999267578125, -0.6283416748046875, -0.58868408203125, -0.5490264892578125, -0.509368896484375, -0.4697113037109375, -0.4300537109375, -0.3903961181640625, -0.350738525390625, -0.3110809326171875, -0.27142333984375, -0.2317657470703125, -0.192108154296875, -0.1524505615234375, -0.11279296875, -0.0731353759765625, -0.033477783203125, 0.0061798095703125, 0.04583740234375, 0.0854949951171875, 0.125152587890625, 0.1648101806640625, 0.2044677734375, 0.2441253662109375, 0.283782958984375, 0.3234405517578125, 0.36309814453125, 0.4027557373046875, 0.442413330078125, 0.4820709228515625, 0.521728515625, 0.5613861083984375, 0.601043701171875, 0.6407012939453125, 0.68035888671875, 0.7200164794921875, 0.759674072265625, 0.7993316650390625, 0.8389892578125, 0.8786468505859375, 0.918304443359375, 0.9579620361328125, 0.99761962890625, 1.0372772216796875, 1.076934814453125, 1.1165924072265625, 1.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 8.0, 3.0, 5.0, 13.0, 13.0, 26.0, 31.0, 45.0, 50.0, 48.0, 74.0, 90.0, 66.0, 68.0, 76.0, 78.0, 70.0, 68.0, 46.0, 45.0, 23.0, 25.0, 15.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4735450744628906, -0.46051788330078125, -0.4474906921386719, -0.4344635009765625, -0.4214363098144531, -0.40840911865234375, -0.3953819274902344, -0.382354736328125, -0.3693275451660156, -0.35630035400390625, -0.3432731628417969, -0.3302459716796875, -0.3172187805175781, -0.30419158935546875, -0.2911643981933594, -0.27813720703125, -0.2651100158691406, -0.25208282470703125, -0.23905563354492188, -0.2260284423828125, -0.21300125122070312, -0.19997406005859375, -0.18694686889648438, -0.173919677734375, -0.16089248657226562, -0.14786529541015625, -0.13483810424804688, -0.1218109130859375, -0.10878372192382812, -0.09575653076171875, -0.08272933959960938, -0.0697021484375, -0.056674957275390625, -0.04364776611328125, -0.030620574951171875, -0.0175933837890625, -0.004566192626953125, 0.00846099853515625, 0.021488189697265625, 0.034515380859375, 0.047542572021484375, 0.06056976318359375, 0.07359695434570312, 0.0866241455078125, 0.09965133666992188, 0.11267852783203125, 0.12570571899414062, 0.13873291015625, 0.15176010131835938, 0.16478729248046875, 0.17781448364257812, 0.1908416748046875, 0.20386886596679688, 0.21689605712890625, 0.22992324829101562, 0.242950439453125, 0.2559776306152344, 0.26900482177734375, 0.2820320129394531, 0.2950592041015625, 0.3080863952636719, 0.32111358642578125, 0.3341407775878906, 0.34716796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 24.0, 62.0, 148.0, 348.0, 1038.0, 3763.0, 22734.0, 2162847.0, 1974805.0, 22810.0, 3964.0, 1070.0, 364.0, 157.0, 64.0, 32.0, 12.0, 12.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.3892364501953125, -1.342926025390625, -1.2966156005859375, -1.25030517578125, -1.2039947509765625, -1.157684326171875, -1.1113739013671875, -1.0650634765625, -1.0187530517578125, -0.972442626953125, -0.9261322021484375, -0.87982177734375, -0.8335113525390625, -0.787200927734375, -0.7408905029296875, -0.694580078125, -0.6482696533203125, -0.601959228515625, -0.5556488037109375, -0.50933837890625, -0.4630279541015625, -0.416717529296875, -0.3704071044921875, -0.3240966796875, -0.2777862548828125, -0.231475830078125, -0.1851654052734375, -0.13885498046875, -0.0925445556640625, -0.046234130859375, 7.62939453125e-05, 0.04638671875, 0.0926971435546875, 0.139007568359375, 0.1853179931640625, 0.23162841796875, 0.2779388427734375, 0.324249267578125, 0.3705596923828125, 0.4168701171875, 0.4631805419921875, 0.509490966796875, 0.5558013916015625, 0.60211181640625, 0.6484222412109375, 0.694732666015625, 0.7410430908203125, 0.787353515625, 0.8336639404296875, 0.879974365234375, 0.9262847900390625, 0.97259521484375, 1.0189056396484375, 1.065216064453125, 1.1115264892578125, 1.1578369140625, 1.2041473388671875, 1.250457763671875, 1.2967681884765625, 1.34307861328125, 1.3893890380859375, 1.435699462890625, 1.4820098876953125, 1.5283203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 12.0, 14.0, 9.0, 22.0, 32.0, 63.0, 118.0, 302.0, 2092.0, 923.0, 211.0, 80.0, 50.0, 37.0, 24.0, 17.0, 10.0, 7.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3720703125, -0.3591728210449219, -0.34627532958984375, -0.3333778381347656, -0.3204803466796875, -0.3075828552246094, -0.29468536376953125, -0.2817878723144531, -0.268890380859375, -0.2559928894042969, -0.24309539794921875, -0.23019790649414062, -0.2173004150390625, -0.20440292358398438, -0.19150543212890625, -0.17860794067382812, -0.16571044921875, -0.15281295776367188, -0.13991546630859375, -0.12701797485351562, -0.1141204833984375, -0.10122299194335938, -0.08832550048828125, -0.07542800903320312, -0.062530517578125, -0.049633026123046875, -0.03673553466796875, -0.023838043212890625, -0.0109405517578125, 0.001956939697265625, 0.01485443115234375, 0.027751922607421875, 0.0406494140625, 0.053546905517578125, 0.06644439697265625, 0.07934188842773438, 0.0922393798828125, 0.10513687133789062, 0.11803436279296875, 0.13093185424804688, 0.143829345703125, 0.15672683715820312, 0.16962432861328125, 0.18252182006835938, 0.1954193115234375, 0.20831680297851562, 0.22121429443359375, 0.23411178588867188, 0.24700927734375, 0.2599067687988281, 0.27280426025390625, 0.2857017517089844, 0.2985992431640625, 0.3114967346191406, 0.32439422607421875, 0.3372917175292969, 0.350189208984375, 0.3630867004394531, 0.37598419189453125, 0.3888816833496094, 0.4017791748046875, 0.4146766662597656, 0.42757415771484375, 0.4404716491699219, 0.453369140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 36.0, 244.0, 520.0, 166.0, 28.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.623776435852051, -5.450555801391602, -5.2773356437683105, -5.1041154861450195, -4.93089485168457, -4.757674217224121, -4.58445405960083, -4.411233901977539, -4.23801326751709, -4.064792633056641, -3.8915724754333496, -3.7183520793914795, -3.5451316833496094, -3.3719112873077393, -3.198690891265869, -3.025470495223999, -2.852250099182129, -2.679029703140259, -2.5058093070983887, -2.3325889110565186, -2.1593685150146484, -1.9861481189727783, -1.8129277229309082, -1.639707326889038, -1.466486930847168, -1.2932665348052979, -1.1200461387634277, -0.9468257427215576, -0.7736053466796875, -0.6003849506378174, -0.42716455459594727, -0.25394415855407715, -0.08072376251220703, 0.09249663352966309, 0.2657170295715332, 0.4389374256134033, 0.6121578216552734, 0.7853782176971436, 0.9585986137390137, 1.1318190097808838, 1.305039405822754, 1.478259801864624, 1.6514801979064941, 1.8247005939483643, 1.9979209899902344, 2.1711413860321045, 2.3443617820739746, 2.5175821781158447, 2.690802574157715, 2.864022970199585, 3.037243366241455, 3.210463762283325, 3.3836841583251953, 3.5569045543670654, 3.7301249504089355, 3.9033453464508057, 4.076565742492676, 4.249786376953125, 4.423006534576416, 4.596226692199707, 4.769447326660156, 4.9426679611206055, 5.1158881187438965, 5.2891082763671875, 5.462328910827637]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 9.0, 14.0, 13.0, 14.0, 24.0, 22.0, 26.0, 32.0, 44.0, 57.0, 42.0, 58.0, 39.0, 61.0, 65.0, 68.0, 60.0, 55.0, 37.0, 48.0, 43.0, 40.0, 33.0, 26.0, 16.0, 13.0, 15.0, 10.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7152187824249268, -1.6714156866073608, -1.6276124715805054, -1.5838093757629395, -1.5400062799453735, -1.4962031841278076, -1.4523999691009521, -1.4085968732833862, -1.3647937774658203, -1.3209906816482544, -1.277187466621399, -1.233384370803833, -1.189581274986267, -1.1457781791687012, -1.1019749641418457, -1.0581718683242798, -1.0143686532974243, -0.9705654978752136, -0.9267624020576477, -0.882959246635437, -0.8391561508178711, -0.7953529953956604, -0.7515498399734497, -0.7077467441558838, -0.6639435887336731, -0.6201404333114624, -0.5763373374938965, -0.5325341820716858, -0.4887310564517975, -0.4449279308319092, -0.4011247754096985, -0.3573216497898102, -0.3135184049606323, -0.269715279340744, -0.22591213881969452, -0.18210899829864502, -0.1383058726787567, -0.09450274705886841, -0.050699591636657715, -0.006896466016769409, 0.036906659603118896, 0.0807097926735878, 0.1245129257440567, 0.1683160662651062, 0.2121191918849945, 0.2559223175048828, 0.2997254729270935, 0.3435285985469818, 0.3873317241668701, 0.4311348497867584, 0.47493797540664673, 0.5187411308288574, 0.5625442266464233, 0.606347382068634, 0.6501505374908447, 0.6939536333084106, 0.7377567887306213, 0.781559944152832, 0.825363039970398, 0.8691661953926086, 0.9129693508148193, 0.9567724466323853, 1.0005755424499512, 1.0443787574768066, 1.0881818532943726]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 14.0, 19.0, 18.0, 35.0, 56.0, 106.0, 168.0, 243.0, 483.0, 895.0, 2107.0, 6063.0, 20354.0, 88257.0, 407938.0, 404253.0, 87501.0, 19762.0, 6017.0, 2142.0, 933.0, 478.0, 265.0, 173.0, 77.0, 63.0, 45.0, 28.0, 15.0, 15.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77294921875, -0.7420272827148438, -0.7111053466796875, -0.6801834106445312, -0.649261474609375, -0.6183395385742188, -0.5874176025390625, -0.5564956665039062, -0.52557373046875, -0.49465179443359375, -0.4637298583984375, -0.43280792236328125, -0.401885986328125, -0.37096405029296875, -0.3400421142578125, -0.30912017822265625, -0.2781982421875, -0.24727630615234375, -0.2163543701171875, -0.18543243408203125, -0.154510498046875, -0.12358856201171875, -0.0926666259765625, -0.06174468994140625, -0.03082275390625, 9.918212890625e-05, 0.0310211181640625, 0.06194305419921875, 0.092864990234375, 0.12378692626953125, 0.1547088623046875, 0.18563079833984375, 0.216552734375, 0.24747467041015625, 0.2783966064453125, 0.30931854248046875, 0.340240478515625, 0.37116241455078125, 0.4020843505859375, 0.43300628662109375, 0.46392822265625, 0.49485015869140625, 0.5257720947265625, 0.5566940307617188, 0.587615966796875, 0.6185379028320312, 0.6494598388671875, 0.6803817749023438, 0.7113037109375, 0.7422256469726562, 0.7731475830078125, 0.8040695190429688, 0.834991455078125, 0.8659133911132812, 0.8968353271484375, 0.9277572631835938, 0.95867919921875, 0.9896011352539062, 1.0205230712890625, 1.0514450073242188, 1.082366943359375, 1.1132888793945312, 1.1442108154296875, 1.1751327514648438, 1.2060546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 12.0, 17.0, 20.0, 31.0, 43.0, 50.0, 59.0, 79.0, 67.0, 79.0, 81.0, 73.0, 77.0, 82.0, 50.0, 50.0, 40.0, 31.0, 12.0, 19.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.515625, -0.5024986267089844, -0.48937225341796875, -0.4762458801269531, -0.4631195068359375, -0.4499931335449219, -0.43686676025390625, -0.4237403869628906, -0.410614013671875, -0.3974876403808594, -0.38436126708984375, -0.3712348937988281, -0.3581085205078125, -0.3449821472167969, -0.33185577392578125, -0.3187294006347656, -0.30560302734375, -0.2924766540527344, -0.27935028076171875, -0.2662239074707031, -0.2530975341796875, -0.23997116088867188, -0.22684478759765625, -0.21371841430664062, -0.200592041015625, -0.18746566772460938, -0.17433929443359375, -0.16121292114257812, -0.1480865478515625, -0.13496017456054688, -0.12183380126953125, -0.10870742797851562, -0.0955810546875, -0.08245468139648438, -0.06932830810546875, -0.056201934814453125, -0.0430755615234375, -0.029949188232421875, -0.01682281494140625, -0.003696441650390625, 0.009429931640625, 0.022556304931640625, 0.03568267822265625, 0.048809051513671875, 0.0619354248046875, 0.07506179809570312, 0.08818817138671875, 0.10131454467773438, 0.11444091796875, 0.12756729125976562, 0.14069366455078125, 0.15382003784179688, 0.1669464111328125, 0.18007278442382812, 0.19319915771484375, 0.20632553100585938, 0.219451904296875, 0.23257827758789062, 0.24570465087890625, 0.2588310241699219, 0.2719573974609375, 0.2850837707519531, 0.29821014404296875, 0.3113365173339844, 0.324462890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 3.0, 3.0, 12.0, 10.0, 11.0, 13.0, 28.0, 52.0, 52.0, 89.0, 176.0, 393.0, 787.0, 2061.0, 6962.0, 37025.0, 379407.0, 553650.0, 54567.0, 8926.0, 2475.0, 900.0, 421.0, 212.0, 107.0, 63.0, 44.0, 34.0, 12.0, 12.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4169921875, -1.374176025390625, -1.33135986328125, -1.288543701171875, -1.2457275390625, -1.202911376953125, -1.16009521484375, -1.117279052734375, -1.074462890625, -1.031646728515625, -0.98883056640625, -0.946014404296875, -0.9031982421875, -0.860382080078125, -0.81756591796875, -0.774749755859375, -0.73193359375, -0.689117431640625, -0.64630126953125, -0.603485107421875, -0.5606689453125, -0.517852783203125, -0.47503662109375, -0.432220458984375, -0.389404296875, -0.346588134765625, -0.30377197265625, -0.260955810546875, -0.2181396484375, -0.175323486328125, -0.13250732421875, -0.089691162109375, -0.046875, -0.004058837890625, 0.03875732421875, 0.081573486328125, 0.1243896484375, 0.167205810546875, 0.21002197265625, 0.252838134765625, 0.295654296875, 0.338470458984375, 0.38128662109375, 0.424102783203125, 0.4669189453125, 0.509735107421875, 0.55255126953125, 0.595367431640625, 0.63818359375, 0.680999755859375, 0.72381591796875, 0.766632080078125, 0.8094482421875, 0.852264404296875, 0.89508056640625, 0.937896728515625, 0.980712890625, 1.023529052734375, 1.06634521484375, 1.109161376953125, 1.1519775390625, 1.194793701171875, 1.23760986328125, 1.280426025390625, 1.3232421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 1.0, 2.0, 8.0, 8.0, 10.0, 11.0, 16.0, 16.0, 18.0, 33.0, 37.0, 52.0, 48.0, 61.0, 76.0, 62.0, 72.0, 69.0, 66.0, 68.0, 57.0, 43.0, 34.0, 32.0, 20.0, 24.0, 13.0, 6.0, 12.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7958984375, -1.737060546875, -1.67822265625, -1.619384765625, -1.560546875, -1.501708984375, -1.44287109375, -1.384033203125, -1.3251953125, -1.266357421875, -1.20751953125, -1.148681640625, -1.08984375, -1.031005859375, -0.97216796875, -0.913330078125, -0.8544921875, -0.795654296875, -0.73681640625, -0.677978515625, -0.619140625, -0.560302734375, -0.50146484375, -0.442626953125, -0.3837890625, -0.324951171875, -0.26611328125, -0.207275390625, -0.1484375, -0.089599609375, -0.03076171875, 0.028076171875, 0.0869140625, 0.145751953125, 0.20458984375, 0.263427734375, 0.322265625, 0.381103515625, 0.43994140625, 0.498779296875, 0.5576171875, 0.616455078125, 0.67529296875, 0.734130859375, 0.79296875, 0.851806640625, 0.91064453125, 0.969482421875, 1.0283203125, 1.087158203125, 1.14599609375, 1.204833984375, 1.263671875, 1.322509765625, 1.38134765625, 1.440185546875, 1.4990234375, 1.557861328125, 1.61669921875, 1.675537109375, 1.734375, 1.793212890625, 1.85205078125, 1.910888671875, 1.9697265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 8.0, 10.0, 14.0, 36.0, 31.0, 68.0, 115.0, 233.0, 481.0, 1073.0, 3097.0, 17338.0, 920183.0, 96065.0, 6620.0, 1753.0, 698.0, 310.0, 187.0, 92.0, 53.0, 31.0, 31.0, 6.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7570648193359375, -1.706512451171875, -1.6559600830078125, -1.60540771484375, -1.5548553466796875, -1.504302978515625, -1.4537506103515625, -1.4031982421875, -1.3526458740234375, -1.302093505859375, -1.2515411376953125, -1.20098876953125, -1.1504364013671875, -1.099884033203125, -1.0493316650390625, -0.998779296875, -0.9482269287109375, -0.897674560546875, -0.8471221923828125, -0.79656982421875, -0.7460174560546875, -0.695465087890625, -0.6449127197265625, -0.5943603515625, -0.5438079833984375, -0.493255615234375, -0.4427032470703125, -0.39215087890625, -0.3415985107421875, -0.291046142578125, -0.2404937744140625, -0.18994140625, -0.1393890380859375, -0.088836669921875, -0.0382843017578125, 0.01226806640625, 0.0628204345703125, 0.113372802734375, 0.1639251708984375, 0.2144775390625, 0.2650299072265625, 0.315582275390625, 0.3661346435546875, 0.41668701171875, 0.4672393798828125, 0.517791748046875, 0.5683441162109375, 0.618896484375, 0.6694488525390625, 0.720001220703125, 0.7705535888671875, 0.82110595703125, 0.8716583251953125, 0.922210693359375, 0.9727630615234375, 1.0233154296875, 1.0738677978515625, 1.124420166015625, 1.1749725341796875, 1.22552490234375, 1.2760772705078125, 1.326629638671875, 1.3771820068359375, 1.427734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 12.0, 25.0, 32.0, 48.0, 81.0, 153.0, 282.0, 115.0, 75.0, 48.0, 35.0, 25.0, 14.0, 11.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002751350402832031, -0.0002660974860191345, -0.0002570599317550659, -0.0002480223774909973, -0.0002389848232269287, -0.0002299472689628601, -0.0002209097146987915, -0.0002118721604347229, -0.0002028346061706543, -0.0001937970519065857, -0.0001847594976425171, -0.00017572194337844849, -0.00016668438911437988, -0.00015764683485031128, -0.00014860928058624268, -0.00013957172632217407, -0.00013053417205810547, -0.00012149661779403687, -0.00011245906352996826, -0.00010342150926589966, -9.438395500183105e-05, -8.534640073776245e-05, -7.630884647369385e-05, -6.727129220962524e-05, -5.823373794555664e-05, -4.919618368148804e-05, -4.0158629417419434e-05, -3.112107515335083e-05, -2.2083520889282227e-05, -1.3045966625213623e-05, -4.0084123611450195e-06, 5.029141902923584e-06, 1.4066696166992188e-05, 2.310425043106079e-05, 3.2141804695129395e-05, 4.1179358959198e-05, 5.02169132232666e-05, 5.9254467487335205e-05, 6.829202175140381e-05, 7.732957601547241e-05, 8.636713027954102e-05, 9.540468454360962e-05, 0.00010444223880767822, 0.00011347979307174683, 0.00012251734733581543, 0.00013155490159988403, 0.00014059245586395264, 0.00014963001012802124, 0.00015866756439208984, 0.00016770511865615845, 0.00017674267292022705, 0.00018578022718429565, 0.00019481778144836426, 0.00020385533571243286, 0.00021289288997650146, 0.00022193044424057007, 0.00023096799850463867, 0.00024000555276870728, 0.0002490431070327759, 0.0002580806612968445, 0.0002671182155609131, 0.0002761557698249817, 0.0002851933240890503, 0.0002942308783531189, 0.0003032684326171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 15.0, 30.0, 36.0, 68.0, 117.0, 189.0, 348.0, 739.0, 2145.0, 9993.0, 271421.0, 744044.0, 14902.0, 2705.0, 898.0, 365.0, 224.0, 120.0, 72.0, 42.0, 27.0, 17.0, 6.0, 9.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3720703125, -1.3306121826171875, -1.289154052734375, -1.2476959228515625, -1.20623779296875, -1.1647796630859375, -1.123321533203125, -1.0818634033203125, -1.0404052734375, -0.9989471435546875, -0.957489013671875, -0.9160308837890625, -0.87457275390625, -0.8331146240234375, -0.791656494140625, -0.7501983642578125, -0.708740234375, -0.6672821044921875, -0.625823974609375, -0.5843658447265625, -0.54290771484375, -0.5014495849609375, -0.459991455078125, -0.4185333251953125, -0.3770751953125, -0.3356170654296875, -0.294158935546875, -0.2527008056640625, -0.21124267578125, -0.1697845458984375, -0.128326416015625, -0.0868682861328125, -0.04541015625, -0.0039520263671875, 0.037506103515625, 0.0789642333984375, 0.12042236328125, 0.1618804931640625, 0.203338623046875, 0.2447967529296875, 0.2862548828125, 0.3277130126953125, 0.369171142578125, 0.4106292724609375, 0.45208740234375, 0.4935455322265625, 0.535003662109375, 0.5764617919921875, 0.617919921875, 0.6593780517578125, 0.700836181640625, 0.7422943115234375, 0.78375244140625, 0.8252105712890625, 0.866668701171875, 0.9081268310546875, 0.9495849609375, 0.9910430908203125, 1.032501220703125, 1.0739593505859375, 1.11541748046875, 1.1568756103515625, 1.198333740234375, 1.2397918701171875, 1.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 11.0, 10.0, 22.0, 45.0, 86.0, 290.0, 330.0, 101.0, 39.0, 28.0, 16.0, 13.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6894683837890625, -1.636749267578125, -1.5840301513671875, -1.53131103515625, -1.4785919189453125, -1.425872802734375, -1.3731536865234375, -1.3204345703125, -1.2677154541015625, -1.214996337890625, -1.1622772216796875, -1.10955810546875, -1.0568389892578125, -1.004119873046875, -0.9514007568359375, -0.898681640625, -0.8459625244140625, -0.793243408203125, -0.7405242919921875, -0.68780517578125, -0.6350860595703125, -0.582366943359375, -0.5296478271484375, -0.4769287109375, -0.4242095947265625, -0.371490478515625, -0.3187713623046875, -0.26605224609375, -0.2133331298828125, -0.160614013671875, -0.1078948974609375, -0.05517578125, -0.0024566650390625, 0.050262451171875, 0.1029815673828125, 0.15570068359375, 0.2084197998046875, 0.261138916015625, 0.3138580322265625, 0.3665771484375, 0.4192962646484375, 0.472015380859375, 0.5247344970703125, 0.57745361328125, 0.6301727294921875, 0.682891845703125, 0.7356109619140625, 0.788330078125, 0.8410491943359375, 0.893768310546875, 0.9464874267578125, 0.99920654296875, 1.0519256591796875, 1.104644775390625, 1.1573638916015625, 1.2100830078125, 1.2628021240234375, 1.315521240234375, 1.3682403564453125, 1.42095947265625, 1.4736785888671875, 1.526397705078125, 1.5791168212890625, 1.6318359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 13.0, 22.0, 48.0, 87.0, 109.0, 159.0, 167.0, 152.0, 96.0, 52.0, 35.0, 24.0, 11.0, 9.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.946060180664062, -10.6210355758667, -10.296010971069336, -9.970987319946289, -9.645962715148926, -9.320938110351562, -8.9959135055542, -8.670888900756836, -8.345864295959473, -8.02083969116211, -7.695815563201904, -7.370790958404541, -7.045766353607178, -6.720742225646973, -6.395717620849609, -6.070693016052246, -5.745668888092041, -5.420644283294678, -5.095620155334473, -4.770595550537109, -4.445570945739746, -4.120546340942383, -3.7955222129821777, -3.4704976081848145, -3.1454732418060303, -2.820448875427246, -2.495424270629883, -2.1703999042510986, -1.845375418663025, -1.5203509330749512, -1.195326566696167, -0.8703019618988037, -0.5452775955200195, -0.2202531397342682, 0.10477131605148315, 0.4297957420349121, 0.7548202276229858, 1.0798447132110596, 1.4048690795898438, 1.729893684387207, 2.054918050765991, 2.3799424171447754, 2.7049670219421387, 3.029991388320923, 3.355015754699707, 3.6800403594970703, 4.005064964294434, 4.330089569091797, 4.655113697052002, 4.980138301849365, 5.30516242980957, 5.630187034606934, 5.955211639404297, 6.28023624420166, 6.605260372161865, 6.9302849769592285, 7.255309104919434, 7.580333709716797, 7.905357837677002, 8.230382919311523, 8.55540657043457, 8.880431175231934, 9.205455780029297, 9.53048038482666, 9.855504989624023]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 8.0, 12.0, 13.0, 15.0, 17.0, 13.0, 21.0, 21.0, 37.0, 25.0, 37.0, 29.0, 46.0, 60.0, 47.0, 53.0, 44.0, 55.0, 47.0, 51.0, 46.0, 42.0, 28.0, 40.0, 39.0, 31.0, 21.0, 23.0, 11.0, 15.0, 7.0, 6.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.29542350769043, -8.990609169006348, -8.685794830322266, -8.3809814453125, -8.076167106628418, -7.771352767944336, -7.466538906097412, -7.161725044250488, -6.856910705566406, -6.552096366882324, -6.2472825050354, -5.942468643188477, -5.6376543045043945, -5.3328399658203125, -5.028026103973389, -4.723212242126465, -4.418397903442383, -4.113583564758301, -3.808769702911377, -3.503955602645874, -3.199141502380371, -2.894327402114868, -2.5895133018493652, -2.2846992015838623, -1.9798851013183594, -1.6750710010528564, -1.3702569007873535, -1.0654428005218506, -0.7606287002563477, -0.4558145999908447, -0.1510004997253418, 0.15381360054016113, 0.45862770080566406, 0.763441801071167, 1.06825590133667, 1.3730700016021729, 1.6778841018676758, 1.9826982021331787, 2.2875123023986816, 2.5923264026641846, 2.8971405029296875, 3.2019546031951904, 3.5067687034606934, 3.8115828037261963, 4.116396903991699, 4.421211242675781, 4.726025104522705, 5.030838966369629, 5.335653305053711, 5.640467643737793, 5.945281505584717, 6.250095367431641, 6.554909706115723, 6.859724044799805, 7.1645379066467285, 7.469351768493652, 7.774166107177734, 8.078980445861816, 8.383794784545898, 8.688608169555664, 8.993422508239746, 9.298236846923828, 9.603050231933594, 9.907864570617676, 10.212678909301758]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 16.0, 12.0, 31.0, 46.0, 82.0, 156.0, 316.0, 708.0, 1764.0, 5370.0, 24344.0, 624173.0, 3488755.0, 37455.0, 7140.0, 2261.0, 858.0, 381.0, 202.0, 100.0, 49.0, 24.0, 16.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.9042816162109375, -1.851531982421875, -1.7987823486328125, -1.74603271484375, -1.6932830810546875, -1.640533447265625, -1.5877838134765625, -1.5350341796875, -1.4822845458984375, -1.429534912109375, -1.3767852783203125, -1.32403564453125, -1.2712860107421875, -1.218536376953125, -1.1657867431640625, -1.113037109375, -1.0602874755859375, -1.007537841796875, -0.9547882080078125, -0.90203857421875, -0.8492889404296875, -0.796539306640625, -0.7437896728515625, -0.6910400390625, -0.6382904052734375, -0.585540771484375, -0.5327911376953125, -0.48004150390625, -0.4272918701171875, -0.374542236328125, -0.3217926025390625, -0.26904296875, -0.2162933349609375, -0.163543701171875, -0.1107940673828125, -0.05804443359375, -0.0052947998046875, 0.047454833984375, 0.1002044677734375, 0.1529541015625, 0.2057037353515625, 0.258453369140625, 0.3112030029296875, 0.36395263671875, 0.4167022705078125, 0.469451904296875, 0.5222015380859375, 0.574951171875, 0.6277008056640625, 0.680450439453125, 0.7332000732421875, 0.78594970703125, 0.8386993408203125, 0.891448974609375, 0.9441986083984375, 0.9969482421875, 1.0496978759765625, 1.102447509765625, 1.1551971435546875, 1.20794677734375, 1.2606964111328125, 1.313446044921875, 1.3661956787109375, 1.4189453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 13.0, 12.0, 13.0, 12.0, 16.0, 24.0, 21.0, 30.0, 46.0, 55.0, 60.0, 57.0, 71.0, 59.0, 65.0, 72.0, 59.0, 57.0, 45.0, 40.0, 48.0, 26.0, 31.0, 18.0, 12.0, 8.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.55224609375, -0.5384368896484375, -0.524627685546875, -0.5108184814453125, -0.49700927734375, -0.4832000732421875, -0.469390869140625, -0.4555816650390625, -0.4417724609375, -0.4279632568359375, -0.414154052734375, -0.4003448486328125, -0.38653564453125, -0.3727264404296875, -0.358917236328125, -0.3451080322265625, -0.331298828125, -0.3174896240234375, -0.303680419921875, -0.2898712158203125, -0.27606201171875, -0.2622528076171875, -0.248443603515625, -0.2346343994140625, -0.2208251953125, -0.2070159912109375, -0.193206787109375, -0.1793975830078125, -0.16558837890625, -0.1517791748046875, -0.137969970703125, -0.1241607666015625, -0.1103515625, -0.0965423583984375, -0.082733154296875, -0.0689239501953125, -0.05511474609375, -0.0413055419921875, -0.027496337890625, -0.0136871337890625, 0.0001220703125, 0.0139312744140625, 0.027740478515625, 0.0415496826171875, 0.05535888671875, 0.0691680908203125, 0.082977294921875, 0.0967864990234375, 0.110595703125, 0.1244049072265625, 0.138214111328125, 0.1520233154296875, 0.16583251953125, 0.1796417236328125, 0.193450927734375, 0.2072601318359375, 0.2210693359375, 0.2348785400390625, 0.248687744140625, 0.2624969482421875, 0.27630615234375, 0.2901153564453125, 0.303924560546875, 0.3177337646484375, 0.33154296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 4.0, 14.0, 14.0, 31.0, 56.0, 98.0, 168.0, 282.0, 479.0, 881.0, 1620.0, 3714.0, 10178.0, 37778.0, 265504.0, 3651427.0, 176345.0, 30415.0, 8690.0, 3229.0, 1536.0, 786.0, 426.0, 267.0, 138.0, 94.0, 28.0, 32.0, 18.0, 7.0, 10.0, 1.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.869140625, -0.83856201171875, -0.8079833984375, -0.77740478515625, -0.746826171875, -0.71624755859375, -0.6856689453125, -0.65509033203125, -0.62451171875, -0.59393310546875, -0.5633544921875, -0.53277587890625, -0.502197265625, -0.47161865234375, -0.4410400390625, -0.41046142578125, -0.3798828125, -0.34930419921875, -0.3187255859375, -0.28814697265625, -0.257568359375, -0.22698974609375, -0.1964111328125, -0.16583251953125, -0.13525390625, -0.10467529296875, -0.0740966796875, -0.04351806640625, -0.012939453125, 0.01763916015625, 0.0482177734375, 0.07879638671875, 0.109375, 0.13995361328125, 0.1705322265625, 0.20111083984375, 0.231689453125, 0.26226806640625, 0.2928466796875, 0.32342529296875, 0.35400390625, 0.38458251953125, 0.4151611328125, 0.44573974609375, 0.476318359375, 0.50689697265625, 0.5374755859375, 0.56805419921875, 0.5986328125, 0.62921142578125, 0.6597900390625, 0.69036865234375, 0.720947265625, 0.75152587890625, 0.7821044921875, 0.81268310546875, 0.84326171875, 0.87384033203125, 0.9044189453125, 0.93499755859375, 0.965576171875, 0.99615478515625, 1.0267333984375, 1.05731201171875, 1.087890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 17.0, 24.0, 24.0, 39.0, 66.0, 108.0, 254.0, 1047.0, 1749.0, 333.0, 134.0, 74.0, 42.0, 38.0, 17.0, 23.0, 8.0, 15.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.52490234375, -0.5062332153320312, -0.4875640869140625, -0.46889495849609375, -0.450225830078125, -0.43155670166015625, -0.4128875732421875, -0.39421844482421875, -0.37554931640625, -0.35688018798828125, -0.3382110595703125, -0.31954193115234375, -0.300872802734375, -0.28220367431640625, -0.2635345458984375, -0.24486541748046875, -0.2261962890625, -0.20752716064453125, -0.1888580322265625, -0.17018890380859375, -0.151519775390625, -0.13285064697265625, -0.1141815185546875, -0.09551239013671875, -0.07684326171875, -0.05817413330078125, -0.0395050048828125, -0.02083587646484375, -0.002166748046875, 0.01650238037109375, 0.0351715087890625, 0.05384063720703125, 0.072509765625, 0.09117889404296875, 0.1098480224609375, 0.12851715087890625, 0.147186279296875, 0.16585540771484375, 0.1845245361328125, 0.20319366455078125, 0.22186279296875, 0.24053192138671875, 0.2592010498046875, 0.27787017822265625, 0.296539306640625, 0.31520843505859375, 0.3338775634765625, 0.35254669189453125, 0.3712158203125, 0.38988494873046875, 0.4085540771484375, 0.42722320556640625, 0.445892333984375, 0.46456146240234375, 0.4832305908203125, 0.5018997192382812, 0.52056884765625, 0.5392379760742188, 0.5579071044921875, 0.5765762329101562, 0.595245361328125, 0.6139144897460938, 0.6325836181640625, 0.6512527465820312, 0.669921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 13.0, 78.0, 212.0, 351.0, 246.0, 66.0, 21.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3294878005981445, -4.137293815612793, -3.9450998306274414, -3.75290584564209, -3.5607118606567383, -3.3685178756713867, -3.176323890686035, -2.9841299057006836, -2.791935920715332, -2.5997419357299805, -2.407547950744629, -2.2153539657592773, -2.023159980773926, -1.8309659957885742, -1.638771891593933, -1.4465779066085815, -1.2543838024139404, -1.0621898174285889, -0.8699958324432373, -0.677801787853241, -0.4856078028678894, -0.29341381788253784, -0.1012197732925415, 0.09097421169281006, 0.2831681966781616, 0.4753621816635132, 0.6675561666488647, 0.8597502112388611, 1.0519442558288574, 1.244138240814209, 1.4363322257995605, 1.628526210784912, 1.8207201957702637, 2.0129141807556152, 2.205108165740967, 2.3973021507263184, 2.58949613571167, 2.7816901206970215, 2.973884105682373, 3.1660780906677246, 3.358272075653076, 3.5504660606384277, 3.7426600456237793, 3.934854030609131, 4.127048015594482, 4.319242000579834, 4.5114359855651855, 4.703629970550537, 4.895824432373047, 5.088018417358398, 5.28021240234375, 5.472406387329102, 5.664600372314453, 5.856794357299805, 6.048988342285156, 6.241182327270508, 6.433376312255859, 6.625570297241211, 6.8177642822265625, 7.009958267211914, 7.202152252197266, 7.394346237182617, 7.586540222167969, 7.77873420715332, 7.970928192138672]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 9.0, 7.0, 8.0, 10.0, 19.0, 24.0, 29.0, 41.0, 33.0, 35.0, 46.0, 56.0, 57.0, 72.0, 65.0, 62.0, 64.0, 66.0, 49.0, 51.0, 42.0, 33.0, 25.0, 16.0, 20.0, 22.0, 12.0, 12.0, 9.0, 7.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9040982723236084, -2.8329567909240723, -2.761815309524536, -2.690673828125, -2.6195321083068848, -2.5483906269073486, -2.4772491455078125, -2.4061076641082764, -2.3349661827087402, -2.263824701309204, -2.192683219909668, -2.121541738510132, -2.0504002571105957, -1.97925865650177, -1.9081170558929443, -1.8369755744934082, -1.765834093093872, -1.694692611694336, -1.6235511302947998, -1.5524095296859741, -1.481268048286438, -1.4101265668869019, -1.3389849662780762, -1.26784348487854, -1.196702003479004, -1.1255605220794678, -1.0544190406799316, -0.983277440071106, -0.9121359586715698, -0.8409944772720337, -0.7698529362678528, -0.6987113952636719, -0.6275696754455566, -0.5564281940460205, -0.4852866530418396, -0.4141451418399811, -0.34300363063812256, -0.27186211943626404, -0.20072060823440552, -0.129579097032547, -0.05843758583068848, 0.012703925371170044, 0.08384543657302856, 0.15498694777488708, 0.2261284589767456, 0.2972699701786041, 0.36841148138046265, 0.43955299258232117, 0.5106945037841797, 0.5818359851837158, 0.6529775261878967, 0.7241190671920776, 0.7952605485916138, 0.8664020299911499, 0.9375435709953308, 1.0086851119995117, 1.0798265933990479, 1.150968074798584, 1.2221095561981201, 1.2932511568069458, 1.364392638206482, 1.435534119606018, 1.5066757202148438, 1.5778172016143799, 1.648958683013916]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 12.0, 26.0, 48.0, 71.0, 100.0, 191.0, 300.0, 598.0, 1111.0, 2709.0, 7038.0, 22795.0, 82856.0, 298524.0, 422799.0, 150424.0, 39541.0, 11746.0, 4150.0, 1767.0, 798.0, 381.0, 203.0, 137.0, 80.0, 49.0, 36.0, 14.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2490234375, -1.2171783447265625, -1.185333251953125, -1.1534881591796875, -1.12164306640625, -1.0897979736328125, -1.057952880859375, -1.0261077880859375, -0.9942626953125, -0.9624176025390625, -0.930572509765625, -0.8987274169921875, -0.86688232421875, -0.8350372314453125, -0.803192138671875, -0.7713470458984375, -0.739501953125, -0.7076568603515625, -0.675811767578125, -0.6439666748046875, -0.61212158203125, -0.5802764892578125, -0.548431396484375, -0.5165863037109375, -0.4847412109375, -0.4528961181640625, -0.421051025390625, -0.3892059326171875, -0.35736083984375, -0.3255157470703125, -0.293670654296875, -0.2618255615234375, -0.22998046875, -0.1981353759765625, -0.166290283203125, -0.1344451904296875, -0.10260009765625, -0.0707550048828125, -0.038909912109375, -0.0070648193359375, 0.0247802734375, 0.0566253662109375, 0.088470458984375, 0.1203155517578125, 0.15216064453125, 0.1840057373046875, 0.215850830078125, 0.2476959228515625, 0.279541015625, 0.3113861083984375, 0.343231201171875, 0.3750762939453125, 0.40692138671875, 0.4387664794921875, 0.470611572265625, 0.5024566650390625, 0.5343017578125, 0.5661468505859375, 0.597991943359375, 0.6298370361328125, 0.66168212890625, 0.6935272216796875, 0.725372314453125, 0.7572174072265625, 0.7890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 8.0, 14.0, 16.0, 18.0, 24.0, 29.0, 33.0, 31.0, 57.0, 58.0, 68.0, 76.0, 69.0, 69.0, 63.0, 57.0, 50.0, 53.0, 44.0, 42.0, 28.0, 25.0, 14.0, 13.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.53369140625, -0.519927978515625, -0.50616455078125, -0.492401123046875, -0.4786376953125, -0.464874267578125, -0.45111083984375, -0.437347412109375, -0.423583984375, -0.409820556640625, -0.39605712890625, -0.382293701171875, -0.3685302734375, -0.354766845703125, -0.34100341796875, -0.327239990234375, -0.3134765625, -0.299713134765625, -0.28594970703125, -0.272186279296875, -0.2584228515625, -0.244659423828125, -0.23089599609375, -0.217132568359375, -0.203369140625, -0.189605712890625, -0.17584228515625, -0.162078857421875, -0.1483154296875, -0.134552001953125, -0.12078857421875, -0.107025146484375, -0.09326171875, -0.079498291015625, -0.06573486328125, -0.051971435546875, -0.0382080078125, -0.024444580078125, -0.01068115234375, 0.003082275390625, 0.016845703125, 0.030609130859375, 0.04437255859375, 0.058135986328125, 0.0718994140625, 0.085662841796875, 0.09942626953125, 0.113189697265625, 0.126953125, 0.140716552734375, 0.15447998046875, 0.168243408203125, 0.1820068359375, 0.195770263671875, 0.20953369140625, 0.223297119140625, 0.237060546875, 0.250823974609375, 0.26458740234375, 0.278350830078125, 0.2921142578125, 0.305877685546875, 0.31964111328125, 0.333404541015625, 0.34716796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 12.0, 14.0, 33.0, 36.0, 32.0, 49.0, 65.0, 98.0, 153.0, 228.0, 383.0, 765.0, 1587.0, 4188.0, 13534.0, 56294.0, 308708.0, 518749.0, 109144.0, 23013.0, 6565.0, 2385.0, 1018.0, 547.0, 296.0, 178.0, 106.0, 76.0, 63.0, 42.0, 30.0, 27.0, 16.0, 20.0, 16.0, 12.0, 8.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0], "bins": [-1.58203125, -1.538330078125, -1.49462890625, -1.450927734375, -1.4072265625, -1.363525390625, -1.31982421875, -1.276123046875, -1.232421875, -1.188720703125, -1.14501953125, -1.101318359375, -1.0576171875, -1.013916015625, -0.97021484375, -0.926513671875, -0.8828125, -0.839111328125, -0.79541015625, -0.751708984375, -0.7080078125, -0.664306640625, -0.62060546875, -0.576904296875, -0.533203125, -0.489501953125, -0.44580078125, -0.402099609375, -0.3583984375, -0.314697265625, -0.27099609375, -0.227294921875, -0.18359375, -0.139892578125, -0.09619140625, -0.052490234375, -0.0087890625, 0.034912109375, 0.07861328125, 0.122314453125, 0.166015625, 0.209716796875, 0.25341796875, 0.297119140625, 0.3408203125, 0.384521484375, 0.42822265625, 0.471923828125, 0.515625, 0.559326171875, 0.60302734375, 0.646728515625, 0.6904296875, 0.734130859375, 0.77783203125, 0.821533203125, 0.865234375, 0.908935546875, 0.95263671875, 0.996337890625, 1.0400390625, 1.083740234375, 1.12744140625, 1.171142578125, 1.21484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 5.0, 8.0, 11.0, 7.0, 15.0, 22.0, 24.0, 24.0, 20.0, 35.0, 24.0, 37.0, 40.0, 46.0, 42.0, 46.0, 40.0, 49.0, 46.0, 55.0, 57.0, 36.0, 40.0, 39.0, 39.0, 34.0, 29.0, 19.0, 21.0, 14.0, 19.0, 16.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.03125, -1.961151123046875, -1.89105224609375, -1.820953369140625, -1.7508544921875, -1.680755615234375, -1.61065673828125, -1.540557861328125, -1.470458984375, -1.400360107421875, -1.33026123046875, -1.260162353515625, -1.1900634765625, -1.119964599609375, -1.04986572265625, -0.979766845703125, -0.90966796875, -0.839569091796875, -0.76947021484375, -0.699371337890625, -0.6292724609375, -0.559173583984375, -0.48907470703125, -0.418975830078125, -0.348876953125, -0.278778076171875, -0.20867919921875, -0.138580322265625, -0.0684814453125, 0.001617431640625, 0.07171630859375, 0.141815185546875, 0.2119140625, 0.282012939453125, 0.35211181640625, 0.422210693359375, 0.4923095703125, 0.562408447265625, 0.63250732421875, 0.702606201171875, 0.772705078125, 0.842803955078125, 0.91290283203125, 0.983001708984375, 1.0531005859375, 1.123199462890625, 1.19329833984375, 1.263397216796875, 1.33349609375, 1.403594970703125, 1.47369384765625, 1.543792724609375, 1.6138916015625, 1.683990478515625, 1.75408935546875, 1.824188232421875, 1.894287109375, 1.964385986328125, 2.03448486328125, 2.104583740234375, 2.1746826171875, 2.244781494140625, 2.31488037109375, 2.384979248046875, 2.455078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 4.0, 2.0, 7.0, 30.0, 33.0, 40.0, 54.0, 80.0, 128.0, 201.0, 355.0, 758.0, 1792.0, 5558.0, 31875.0, 551230.0, 422240.0, 25831.0, 5029.0, 1702.0, 664.0, 328.0, 217.0, 110.0, 78.0, 44.0, 42.0, 30.0, 17.0, 17.0, 12.0, 1.0, 7.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.86663818359375, -0.8319091796875, -0.79718017578125, -0.762451171875, -0.72772216796875, -0.6929931640625, -0.65826416015625, -0.62353515625, -0.58880615234375, -0.5540771484375, -0.51934814453125, -0.484619140625, -0.44989013671875, -0.4151611328125, -0.38043212890625, -0.345703125, -0.31097412109375, -0.2762451171875, -0.24151611328125, -0.206787109375, -0.17205810546875, -0.1373291015625, -0.10260009765625, -0.06787109375, -0.03314208984375, 0.0015869140625, 0.03631591796875, 0.071044921875, 0.10577392578125, 0.1405029296875, 0.17523193359375, 0.2099609375, 0.24468994140625, 0.2794189453125, 0.31414794921875, 0.348876953125, 0.38360595703125, 0.4183349609375, 0.45306396484375, 0.48779296875, 0.52252197265625, 0.5572509765625, 0.59197998046875, 0.626708984375, 0.66143798828125, 0.6961669921875, 0.73089599609375, 0.765625, 0.80035400390625, 0.8350830078125, 0.86981201171875, 0.904541015625, 0.93927001953125, 0.9739990234375, 1.00872802734375, 1.04345703125, 1.07818603515625, 1.1129150390625, 1.14764404296875, 1.182373046875, 1.21710205078125, 1.2518310546875, 1.28656005859375, 1.3212890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 13.0, 27.0, 46.0, 59.0, 101.0, 142.0, 180.0, 145.0, 112.0, 64.0, 48.0, 21.0, 10.0, 11.0, 9.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004057884216308594, -0.00039441511034965515, -0.00038304179906845093, -0.0003716684877872467, -0.0003602951765060425, -0.00034892186522483826, -0.00033754855394363403, -0.0003261752426624298, -0.0003148019313812256, -0.00030342862010002136, -0.00029205530881881714, -0.0002806819975376129, -0.0002693086862564087, -0.00025793537497520447, -0.00024656206369400024, -0.00023518875241279602, -0.0002238154411315918, -0.00021244212985038757, -0.00020106881856918335, -0.00018969550728797913, -0.0001783221960067749, -0.00016694888472557068, -0.00015557557344436646, -0.00014420226216316223, -0.000132828950881958, -0.00012145563960075378, -0.00011008232831954956, -9.870901703834534e-05, -8.733570575714111e-05, -7.596239447593689e-05, -6.458908319473267e-05, -5.321577191352844e-05, -4.184246063232422e-05, -3.0469149351119995e-05, -1.909583806991577e-05, -7.722526788711548e-06, 3.6507844924926758e-06, 1.50240957736969e-05, 2.6397407054901123e-05, 3.777071833610535e-05, 4.914402961730957e-05, 6.0517340898513794e-05, 7.189065217971802e-05, 8.326396346092224e-05, 9.463727474212646e-05, 0.00010601058602333069, 0.00011738389730453491, 0.00012875720858573914, 0.00014013051986694336, 0.00015150383114814758, 0.0001628771424293518, 0.00017425045371055603, 0.00018562376499176025, 0.00019699707627296448, 0.0002083703875541687, 0.00021974369883537292, 0.00023111701011657715, 0.00024249032139778137, 0.0002538636326789856, 0.0002652369439601898, 0.00027661025524139404, 0.00028798356652259827, 0.0002993568778038025, 0.0003107301890850067, 0.00032210350036621094]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 6.0, 10.0, 5.0, 13.0, 10.0, 14.0, 24.0, 39.0, 55.0, 92.0, 184.0, 293.0, 558.0, 1181.0, 3459.0, 14392.0, 110119.0, 723972.0, 167794.0, 19219.0, 4238.0, 1443.0, 621.0, 324.0, 164.0, 108.0, 51.0, 45.0, 31.0, 25.0, 16.0, 8.0, 12.0, 5.0, 4.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8719863891601562, -0.8460235595703125, -0.8200607299804688, -0.794097900390625, -0.7681350708007812, -0.7421722412109375, -0.7162094116210938, -0.69024658203125, -0.6642837524414062, -0.6383209228515625, -0.6123580932617188, -0.586395263671875, -0.5604324340820312, -0.5344696044921875, -0.5085067749023438, -0.4825439453125, -0.45658111572265625, -0.4306182861328125, -0.40465545654296875, -0.378692626953125, -0.35272979736328125, -0.3267669677734375, -0.30080413818359375, -0.27484130859375, -0.24887847900390625, -0.2229156494140625, -0.19695281982421875, -0.170989990234375, -0.14502716064453125, -0.1190643310546875, -0.09310150146484375, -0.067138671875, -0.04117584228515625, -0.0152130126953125, 0.01074981689453125, 0.036712646484375, 0.06267547607421875, 0.0886383056640625, 0.11460113525390625, 0.14056396484375, 0.16652679443359375, 0.1924896240234375, 0.21845245361328125, 0.244415283203125, 0.27037811279296875, 0.2963409423828125, 0.32230377197265625, 0.3482666015625, 0.37422943115234375, 0.4001922607421875, 0.42615509033203125, 0.452117919921875, 0.47808074951171875, 0.5040435791015625, 0.5300064086914062, 0.55596923828125, 0.5819320678710938, 0.6078948974609375, 0.6338577270507812, 0.659820556640625, 0.6857833862304688, 0.7117462158203125, 0.7377090454101562, 0.763671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 6.0, 7.0, 7.0, 7.0, 11.0, 7.0, 20.0, 23.0, 22.0, 35.0, 64.0, 92.0, 135.0, 179.0, 130.0, 73.0, 59.0, 35.0, 25.0, 20.0, 13.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.218353271484375, -1.18182373046875, -1.145294189453125, -1.1087646484375, -1.072235107421875, -1.03570556640625, -0.999176025390625, -0.962646484375, -0.926116943359375, -0.88958740234375, -0.853057861328125, -0.8165283203125, -0.779998779296875, -0.74346923828125, -0.706939697265625, -0.67041015625, -0.633880615234375, -0.59735107421875, -0.560821533203125, -0.5242919921875, -0.487762451171875, -0.45123291015625, -0.414703369140625, -0.378173828125, -0.341644287109375, -0.30511474609375, -0.268585205078125, -0.2320556640625, -0.195526123046875, -0.15899658203125, -0.122467041015625, -0.0859375, -0.049407958984375, -0.01287841796875, 0.023651123046875, 0.0601806640625, 0.096710205078125, 0.13323974609375, 0.169769287109375, 0.206298828125, 0.242828369140625, 0.27935791015625, 0.315887451171875, 0.3524169921875, 0.388946533203125, 0.42547607421875, 0.462005615234375, 0.49853515625, 0.535064697265625, 0.57159423828125, 0.608123779296875, 0.6446533203125, 0.681182861328125, 0.71771240234375, 0.754241943359375, 0.790771484375, 0.827301025390625, 0.86383056640625, 0.900360107421875, 0.9368896484375, 0.973419189453125, 1.00994873046875, 1.046478271484375, 1.0830078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 24.0, 95.0, 299.0, 394.0, 159.0, 29.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.806396484375, -21.77716064453125, -20.7479248046875, -19.71868896484375, -18.689451217651367, -17.660215377807617, -16.630979537963867, -15.601743698120117, -14.57250690460205, -13.5432710647583, -12.514034271240234, -11.484798431396484, -10.455562591552734, -9.426325798034668, -8.397089958190918, -7.36785364151001, -6.338617324829102, -5.309381008148193, -4.280144691467285, -3.250908851623535, -2.221672534942627, -1.1924362182617188, -0.16320037841796875, 0.8660359382629395, 1.8952722549438477, 2.924508571624756, 3.953744649887085, 4.982980728149414, 6.012217044830322, 7.0414533615112305, 8.07068920135498, 9.099925994873047, 10.129161834716797, 11.158397674560547, 12.187634468078613, 13.216870307922363, 14.24610710144043, 15.27534294128418, 16.30457878112793, 17.33381462097168, 18.363052368164062, 19.392288208007812, 20.421524047851562, 21.450759887695312, 22.479997634887695, 23.509233474731445, 24.538469314575195, 25.567705154418945, 26.596940994262695, 27.626176834106445, 28.655412673950195, 29.684650421142578, 30.713886260986328, 31.743122100830078, 32.77235794067383, 33.80159378051758, 34.83082962036133, 35.86006546020508, 36.88930130004883, 37.91853713989258, 38.94777297973633, 39.977012634277344, 41.006248474121094, 42.035484313964844, 43.064720153808594]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 4.0, 6.0, 20.0, 16.0, 11.0, 17.0, 24.0, 29.0, 33.0, 37.0, 43.0, 46.0, 61.0, 63.0, 72.0, 58.0, 43.0, 61.0, 44.0, 43.0, 36.0, 44.0, 34.0, 29.0, 25.0, 22.0, 13.0, 10.0, 10.0, 8.0, 2.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.344871520996094, -10.91799545288086, -10.491120338439941, -10.064244270324707, -9.637369155883789, -9.210493087768555, -8.783617973327637, -8.356741905212402, -7.929866790771484, -7.502991199493408, -7.076115608215332, -6.649240016937256, -6.22236442565918, -5.795488357543945, -5.368613243103027, -4.941737174987793, -4.514861583709717, -4.087985992431641, -3.6611104011535645, -3.2342348098754883, -2.807359218597412, -2.380483388900757, -1.9536077976226807, -1.5267322063446045, -1.0998566150665283, -0.6729810237884521, -0.2461053729057312, 0.18077027797698975, 0.6076458692550659, 1.0345215797424316, 1.4613971710205078, 1.888272762298584, 2.31514835357666, 2.7420239448547363, 3.1688995361328125, 3.5957751274108887, 4.022650718688965, 4.449526786804199, 4.876401901245117, 5.303277969360352, 5.7301530838012695, 6.157028675079346, 6.583904266357422, 7.010779857635498, 7.437655448913574, 7.864531517028809, 8.291406631469727, 8.718282699584961, 9.145158767700195, 9.57203483581543, 9.998909950256348, 10.425786018371582, 10.8526611328125, 11.279537200927734, 11.706412315368652, 12.133288383483887, 12.560163497924805, 12.987039566040039, 13.413914680480957, 13.840790748596191, 14.26766586303711, 14.694541931152344, 15.121417045593262, 15.548293113708496, 15.975168228149414]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 12.0, 10.0, 13.0, 23.0, 38.0, 88.0, 154.0, 301.0, 576.0, 1289.0, 3161.0, 8693.0, 30998.0, 246978.0, 3817183.0, 61583.0, 14307.0, 4915.0, 1938.0, 920.0, 445.0, 263.0, 151.0, 73.0, 65.0, 36.0, 18.0, 16.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.226837158203125, -1.19097900390625, -1.155120849609375, -1.1192626953125, -1.083404541015625, -1.04754638671875, -1.011688232421875, -0.975830078125, -0.939971923828125, -0.90411376953125, -0.868255615234375, -0.8323974609375, -0.796539306640625, -0.76068115234375, -0.724822998046875, -0.68896484375, -0.653106689453125, -0.61724853515625, -0.581390380859375, -0.5455322265625, -0.509674072265625, -0.47381591796875, -0.437957763671875, -0.402099609375, -0.366241455078125, -0.33038330078125, -0.294525146484375, -0.2586669921875, -0.222808837890625, -0.18695068359375, -0.151092529296875, -0.115234375, -0.079376220703125, -0.04351806640625, -0.007659912109375, 0.0281982421875, 0.064056396484375, 0.09991455078125, 0.135772705078125, 0.171630859375, 0.207489013671875, 0.24334716796875, 0.279205322265625, 0.3150634765625, 0.350921630859375, 0.38677978515625, 0.422637939453125, 0.45849609375, 0.494354248046875, 0.53021240234375, 0.566070556640625, 0.6019287109375, 0.637786865234375, 0.67364501953125, 0.709503173828125, 0.745361328125, 0.781219482421875, 0.81707763671875, 0.852935791015625, 0.8887939453125, 0.924652099609375, 0.96051025390625, 0.996368408203125, 1.0322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 4.0, 6.0, 9.0, 17.0, 18.0, 24.0, 31.0, 25.0, 36.0, 51.0, 56.0, 71.0, 84.0, 62.0, 87.0, 55.0, 74.0, 55.0, 53.0, 30.0, 38.0, 23.0, 19.0, 18.0, 7.0, 16.0, 7.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5606002807617188, -0.5425872802734375, -0.5245742797851562, -0.506561279296875, -0.48854827880859375, -0.4705352783203125, -0.45252227783203125, -0.43450927734375, -0.41649627685546875, -0.3984832763671875, -0.38047027587890625, -0.362457275390625, -0.34444427490234375, -0.3264312744140625, -0.30841827392578125, -0.2904052734375, -0.27239227294921875, -0.2543792724609375, -0.23636627197265625, -0.218353271484375, -0.20034027099609375, -0.1823272705078125, -0.16431427001953125, -0.14630126953125, -0.12828826904296875, -0.1102752685546875, -0.09226226806640625, -0.074249267578125, -0.05623626708984375, -0.0382232666015625, -0.02021026611328125, -0.002197265625, 0.01581573486328125, 0.0338287353515625, 0.05184173583984375, 0.069854736328125, 0.08786773681640625, 0.1058807373046875, 0.12389373779296875, 0.14190673828125, 0.15991973876953125, 0.1779327392578125, 0.19594573974609375, 0.213958740234375, 0.23197174072265625, 0.2499847412109375, 0.26799774169921875, 0.2860107421875, 0.30402374267578125, 0.3220367431640625, 0.34004974365234375, 0.358062744140625, 0.37607574462890625, 0.3940887451171875, 0.41210174560546875, 0.43011474609375, 0.44812774658203125, 0.4661407470703125, 0.48415374755859375, 0.502166748046875, 0.5201797485351562, 0.5381927490234375, 0.5562057495117188, 0.57421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 9.0, 18.0, 16.0, 21.0, 33.0, 41.0, 73.0, 104.0, 166.0, 249.0, 408.0, 644.0, 1073.0, 1827.0, 3501.0, 7022.0, 16315.0, 51942.0, 402801.0, 3580192.0, 86038.0, 22899.0, 9207.0, 4197.0, 2135.0, 1264.0, 762.0, 448.0, 288.0, 188.0, 114.0, 78.0, 60.0, 50.0, 31.0, 18.0, 17.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.5936050415039062, -0.5690460205078125, -0.5444869995117188, -0.519927978515625, -0.49536895751953125, -0.4708099365234375, -0.44625091552734375, -0.42169189453125, -0.39713287353515625, -0.3725738525390625, -0.34801483154296875, -0.323455810546875, -0.29889678955078125, -0.2743377685546875, -0.24977874755859375, -0.2252197265625, -0.20066070556640625, -0.1761016845703125, -0.15154266357421875, -0.126983642578125, -0.10242462158203125, -0.0778656005859375, -0.05330657958984375, -0.02874755859375, -0.00418853759765625, 0.0203704833984375, 0.04492950439453125, 0.069488525390625, 0.09404754638671875, 0.1186065673828125, 0.14316558837890625, 0.167724609375, 0.19228363037109375, 0.2168426513671875, 0.24140167236328125, 0.265960693359375, 0.29051971435546875, 0.3150787353515625, 0.33963775634765625, 0.36419677734375, 0.38875579833984375, 0.4133148193359375, 0.43787384033203125, 0.462432861328125, 0.48699188232421875, 0.5115509033203125, 0.5361099243164062, 0.5606689453125, 0.5852279663085938, 0.6097869873046875, 0.6343460083007812, 0.658905029296875, 0.6834640502929688, 0.7080230712890625, 0.7325820922851562, 0.75714111328125, 0.7817001342773438, 0.8062591552734375, 0.8308181762695312, 0.855377197265625, 0.8799362182617188, 0.9044952392578125, 0.9290542602539062, 0.95361328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 3.0, 4.0, 9.0, 13.0, 15.0, 25.0, 43.0, 73.0, 191.0, 2681.0, 727.0, 123.0, 55.0, 35.0, 16.0, 15.0, 6.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254150390625, -0.24565505981445312, -0.23715972900390625, -0.22866439819335938, -0.2201690673828125, -0.21167373657226562, -0.20317840576171875, -0.19468307495117188, -0.186187744140625, -0.17769241333007812, -0.16919708251953125, -0.16070175170898438, -0.1522064208984375, -0.14371109008789062, -0.13521575927734375, -0.12672042846679688, -0.11822509765625, -0.10972976684570312, -0.10123443603515625, -0.09273910522460938, -0.0842437744140625, -0.07574844360351562, -0.06725311279296875, -0.058757781982421875, -0.050262451171875, -0.041767120361328125, -0.03327178955078125, -0.024776458740234375, -0.0162811279296875, -0.007785797119140625, 0.00070953369140625, 0.009204864501953125, 0.0177001953125, 0.026195526123046875, 0.03469085693359375, 0.043186187744140625, 0.0516815185546875, 0.060176849365234375, 0.06867218017578125, 0.07716751098632812, 0.085662841796875, 0.09415817260742188, 0.10265350341796875, 0.11114883422851562, 0.1196441650390625, 0.12813949584960938, 0.13663482666015625, 0.14513015747070312, 0.15362548828125, 0.16212081909179688, 0.17061614990234375, 0.17911148071289062, 0.1876068115234375, 0.19610214233398438, 0.20459747314453125, 0.21309280395507812, 0.221588134765625, 0.23008346557617188, 0.23857879638671875, 0.24707412719726562, 0.2555694580078125, 0.2640647888183594, 0.27256011962890625, 0.2810554504394531, 0.28955078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 15.0, 30.0, 66.0, 136.0, 195.0, 202.0, 176.0, 100.0, 49.0, 15.0, 11.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6148810386657715, -1.5642696619033813, -1.5136581659317017, -1.4630467891693115, -1.4124352931976318, -1.3618239164352417, -1.3112125396728516, -1.2606010437011719, -1.2099895477294922, -1.159378170967102, -1.1087666749954224, -1.0581552982330322, -1.0075438022613525, -0.9569324254989624, -0.9063209891319275, -0.8557095527648926, -0.8050981760025024, -0.7544867396354675, -0.7038753032684326, -0.6532639265060425, -0.6026524305343628, -0.5520410537719727, -0.5014296174049377, -0.45081818103790283, -0.4002067446708679, -0.349595308303833, -0.2989838719367981, -0.24837246537208557, -0.19776102900505066, -0.14714959263801575, -0.09653818607330322, -0.04592674970626831, 0.0046846866607666016, 0.05529611557722092, 0.10590754449367523, 0.15651896595954895, 0.20713040232658386, 0.2577418386936188, 0.3083532452583313, 0.3589646816253662, 0.4095761179924011, 0.46018755435943604, 0.510798990726471, 0.5614104270935059, 0.612021803855896, 0.6626332998275757, 0.7132446765899658, 0.7638561129570007, 0.8144675493240356, 0.8650789856910706, 0.9156904220581055, 0.9663017988204956, 1.0169132947921753, 1.0675246715545654, 1.1181361675262451, 1.1687475442886353, 1.2193589210510254, 1.2699702978134155, 1.3205817937850952, 1.3711931705474854, 1.421804666519165, 1.4724160432815552, 1.5230274200439453, 1.573638916015625, 1.6242504119873047]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 7.0, 7.0, 10.0, 13.0, 15.0, 13.0, 19.0, 21.0, 23.0, 24.0, 29.0, 33.0, 26.0, 30.0, 29.0, 29.0, 30.0, 27.0, 32.0, 36.0, 29.0, 32.0, 34.0, 39.0, 35.0, 32.0, 41.0, 27.0, 21.0, 29.0, 24.0, 28.0, 26.0, 24.0, 12.0, 18.0, 15.0, 13.0, 10.0, 8.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5489764213562012, -0.5324448347091675, -0.515913188457489, -0.4993816018104553, -0.48285001516342163, -0.46631839871406555, -0.4497867822647095, -0.4332551956176758, -0.4167235791683197, -0.4001919627189636, -0.38366037607192993, -0.36712875962257385, -0.3505971431732178, -0.3340655565261841, -0.317533940076828, -0.3010023236274719, -0.28447073698043823, -0.26793912053108215, -0.25140753388404846, -0.23487591743469238, -0.2183443158864975, -0.2018127143383026, -0.18528109788894653, -0.16874949634075165, -0.15221789479255676, -0.13568629324436188, -0.1191546842455864, -0.10262307524681091, -0.08609147369861603, -0.06955987215042114, -0.05302826315164566, -0.03649665415287018, -0.019964993000030518, -0.003433387726545334, 0.01309821754693985, 0.029629822820425034, 0.04616142809391022, 0.0626930296421051, 0.07922463864088058, 0.09575624763965607, 0.11228784918785095, 0.12881945073604584, 0.14535105228424072, 0.1618826687335968, 0.1784142702817917, 0.19494587182998657, 0.21147748827934265, 0.22800908982753754, 0.24454069137573242, 0.2610723078250885, 0.2776038944721222, 0.29413551092147827, 0.31066709756851196, 0.32719871401786804, 0.3437303304672241, 0.3602619171142578, 0.3767935335636139, 0.39332515001296997, 0.40985673666000366, 0.42638835310935974, 0.4429199695587158, 0.4594515562057495, 0.4759831726551056, 0.49251478910446167, 0.5090463757514954]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 28.0, 33.0, 55.0, 83.0, 161.0, 379.0, 895.0, 2942.0, 12090.0, 69020.0, 407432.0, 454410.0, 81439.0, 14194.0, 3441.0, 1082.0, 409.0, 209.0, 88.0, 44.0, 40.0, 11.0, 16.0, 13.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.585296630859375, -1.53582763671875, -1.486358642578125, -1.4368896484375, -1.387420654296875, -1.33795166015625, -1.288482666015625, -1.239013671875, -1.189544677734375, -1.14007568359375, -1.090606689453125, -1.0411376953125, -0.991668701171875, -0.94219970703125, -0.892730712890625, -0.84326171875, -0.793792724609375, -0.74432373046875, -0.694854736328125, -0.6453857421875, -0.595916748046875, -0.54644775390625, -0.496978759765625, -0.447509765625, -0.398040771484375, -0.34857177734375, -0.299102783203125, -0.2496337890625, -0.200164794921875, -0.15069580078125, -0.101226806640625, -0.0517578125, -0.002288818359375, 0.04718017578125, 0.096649169921875, 0.1461181640625, 0.195587158203125, 0.24505615234375, 0.294525146484375, 0.343994140625, 0.393463134765625, 0.44293212890625, 0.492401123046875, 0.5418701171875, 0.591339111328125, 0.64080810546875, 0.690277099609375, 0.73974609375, 0.789215087890625, 0.83868408203125, 0.888153076171875, 0.9376220703125, 0.987091064453125, 1.03656005859375, 1.086029052734375, 1.135498046875, 1.184967041015625, 1.23443603515625, 1.283905029296875, 1.3333740234375, 1.382843017578125, 1.43231201171875, 1.481781005859375, 1.53125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 5.0, 13.0, 24.0, 20.0, 29.0, 31.0, 34.0, 39.0, 65.0, 66.0, 67.0, 72.0, 78.0, 71.0, 66.0, 45.0, 57.0, 47.0, 33.0, 27.0, 18.0, 21.0, 15.0, 10.0, 10.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.583984375, -0.56597900390625, -0.5479736328125, -0.52996826171875, -0.511962890625, -0.49395751953125, -0.4759521484375, -0.45794677734375, -0.43994140625, -0.42193603515625, -0.4039306640625, -0.38592529296875, -0.367919921875, -0.34991455078125, -0.3319091796875, -0.31390380859375, -0.2958984375, -0.27789306640625, -0.2598876953125, -0.24188232421875, -0.223876953125, -0.20587158203125, -0.1878662109375, -0.16986083984375, -0.15185546875, -0.13385009765625, -0.1158447265625, -0.09783935546875, -0.079833984375, -0.06182861328125, -0.0438232421875, -0.02581787109375, -0.0078125, 0.01019287109375, 0.0281982421875, 0.04620361328125, 0.064208984375, 0.08221435546875, 0.1002197265625, 0.11822509765625, 0.13623046875, 0.15423583984375, 0.1722412109375, 0.19024658203125, 0.208251953125, 0.22625732421875, 0.2442626953125, 0.26226806640625, 0.2802734375, 0.29827880859375, 0.3162841796875, 0.33428955078125, 0.352294921875, 0.37030029296875, 0.3883056640625, 0.40631103515625, 0.42431640625, 0.44232177734375, 0.4603271484375, 0.47833251953125, 0.496337890625, 0.51434326171875, 0.5323486328125, 0.55035400390625, 0.568359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 12.0, 5.0, 13.0, 16.0, 22.0, 33.0, 40.0, 72.0, 131.0, 222.0, 410.0, 987.0, 3208.0, 15067.0, 146144.0, 751668.0, 113096.0, 12738.0, 2842.0, 923.0, 382.0, 195.0, 109.0, 59.0, 47.0, 29.0, 24.0, 13.0, 14.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.63671875, -2.566314697265625, -2.49591064453125, -2.425506591796875, -2.3551025390625, -2.284698486328125, -2.21429443359375, -2.143890380859375, -2.073486328125, -2.003082275390625, -1.93267822265625, -1.862274169921875, -1.7918701171875, -1.721466064453125, -1.65106201171875, -1.580657958984375, -1.51025390625, -1.439849853515625, -1.36944580078125, -1.299041748046875, -1.2286376953125, -1.158233642578125, -1.08782958984375, -1.017425537109375, -0.947021484375, -0.876617431640625, -0.80621337890625, -0.735809326171875, -0.6654052734375, -0.595001220703125, -0.52459716796875, -0.454193115234375, -0.3837890625, -0.313385009765625, -0.24298095703125, -0.172576904296875, -0.1021728515625, -0.031768798828125, 0.03863525390625, 0.109039306640625, 0.179443359375, 0.249847412109375, 0.32025146484375, 0.390655517578125, 0.4610595703125, 0.531463623046875, 0.60186767578125, 0.672271728515625, 0.74267578125, 0.813079833984375, 0.88348388671875, 0.953887939453125, 1.0242919921875, 1.094696044921875, 1.16510009765625, 1.235504150390625, 1.305908203125, 1.376312255859375, 1.44671630859375, 1.517120361328125, 1.5875244140625, 1.657928466796875, 1.72833251953125, 1.798736572265625, 1.869140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 8.0, 5.0, 10.0, 9.0, 10.0, 16.0, 13.0, 25.0, 29.0, 24.0, 21.0, 44.0, 33.0, 48.0, 65.0, 63.0, 54.0, 49.0, 61.0, 64.0, 45.0, 60.0, 33.0, 39.0, 25.0, 21.0, 28.0, 15.0, 14.0, 14.0, 16.0, 11.0, 4.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.75, -3.657470703125, -3.56494140625, -3.472412109375, -3.3798828125, -3.287353515625, -3.19482421875, -3.102294921875, -3.009765625, -2.917236328125, -2.82470703125, -2.732177734375, -2.6396484375, -2.547119140625, -2.45458984375, -2.362060546875, -2.26953125, -2.177001953125, -2.08447265625, -1.991943359375, -1.8994140625, -1.806884765625, -1.71435546875, -1.621826171875, -1.529296875, -1.436767578125, -1.34423828125, -1.251708984375, -1.1591796875, -1.066650390625, -0.97412109375, -0.881591796875, -0.7890625, -0.696533203125, -0.60400390625, -0.511474609375, -0.4189453125, -0.326416015625, -0.23388671875, -0.141357421875, -0.048828125, 0.043701171875, 0.13623046875, 0.228759765625, 0.3212890625, 0.413818359375, 0.50634765625, 0.598876953125, 0.69140625, 0.783935546875, 0.87646484375, 0.968994140625, 1.0615234375, 1.154052734375, 1.24658203125, 1.339111328125, 1.431640625, 1.524169921875, 1.61669921875, 1.709228515625, 1.8017578125, 1.894287109375, 1.98681640625, 2.079345703125, 2.171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 15.0, 18.0, 40.0, 90.0, 171.0, 554.0, 2993.0, 157988.0, 878257.0, 7110.0, 839.0, 241.0, 109.0, 55.0, 25.0, 17.0, 15.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.326171875, -3.249114990234375, -3.17205810546875, -3.095001220703125, -3.0179443359375, -2.940887451171875, -2.86383056640625, -2.786773681640625, -2.709716796875, -2.632659912109375, -2.55560302734375, -2.478546142578125, -2.4014892578125, -2.324432373046875, -2.24737548828125, -2.170318603515625, -2.09326171875, -2.016204833984375, -1.93914794921875, -1.862091064453125, -1.7850341796875, -1.707977294921875, -1.63092041015625, -1.553863525390625, -1.476806640625, -1.399749755859375, -1.32269287109375, -1.245635986328125, -1.1685791015625, -1.091522216796875, -1.01446533203125, -0.937408447265625, -0.8603515625, -0.783294677734375, -0.70623779296875, -0.629180908203125, -0.5521240234375, -0.475067138671875, -0.39801025390625, -0.320953369140625, -0.243896484375, -0.166839599609375, -0.08978271484375, -0.012725830078125, 0.0643310546875, 0.141387939453125, 0.21844482421875, 0.295501708984375, 0.37255859375, 0.449615478515625, 0.52667236328125, 0.603729248046875, 0.6807861328125, 0.757843017578125, 0.83489990234375, 0.911956787109375, 0.989013671875, 1.066070556640625, 1.14312744140625, 1.220184326171875, 1.2972412109375, 1.374298095703125, 1.45135498046875, 1.528411865234375, 1.60546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 13.0, 25.0, 39.0, 81.0, 98.0, 153.0, 173.0, 137.0, 110.0, 64.0, 48.0, 19.0, 13.0, 9.0, 11.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00029277801513671875, -0.00028478726744651794, -0.00027679651975631714, -0.00026880577206611633, -0.00026081502437591553, -0.0002528242766857147, -0.0002448335289955139, -0.0002368427813053131, -0.0002288520336151123, -0.0002208612859249115, -0.0002128705382347107, -0.0002048797905445099, -0.00019688904285430908, -0.00018889829516410828, -0.00018090754747390747, -0.00017291679978370667, -0.00016492605209350586, -0.00015693530440330505, -0.00014894455671310425, -0.00014095380902290344, -0.00013296306133270264, -0.00012497231364250183, -0.00011698156595230103, -0.00010899081826210022, -0.00010100007057189941, -9.300932288169861e-05, -8.50185751914978e-05, -7.7027827501297e-05, -6.903707981109619e-05, -6.104633212089539e-05, -5.305558443069458e-05, -4.5064836740493774e-05, -3.707408905029297e-05, -2.9083341360092163e-05, -2.1092593669891357e-05, -1.3101845979690552e-05, -5.111098289489746e-06, 2.8796494007110596e-06, 1.0870397090911865e-05, 1.886114478111267e-05, 2.6851892471313477e-05, 3.484264016151428e-05, 4.283338785171509e-05, 5.0824135541915894e-05, 5.88148832321167e-05, 6.68056309223175e-05, 7.479637861251831e-05, 8.278712630271912e-05, 9.077787399291992e-05, 9.876862168312073e-05, 0.00010675936937332153, 0.00011475011706352234, 0.00012274086475372314, 0.00013073161244392395, 0.00013872236013412476, 0.00014671310782432556, 0.00015470385551452637, 0.00016269460320472717, 0.00017068535089492798, 0.00017867609858512878, 0.0001866668462753296, 0.0001946575939655304, 0.0002026483416557312, 0.000210639089345932, 0.0002186298370361328]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 10.0, 11.0, 8.0, 18.0, 7.0, 24.0, 35.0, 78.0, 109.0, 153.0, 240.0, 471.0, 919.0, 2039.0, 6416.0, 35860.0, 379045.0, 556628.0, 53176.0, 8507.0, 2538.0, 1042.0, 491.0, 266.0, 149.0, 111.0, 68.0, 47.0, 26.0, 11.0, 13.0, 14.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6513671875, -0.6281814575195312, -0.6049957275390625, -0.5818099975585938, -0.558624267578125, -0.5354385375976562, -0.5122528076171875, -0.48906707763671875, -0.46588134765625, -0.44269561767578125, -0.4195098876953125, -0.39632415771484375, -0.373138427734375, -0.34995269775390625, -0.3267669677734375, -0.30358123779296875, -0.2803955078125, -0.25720977783203125, -0.2340240478515625, -0.21083831787109375, -0.187652587890625, -0.16446685791015625, -0.1412811279296875, -0.11809539794921875, -0.09490966796875, -0.07172393798828125, -0.0485382080078125, -0.02535247802734375, -0.002166748046875, 0.02101898193359375, 0.0442047119140625, 0.06739044189453125, 0.090576171875, 0.11376190185546875, 0.1369476318359375, 0.16013336181640625, 0.183319091796875, 0.20650482177734375, 0.2296905517578125, 0.25287628173828125, 0.27606201171875, 0.29924774169921875, 0.3224334716796875, 0.34561920166015625, 0.368804931640625, 0.39199066162109375, 0.4151763916015625, 0.43836212158203125, 0.4615478515625, 0.48473358154296875, 0.5079193115234375, 0.5311050415039062, 0.554290771484375, 0.5774765014648438, 0.6006622314453125, 0.6238479614257812, 0.64703369140625, 0.6702194213867188, 0.6934051513671875, 0.7165908813476562, 0.739776611328125, 0.7629623413085938, 0.7861480712890625, 0.8093338012695312, 0.83251953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 2.0, 9.0, 11.0, 13.0, 16.0, 29.0, 23.0, 47.0, 61.0, 87.0, 101.0, 117.0, 110.0, 91.0, 77.0, 40.0, 38.0, 29.0, 27.0, 21.0, 6.0, 9.0, 9.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1767578125, -1.1457138061523438, -1.1146697998046875, -1.0836257934570312, -1.052581787109375, -1.0215377807617188, -0.9904937744140625, -0.9594497680664062, -0.92840576171875, -0.8973617553710938, -0.8663177490234375, -0.8352737426757812, -0.804229736328125, -0.7731857299804688, -0.7421417236328125, -0.7110977172851562, -0.6800537109375, -0.6490097045898438, -0.6179656982421875, -0.5869216918945312, -0.555877685546875, -0.5248336791992188, -0.4937896728515625, -0.46274566650390625, -0.43170166015625, -0.40065765380859375, -0.3696136474609375, -0.33856964111328125, -0.307525634765625, -0.27648162841796875, -0.2454376220703125, -0.21439361572265625, -0.183349609375, -0.15230560302734375, -0.1212615966796875, -0.09021759033203125, -0.059173583984375, -0.02812957763671875, 0.0029144287109375, 0.03395843505859375, 0.06500244140625, 0.09604644775390625, 0.1270904541015625, 0.15813446044921875, 0.189178466796875, 0.22022247314453125, 0.2512664794921875, 0.28231048583984375, 0.3133544921875, 0.34439849853515625, 0.3754425048828125, 0.40648651123046875, 0.437530517578125, 0.46857452392578125, 0.4996185302734375, 0.5306625366210938, 0.56170654296875, 0.5927505493164062, 0.6237945556640625, 0.6548385620117188, 0.685882568359375, 0.7169265747070312, 0.7479705810546875, 0.7790145874023438, 0.81005859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 17.0, 42.0, 89.0, 157.0, 206.0, 184.0, 116.0, 86.0, 46.0, 26.0, 11.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.760398864746094, -11.22939682006836, -10.698393821716309, -10.167391777038574, -9.636388778686523, -9.105386734008789, -8.574384689331055, -8.04338264465332, -7.5123796463012695, -6.981377124786377, -6.450374603271484, -5.91937255859375, -5.388370037078857, -4.857367515563965, -4.3263654708862305, -3.795362949371338, -3.2643604278564453, -2.7333579063415527, -2.2023556232452393, -1.6713532209396362, -1.1403508186340332, -0.6093482971191406, -0.07834601402282715, 0.45265626907348633, 0.9836587905883789, 1.514661192893982, 2.045663595199585, 2.5766658782958984, 3.107668399810791, 3.6386709213256836, 4.169672966003418, 4.7006754875183105, 5.231678009033203, 5.762680530548096, 6.293683052062988, 6.824685096740723, 7.355687618255615, 7.886690139770508, 8.417692184448242, 8.948694229125977, 9.479697227478027, 10.010699272155762, 10.541702270507812, 11.072704315185547, 11.603706359863281, 12.134709358215332, 12.665711402893066, 13.196714401245117, 13.727716445922852, 14.258718490600586, 14.789721488952637, 15.320723533630371, 15.851726531982422, 16.382728576660156, 16.91373062133789, 17.444732666015625, 17.97573471069336, 18.506736755371094, 19.037738800048828, 19.568742752075195, 20.09974479675293, 20.630746841430664, 21.1617488861084, 21.692750930786133, 22.2237548828125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 4.0, 18.0, 15.0, 19.0, 33.0, 47.0, 46.0, 70.0, 73.0, 107.0, 104.0, 92.0, 94.0, 62.0, 46.0, 53.0, 29.0, 29.0, 14.0, 13.0, 14.0, 9.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.26752471923828, -19.532329559326172, -18.79713249206543, -18.06193733215332, -17.326740264892578, -16.59154510498047, -15.85634994506836, -15.121153831481934, -14.385957717895508, -13.650761604309082, -12.915565490722656, -12.180370330810547, -11.445174217224121, -10.709978103637695, -9.974782943725586, -9.23958683013916, -8.504390716552734, -7.769194602966309, -7.033998966217041, -6.298803329467773, -5.563607215881348, -4.828411102294922, -4.093215465545654, -3.3580198287963867, -2.622823715209961, -1.8876278400421143, -1.1524319648742676, -0.4172360897064209, 0.3179597854614258, 1.0531556606292725, 1.7883515357971191, 2.5235471725463867, 3.2587413787841797, 3.9939372539520264, 4.729133129119873, 5.464328765869141, 6.199524879455566, 6.934720993041992, 7.66991662979126, 8.405112266540527, 9.140308380126953, 9.875504493713379, 10.610700607299805, 11.345895767211914, 12.08109188079834, 12.816287994384766, 13.551483154296875, 14.2866792678833, 15.021875381469727, 15.757071495056152, 16.492267608642578, 17.227462768554688, 17.962657928466797, 18.69785499572754, 19.43305015563965, 20.16824722290039, 20.9034423828125, 21.63863754272461, 22.37383460998535, 23.10902976989746, 23.844226837158203, 24.579421997070312, 25.314617156982422, 26.04981231689453, 26.785009384155273]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 10.0, 20.0, 39.0, 49.0, 104.0, 152.0, 253.0, 508.0, 1074.0, 2500.0, 6548.0, 22480.0, 147798.0, 3891454.0, 94419.0, 17106.0, 5328.0, 2131.0, 1001.0, 488.0, 294.0, 169.0, 107.0, 60.0, 60.0, 24.0, 19.0, 19.0, 12.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0105743408203125, -0.965484619140625, -0.9203948974609375, -0.87530517578125, -0.8302154541015625, -0.785125732421875, -0.7400360107421875, -0.6949462890625, -0.6498565673828125, -0.604766845703125, -0.5596771240234375, -0.51458740234375, -0.4694976806640625, -0.424407958984375, -0.3793182373046875, -0.334228515625, -0.2891387939453125, -0.244049072265625, -0.1989593505859375, -0.15386962890625, -0.1087799072265625, -0.063690185546875, -0.0186004638671875, 0.0264892578125, 0.0715789794921875, 0.116668701171875, 0.1617584228515625, 0.20684814453125, 0.2519378662109375, 0.297027587890625, 0.3421173095703125, 0.38720703125, 0.4322967529296875, 0.477386474609375, 0.5224761962890625, 0.56756591796875, 0.6126556396484375, 0.657745361328125, 0.7028350830078125, 0.7479248046875, 0.7930145263671875, 0.838104248046875, 0.8831939697265625, 0.92828369140625, 0.9733734130859375, 1.018463134765625, 1.0635528564453125, 1.108642578125, 1.1537322998046875, 1.198822021484375, 1.2439117431640625, 1.28900146484375, 1.3340911865234375, 1.379180908203125, 1.4242706298828125, 1.4693603515625, 1.5144500732421875, 1.559539794921875, 1.6046295166015625, 1.64971923828125, 1.6948089599609375, 1.739898681640625, 1.7849884033203125, 1.830078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 8.0, 8.0, 12.0, 15.0, 22.0, 40.0, 49.0, 68.0, 68.0, 90.0, 118.0, 101.0, 89.0, 86.0, 64.0, 58.0, 41.0, 17.0, 15.0, 18.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.646392822265625, -0.61700439453125, -0.587615966796875, -0.5582275390625, -0.528839111328125, -0.49945068359375, -0.470062255859375, -0.440673828125, -0.411285400390625, -0.38189697265625, -0.352508544921875, -0.3231201171875, -0.293731689453125, -0.26434326171875, -0.234954833984375, -0.20556640625, -0.176177978515625, -0.14678955078125, -0.117401123046875, -0.0880126953125, -0.058624267578125, -0.02923583984375, 0.000152587890625, 0.029541015625, 0.058929443359375, 0.08831787109375, 0.117706298828125, 0.1470947265625, 0.176483154296875, 0.20587158203125, 0.235260009765625, 0.2646484375, 0.294036865234375, 0.32342529296875, 0.352813720703125, 0.3822021484375, 0.411590576171875, 0.44097900390625, 0.470367431640625, 0.499755859375, 0.529144287109375, 0.55853271484375, 0.587921142578125, 0.6173095703125, 0.646697998046875, 0.67608642578125, 0.705474853515625, 0.73486328125, 0.764251708984375, 0.79364013671875, 0.823028564453125, 0.8524169921875, 0.881805419921875, 0.91119384765625, 0.940582275390625, 0.969970703125, 0.999359130859375, 1.02874755859375, 1.058135986328125, 1.0875244140625, 1.116912841796875, 1.14630126953125, 1.175689697265625, 1.205078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 10.0, 22.0, 18.0, 31.0, 45.0, 76.0, 83.0, 133.0, 220.0, 311.0, 468.0, 753.0, 1238.0, 2431.0, 4614.0, 10430.0, 26023.0, 86785.0, 579819.0, 3272486.0, 143464.0, 37800.0, 13896.0, 5934.0, 2979.0, 1564.0, 978.0, 561.0, 374.0, 240.0, 161.0, 99.0, 70.0, 42.0, 38.0, 29.0, 14.0, 13.0, 7.0, 7.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8134765625, -0.7865142822265625, -0.759552001953125, -0.7325897216796875, -0.70562744140625, -0.6786651611328125, -0.651702880859375, -0.6247406005859375, -0.5977783203125, -0.5708160400390625, -0.543853759765625, -0.5168914794921875, -0.48992919921875, -0.4629669189453125, -0.436004638671875, -0.4090423583984375, -0.382080078125, -0.3551177978515625, -0.328155517578125, -0.3011932373046875, -0.27423095703125, -0.2472686767578125, -0.220306396484375, -0.1933441162109375, -0.1663818359375, -0.1394195556640625, -0.112457275390625, -0.0854949951171875, -0.05853271484375, -0.0315704345703125, -0.004608154296875, 0.0223541259765625, 0.04931640625, 0.0762786865234375, 0.103240966796875, 0.1302032470703125, 0.15716552734375, 0.1841278076171875, 0.211090087890625, 0.2380523681640625, 0.2650146484375, 0.2919769287109375, 0.318939208984375, 0.3459014892578125, 0.37286376953125, 0.3998260498046875, 0.426788330078125, 0.4537506103515625, 0.480712890625, 0.5076751708984375, 0.534637451171875, 0.5615997314453125, 0.58856201171875, 0.6155242919921875, 0.642486572265625, 0.6694488525390625, 0.6964111328125, 0.7233734130859375, 0.750335693359375, 0.7772979736328125, 0.80426025390625, 0.8312225341796875, 0.858184814453125, 0.8851470947265625, 0.912109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 12.0, 8.0, 20.0, 23.0, 37.0, 78.0, 166.0, 361.0, 2637.0, 407.0, 142.0, 62.0, 45.0, 27.0, 13.0, 6.0, 12.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4033203125, -0.39013671875, -0.376953125, -0.36376953125, -0.3505859375, -0.33740234375, -0.32421875, -0.31103515625, -0.2978515625, -0.28466796875, -0.271484375, -0.25830078125, -0.2451171875, -0.23193359375, -0.21875, -0.20556640625, -0.1923828125, -0.17919921875, -0.166015625, -0.15283203125, -0.1396484375, -0.12646484375, -0.11328125, -0.10009765625, -0.0869140625, -0.07373046875, -0.060546875, -0.04736328125, -0.0341796875, -0.02099609375, -0.0078125, 0.00537109375, 0.0185546875, 0.03173828125, 0.044921875, 0.05810546875, 0.0712890625, 0.08447265625, 0.09765625, 0.11083984375, 0.1240234375, 0.13720703125, 0.150390625, 0.16357421875, 0.1767578125, 0.18994140625, 0.203125, 0.21630859375, 0.2294921875, 0.24267578125, 0.255859375, 0.26904296875, 0.2822265625, 0.29541015625, 0.30859375, 0.32177734375, 0.3349609375, 0.34814453125, 0.361328125, 0.37451171875, 0.3876953125, 0.40087890625, 0.4140625, 0.42724609375, 0.4404296875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 16.0, 101.0, 266.0, 360.0, 208.0, 44.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.686465859413147, -1.5433162450790405, -1.400166630744934, -1.2570171356201172, -1.1138675212860107, -0.9707178473472595, -0.8275682926177979, -0.6844186782836914, -0.541269063949585, -0.3981194496154785, -0.25496986508369446, -0.1118202805519104, 0.031329333782196045, 0.1744789481163025, 0.31762850284576416, 0.4607781171798706, 0.603927731513977, 0.7470773458480835, 0.8902269601821899, 1.0333764553070068, 1.1765260696411133, 1.3196756839752197, 1.4628252983093262, 1.6059749126434326, 1.749124526977539, 1.8922741413116455, 2.035423755645752, 2.1785733699798584, 2.321722984313965, 2.4648725986480713, 2.6080222129821777, 2.751171588897705, 2.8943214416503906, 3.037471055984497, 3.1806206703186035, 3.32377028465271, 3.4669198989868164, 3.610069513320923, 3.7532191276550293, 3.8963685035705566, 4.039518356323242, 4.1826677322387695, 4.325817584991455, 4.468966960906982, 4.612116813659668, 4.755266189575195, 4.898416042327881, 5.041565418243408, 5.184715270996094, 5.327864646911621, 5.471014499664307, 5.614163875579834, 5.7573137283325195, 5.900463104248047, 6.043612957000732, 6.18676233291626, 6.329911708831787, 6.4730610847473145, 6.6162109375, 6.759360313415527, 6.902510166168213, 7.04565954208374, 7.188809394836426, 7.331958770751953, 7.475108623504639]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 5.0, 10.0, 16.0, 12.0, 11.0, 20.0, 21.0, 24.0, 25.0, 25.0, 30.0, 30.0, 30.0, 32.0, 38.0, 46.0, 38.0, 51.0, 34.0, 36.0, 35.0, 33.0, 34.0, 38.0, 32.0, 28.0, 21.0, 31.0, 25.0, 19.0, 15.0, 17.0, 26.0, 11.0, 9.0, 14.0, 13.0, 10.0, 12.0, 10.0, 4.0, 6.0, 5.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.954521894454956, -0.9246616959571838, -0.8948014974594116, -0.8649412393569946, -0.8350810408592224, -0.8052208423614502, -0.7753605842590332, -0.745500385761261, -0.7156401872634888, -0.6857799887657166, -0.6559197902679443, -0.6260595321655273, -0.5961993336677551, -0.5663391351699829, -0.5364788770675659, -0.5066186785697937, -0.4767584800720215, -0.44689828157424927, -0.41703805327415466, -0.38717782497406006, -0.35731762647628784, -0.3274574279785156, -0.297597199678421, -0.2677369713783264, -0.2378767728805542, -0.2080165594816208, -0.17815634608268738, -0.14829613268375397, -0.11843591928482056, -0.08857570588588715, -0.058715492486953735, -0.028855279088020325, 0.001004934310913086, 0.030865147709846497, 0.06072536110877991, 0.09058557450771332, 0.12044578790664673, 0.15030600130558014, 0.18016621470451355, 0.21002642810344696, 0.23988664150238037, 0.2697468400001526, 0.2996070683002472, 0.3294672966003418, 0.359327495098114, 0.38918769359588623, 0.41904792189598083, 0.44890815019607544, 0.47876834869384766, 0.5086285471916199, 0.5384887456893921, 0.5683490037918091, 0.5982092022895813, 0.6280694007873535, 0.6579296588897705, 0.6877898573875427, 0.7176500558853149, 0.7475102543830872, 0.7773704528808594, 0.8072307109832764, 0.8370909094810486, 0.8669511079788208, 0.8968113660812378, 0.92667156457901, 0.9565317630767822]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 8.0, 18.0, 26.0, 48.0, 91.0, 204.0, 473.0, 1374.0, 5889.0, 38018.0, 376057.0, 548598.0, 65973.0, 8730.0, 1887.0, 631.0, 236.0, 117.0, 69.0, 41.0, 22.0, 10.0, 7.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.416015625, -2.3586578369140625, -2.301300048828125, -2.2439422607421875, -2.18658447265625, -2.1292266845703125, -2.071868896484375, -2.0145111083984375, -1.9571533203125, -1.8997955322265625, -1.842437744140625, -1.7850799560546875, -1.72772216796875, -1.6703643798828125, -1.613006591796875, -1.5556488037109375, -1.498291015625, -1.4409332275390625, -1.383575439453125, -1.3262176513671875, -1.26885986328125, -1.2115020751953125, -1.154144287109375, -1.0967864990234375, -1.0394287109375, -0.9820709228515625, -0.924713134765625, -0.8673553466796875, -0.80999755859375, -0.7526397705078125, -0.695281982421875, -0.6379241943359375, -0.58056640625, -0.5232086181640625, -0.465850830078125, -0.4084930419921875, -0.35113525390625, -0.2937774658203125, -0.236419677734375, -0.1790618896484375, -0.1217041015625, -0.0643463134765625, -0.006988525390625, 0.0503692626953125, 0.10772705078125, 0.1650848388671875, 0.222442626953125, 0.2798004150390625, 0.337158203125, 0.3945159912109375, 0.451873779296875, 0.5092315673828125, 0.56658935546875, 0.6239471435546875, 0.681304931640625, 0.7386627197265625, 0.7960205078125, 0.8533782958984375, 0.910736083984375, 0.9680938720703125, 1.02545166015625, 1.0828094482421875, 1.140167236328125, 1.1975250244140625, 1.2548828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 10.0, 12.0, 21.0, 21.0, 38.0, 57.0, 58.0, 71.0, 96.0, 113.0, 90.0, 86.0, 67.0, 66.0, 56.0, 40.0, 34.0, 20.0, 15.0, 9.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6236343383789062, -0.5954132080078125, -0.5671920776367188, -0.538970947265625, -0.5107498168945312, -0.4825286865234375, -0.45430755615234375, -0.42608642578125, -0.39786529541015625, -0.3696441650390625, -0.34142303466796875, -0.313201904296875, -0.28498077392578125, -0.2567596435546875, -0.22853851318359375, -0.2003173828125, -0.17209625244140625, -0.1438751220703125, -0.11565399169921875, -0.087432861328125, -0.05921173095703125, -0.0309906005859375, -0.00276947021484375, 0.02545166015625, 0.05367279052734375, 0.0818939208984375, 0.11011505126953125, 0.138336181640625, 0.16655731201171875, 0.1947784423828125, 0.22299957275390625, 0.251220703125, 0.27944183349609375, 0.3076629638671875, 0.33588409423828125, 0.364105224609375, 0.39232635498046875, 0.4205474853515625, 0.44876861572265625, 0.47698974609375, 0.5052108764648438, 0.5334320068359375, 0.5616531372070312, 0.589874267578125, 0.6180953979492188, 0.6463165283203125, 0.6745376586914062, 0.7027587890625, 0.7309799194335938, 0.7592010498046875, 0.7874221801757812, 0.815643310546875, 0.8438644409179688, 0.8720855712890625, 0.9003067016601562, 0.92852783203125, 0.9567489624023438, 0.9849700927734375, 1.0131912231445312, 1.041412353515625, 1.0696334838867188, 1.0978546142578125, 1.1260757446289062, 1.154296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 9.0, 8.0, 15.0, 22.0, 27.0, 33.0, 58.0, 116.0, 251.0, 646.0, 2517.0, 23290.0, 783825.0, 226879.0, 8581.0, 1426.0, 420.0, 177.0, 90.0, 54.0, 34.0, 17.0, 15.0, 16.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.5079345703125, -2.402587890625, -2.2972412109375, -2.19189453125, -2.0865478515625, -1.981201171875, -1.8758544921875, -1.7705078125, -1.6651611328125, -1.559814453125, -1.4544677734375, -1.34912109375, -1.2437744140625, -1.138427734375, -1.0330810546875, -0.927734375, -0.8223876953125, -0.717041015625, -0.6116943359375, -0.50634765625, -0.4010009765625, -0.295654296875, -0.1903076171875, -0.0849609375, 0.0203857421875, 0.125732421875, 0.2310791015625, 0.33642578125, 0.4417724609375, 0.547119140625, 0.6524658203125, 0.7578125, 0.8631591796875, 0.968505859375, 1.0738525390625, 1.17919921875, 1.2845458984375, 1.389892578125, 1.4952392578125, 1.6005859375, 1.7059326171875, 1.811279296875, 1.9166259765625, 2.02197265625, 2.1273193359375, 2.232666015625, 2.3380126953125, 2.443359375, 2.5487060546875, 2.654052734375, 2.7593994140625, 2.86474609375, 2.9700927734375, 3.075439453125, 3.1807861328125, 3.2861328125, 3.3914794921875, 3.496826171875, 3.6021728515625, 3.70751953125, 3.8128662109375, 3.918212890625, 4.0235595703125, 4.12890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 6.0, 5.0, 13.0, 20.0, 7.0, 18.0, 27.0, 23.0, 37.0, 44.0, 44.0, 56.0, 57.0, 46.0, 57.0, 77.0, 61.0, 60.0, 50.0, 36.0, 36.0, 30.0, 29.0, 19.0, 22.0, 11.0, 18.0, 14.0, 11.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.83038330078125, -2.7349853515625, -2.63958740234375, -2.544189453125, -2.44879150390625, -2.3533935546875, -2.25799560546875, -2.16259765625, -2.06719970703125, -1.9718017578125, -1.87640380859375, -1.781005859375, -1.68560791015625, -1.5902099609375, -1.49481201171875, -1.3994140625, -1.30401611328125, -1.2086181640625, -1.11322021484375, -1.017822265625, -0.92242431640625, -0.8270263671875, -0.73162841796875, -0.63623046875, -0.54083251953125, -0.4454345703125, -0.35003662109375, -0.254638671875, -0.15924072265625, -0.0638427734375, 0.03155517578125, 0.126953125, 0.22235107421875, 0.3177490234375, 0.41314697265625, 0.508544921875, 0.60394287109375, 0.6993408203125, 0.79473876953125, 0.89013671875, 0.98553466796875, 1.0809326171875, 1.17633056640625, 1.271728515625, 1.36712646484375, 1.4625244140625, 1.55792236328125, 1.6533203125, 1.74871826171875, 1.8441162109375, 1.93951416015625, 2.034912109375, 2.13031005859375, 2.2257080078125, 2.32110595703125, 2.41650390625, 2.51190185546875, 2.6072998046875, 2.70269775390625, 2.798095703125, 2.89349365234375, 2.9888916015625, 3.08428955078125, 3.1796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 8.0, 14.0, 23.0, 33.0, 35.0, 73.0, 120.0, 197.0, 399.0, 1095.0, 4877.0, 167119.0, 858614.0, 12911.0, 1796.0, 603.0, 282.0, 116.0, 76.0, 58.0, 24.0, 17.0, 14.0, 8.0, 5.0, 10.0, 4.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.267608642578125, -2.20318603515625, -2.138763427734375, -2.0743408203125, -2.009918212890625, -1.94549560546875, -1.881072998046875, -1.816650390625, -1.752227783203125, -1.68780517578125, -1.623382568359375, -1.5589599609375, -1.494537353515625, -1.43011474609375, -1.365692138671875, -1.30126953125, -1.236846923828125, -1.17242431640625, -1.108001708984375, -1.0435791015625, -0.979156494140625, -0.91473388671875, -0.850311279296875, -0.785888671875, -0.721466064453125, -0.65704345703125, -0.592620849609375, -0.5281982421875, -0.463775634765625, -0.39935302734375, -0.334930419921875, -0.2705078125, -0.206085205078125, -0.14166259765625, -0.077239990234375, -0.0128173828125, 0.051605224609375, 0.11602783203125, 0.180450439453125, 0.244873046875, 0.309295654296875, 0.37371826171875, 0.438140869140625, 0.5025634765625, 0.566986083984375, 0.63140869140625, 0.695831298828125, 0.76025390625, 0.824676513671875, 0.88909912109375, 0.953521728515625, 1.0179443359375, 1.082366943359375, 1.14678955078125, 1.211212158203125, 1.275634765625, 1.340057373046875, 1.40447998046875, 1.468902587890625, 1.5333251953125, 1.597747802734375, 1.66217041015625, 1.726593017578125, 1.791015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 23.0, 34.0, 42.0, 73.0, 111.0, 150.0, 173.0, 120.0, 106.0, 59.0, 40.0, 27.0, 10.0, 9.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002970695495605469, -0.00029018335044384, -0.0002832971513271332, -0.00027641095221042633, -0.0002695247530937195, -0.00026263855397701263, -0.0002557523548603058, -0.00024886615574359894, -0.0002419799566268921, -0.00023509375751018524, -0.0002282075583934784, -0.00022132135927677155, -0.0002144351601600647, -0.00020754896104335785, -0.000200662761926651, -0.00019377656280994415, -0.0001868903636932373, -0.00018000416457653046, -0.0001731179654598236, -0.00016623176634311676, -0.0001593455672264099, -0.00015245936810970306, -0.00014557316899299622, -0.00013868696987628937, -0.00013180077075958252, -0.00012491457164287567, -0.00011802837252616882, -0.00011114217340946198, -0.00010425597429275513, -9.736977517604828e-05, -9.048357605934143e-05, -8.359737694263458e-05, -7.671117782592773e-05, -6.982497870922089e-05, -6.293877959251404e-05, -5.605258047580719e-05, -4.916638135910034e-05, -4.2280182242393494e-05, -3.5393983125686646e-05, -2.8507784008979797e-05, -2.162158489227295e-05, -1.4735385775566101e-05, -7.849186658859253e-06, -9.629875421524048e-07, 5.923211574554443e-06, 1.2809410691261292e-05, 1.969560980796814e-05, 2.6581808924674988e-05, 3.3468008041381836e-05, 4.0354207158088684e-05, 4.724040627479553e-05, 5.412660539150238e-05, 6.101280450820923e-05, 6.789900362491608e-05, 7.478520274162292e-05, 8.167140185832977e-05, 8.855760097503662e-05, 9.544380009174347e-05, 0.00010232999920845032, 0.00010921619832515717, 0.00011610239744186401, 0.00012298859655857086, 0.0001298747956752777, 0.00013676099479198456, 0.0001436471939086914]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 5.0, 8.0, 13.0, 29.0, 61.0, 113.0, 285.0, 660.0, 2487.0, 22021.0, 884858.0, 130685.0, 5429.0, 1191.0, 391.0, 156.0, 76.0, 31.0, 13.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2431640625, -1.1907501220703125, -1.138336181640625, -1.0859222412109375, -1.03350830078125, -0.9810943603515625, -0.928680419921875, -0.8762664794921875, -0.8238525390625, -0.7714385986328125, -0.719024658203125, -0.6666107177734375, -0.61419677734375, -0.5617828369140625, -0.509368896484375, -0.4569549560546875, -0.404541015625, -0.3521270751953125, -0.299713134765625, -0.2472991943359375, -0.19488525390625, -0.1424713134765625, -0.090057373046875, -0.0376434326171875, 0.0147705078125, 0.0671844482421875, 0.119598388671875, 0.1720123291015625, 0.22442626953125, 0.2768402099609375, 0.329254150390625, 0.3816680908203125, 0.43408203125, 0.4864959716796875, 0.538909912109375, 0.5913238525390625, 0.64373779296875, 0.6961517333984375, 0.748565673828125, 0.8009796142578125, 0.8533935546875, 0.9058074951171875, 0.958221435546875, 1.0106353759765625, 1.06304931640625, 1.1154632568359375, 1.167877197265625, 1.2202911376953125, 1.272705078125, 1.3251190185546875, 1.377532958984375, 1.4299468994140625, 1.48236083984375, 1.5347747802734375, 1.587188720703125, 1.6396026611328125, 1.6920166015625, 1.7444305419921875, 1.796844482421875, 1.8492584228515625, 1.90167236328125, 1.9540863037109375, 2.006500244140625, 2.0589141845703125, 2.111328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 14.0, 18.0, 24.0, 63.0, 133.0, 174.0, 181.0, 167.0, 83.0, 68.0, 23.0, 17.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.7866363525390625, -1.729522705078125, -1.6724090576171875, -1.61529541015625, -1.5581817626953125, -1.501068115234375, -1.4439544677734375, -1.3868408203125, -1.3297271728515625, -1.272613525390625, -1.2154998779296875, -1.15838623046875, -1.1012725830078125, -1.044158935546875, -0.9870452880859375, -0.929931640625, -0.8728179931640625, -0.815704345703125, -0.7585906982421875, -0.70147705078125, -0.6443634033203125, -0.587249755859375, -0.5301361083984375, -0.4730224609375, -0.4159088134765625, -0.358795166015625, -0.3016815185546875, -0.24456787109375, -0.1874542236328125, -0.130340576171875, -0.0732269287109375, -0.01611328125, 0.0410003662109375, 0.098114013671875, 0.1552276611328125, 0.21234130859375, 0.2694549560546875, 0.326568603515625, 0.3836822509765625, 0.4407958984375, 0.4979095458984375, 0.555023193359375, 0.6121368408203125, 0.66925048828125, 0.7263641357421875, 0.783477783203125, 0.8405914306640625, 0.897705078125, 0.9548187255859375, 1.011932373046875, 1.0690460205078125, 1.12615966796875, 1.1832733154296875, 1.240386962890625, 1.2975006103515625, 1.3546142578125, 1.4117279052734375, 1.468841552734375, 1.5259552001953125, 1.58306884765625, 1.6401824951171875, 1.697296142578125, 1.7544097900390625, 1.8115234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 18.0, 80.0, 241.0, 344.0, 206.0, 72.0, 21.0, 18.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.73120880126953, -52.72235870361328, -51.71350860595703, -50.70465850830078, -49.695804595947266, -48.686954498291016, -47.678104400634766, -46.669254302978516, -45.660404205322266, -44.651554107666016, -43.642704010009766, -42.63385009765625, -41.625, -40.61614990234375, -39.6072998046875, -38.59844970703125, -37.589599609375, -36.58074951171875, -35.5718994140625, -34.56304931640625, -33.554195404052734, -32.545345306396484, -31.536495208740234, -30.527645111083984, -29.51879119873047, -28.50994110107422, -27.501089096069336, -26.492238998413086, -25.483388900756836, -24.474536895751953, -23.465686798095703, -22.456836700439453, -21.447988510131836, -20.439138412475586, -19.430286407470703, -18.421436309814453, -17.412586212158203, -16.403736114501953, -15.39488410949707, -14.38603401184082, -13.377182960510254, -12.368331909179688, -11.359481811523438, -10.350630760192871, -9.341779708862305, -8.332929611206055, -7.324078559875488, -6.31522798538208, -5.306377410888672, -4.297526836395264, -3.2886760234832764, -2.279825210571289, -1.2709746360778809, -0.26212406158447266, 0.7467269897460938, 1.755577564239502, 2.76442813873291, 3.7732787132263184, 4.782129287719727, 5.790980339050293, 6.799830913543701, 7.808681488037109, 8.817532539367676, 9.826383590698242, 10.835233688354492]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 6.0, 9.0, 8.0, 12.0, 13.0, 13.0, 19.0, 19.0, 24.0, 22.0, 32.0, 45.0, 36.0, 52.0, 55.0, 57.0, 63.0, 56.0, 60.0, 61.0, 53.0, 51.0, 34.0, 29.0, 35.0, 28.0, 17.0, 15.0, 20.0, 12.0, 7.0, 8.0, 9.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.056785583496094, -9.654315948486328, -9.251846313476562, -8.849377632141113, -8.446907997131348, -8.044438362121582, -7.641968727111816, -7.239499568939209, -6.837030410766602, -6.434560775756836, -6.0320916175842285, -5.629621982574463, -5.2271528244018555, -4.82468318939209, -4.422213554382324, -4.019744396209717, -3.617274761199951, -3.2148053646087646, -2.812335968017578, -2.4098663330078125, -2.007397174835205, -1.6049275398254395, -1.202458143234253, -0.7999887466430664, -0.3975193500518799, 0.004950076341629028, 0.40741950273513794, 0.8098889589309692, 1.2123583555221558, 1.6148278713226318, 2.0172972679138184, 2.419766664505005, 2.8222360610961914, 3.224705457687378, 3.6271748542785645, 4.02964448928833, 4.4321136474609375, 4.834583282470703, 5.237052917480469, 5.639522075653076, 6.041991233825684, 6.444460868835449, 6.846930027008057, 7.249399662017822, 7.65186882019043, 8.054338455200195, 8.456808090209961, 8.859277725219727, 9.261747360229492, 9.664216995239258, 10.066686630249023, 10.469155311584473, 10.871624946594238, 11.274094581604004, 11.67656421661377, 12.079032897949219, 12.481502532958984, 12.88397216796875, 13.286441802978516, 13.688910484313965, 14.09138011932373, 14.493849754333496, 14.896319389343262, 15.298788070678711, 15.701257705688477]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 14.0, 9.0, 16.0, 22.0, 48.0, 81.0, 148.0, 304.0, 629.0, 1681.0, 5279.0, 28863.0, 4013945.0, 126422.0, 11617.0, 2926.0, 1087.0, 480.0, 274.0, 145.0, 93.0, 48.0, 38.0, 25.0, 20.0, 17.0, 11.0, 8.0, 1.0, 4.0, 8.0, 2.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8330078125, -1.7589874267578125, -1.684967041015625, -1.6109466552734375, -1.53692626953125, -1.4629058837890625, -1.388885498046875, -1.3148651123046875, -1.2408447265625, -1.1668243408203125, -1.092803955078125, -1.0187835693359375, -0.94476318359375, -0.8707427978515625, -0.796722412109375, -0.7227020263671875, -0.648681640625, -0.5746612548828125, -0.500640869140625, -0.4266204833984375, -0.35260009765625, -0.2785797119140625, -0.204559326171875, -0.1305389404296875, -0.0565185546875, 0.0175018310546875, 0.091522216796875, 0.1655426025390625, 0.23956298828125, 0.3135833740234375, 0.387603759765625, 0.4616241455078125, 0.53564453125, 0.6096649169921875, 0.683685302734375, 0.7577056884765625, 0.83172607421875, 0.9057464599609375, 0.979766845703125, 1.0537872314453125, 1.1278076171875, 1.2018280029296875, 1.275848388671875, 1.3498687744140625, 1.42388916015625, 1.4979095458984375, 1.571929931640625, 1.6459503173828125, 1.719970703125, 1.7939910888671875, 1.868011474609375, 1.9420318603515625, 2.01605224609375, 2.0900726318359375, 2.164093017578125, 2.2381134033203125, 2.3121337890625, 2.3861541748046875, 2.460174560546875, 2.5341949462890625, 2.60821533203125, 2.6822357177734375, 2.756256103515625, 2.8302764892578125, 2.904296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 11.0, 10.0, 26.0, 34.0, 47.0, 64.0, 102.0, 149.0, 135.0, 133.0, 90.0, 82.0, 38.0, 31.0, 14.0, 10.0, 9.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.8957061767578125, -0.853912353515625, -0.8121185302734375, -0.77032470703125, -0.7285308837890625, -0.686737060546875, -0.6449432373046875, -0.6031494140625, -0.5613555908203125, -0.519561767578125, -0.4777679443359375, -0.43597412109375, -0.3941802978515625, -0.352386474609375, -0.3105926513671875, -0.268798828125, -0.2270050048828125, -0.185211181640625, -0.1434173583984375, -0.10162353515625, -0.0598297119140625, -0.018035888671875, 0.0237579345703125, 0.0655517578125, 0.1073455810546875, 0.149139404296875, 0.1909332275390625, 0.23272705078125, 0.2745208740234375, 0.316314697265625, 0.3581085205078125, 0.39990234375, 0.4416961669921875, 0.483489990234375, 0.5252838134765625, 0.56707763671875, 0.6088714599609375, 0.650665283203125, 0.6924591064453125, 0.7342529296875, 0.7760467529296875, 0.817840576171875, 0.8596343994140625, 0.90142822265625, 0.9432220458984375, 0.985015869140625, 1.0268096923828125, 1.068603515625, 1.1103973388671875, 1.152191162109375, 1.1939849853515625, 1.23577880859375, 1.2775726318359375, 1.319366455078125, 1.3611602783203125, 1.4029541015625, 1.4447479248046875, 1.486541748046875, 1.5283355712890625, 1.57012939453125, 1.6119232177734375, 1.653717041015625, 1.6955108642578125, 1.7373046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 13.0, 14.0, 24.0, 36.0, 38.0, 81.0, 144.0, 259.0, 386.0, 709.0, 1467.0, 3138.0, 8009.0, 27086.0, 172650.0, 3840577.0, 107328.0, 20464.0, 6575.0, 2618.0, 1176.0, 602.0, 359.0, 204.0, 107.0, 54.0, 40.0, 34.0, 24.0, 15.0, 16.0, 7.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.435546875, -1.3925628662109375, -1.349578857421875, -1.3065948486328125, -1.26361083984375, -1.2206268310546875, -1.177642822265625, -1.1346588134765625, -1.0916748046875, -1.0486907958984375, -1.005706787109375, -0.9627227783203125, -0.91973876953125, -0.8767547607421875, -0.833770751953125, -0.7907867431640625, -0.747802734375, -0.7048187255859375, -0.661834716796875, -0.6188507080078125, -0.57586669921875, -0.5328826904296875, -0.489898681640625, -0.4469146728515625, -0.4039306640625, -0.3609466552734375, -0.317962646484375, -0.2749786376953125, -0.23199462890625, -0.1890106201171875, -0.146026611328125, -0.1030426025390625, -0.06005859375, -0.0170745849609375, 0.025909423828125, 0.0688934326171875, 0.11187744140625, 0.1548614501953125, 0.197845458984375, 0.2408294677734375, 0.2838134765625, 0.3267974853515625, 0.369781494140625, 0.4127655029296875, 0.45574951171875, 0.4987335205078125, 0.541717529296875, 0.5847015380859375, 0.627685546875, 0.6706695556640625, 0.713653564453125, 0.7566375732421875, 0.79962158203125, 0.8426055908203125, 0.885589599609375, 0.9285736083984375, 0.9715576171875, 1.0145416259765625, 1.057525634765625, 1.1005096435546875, 1.14349365234375, 1.1864776611328125, 1.229461669921875, 1.2724456787109375, 1.3154296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 2.0, 5.0, 8.0, 9.0, 9.0, 15.0, 27.0, 70.0, 109.0, 224.0, 3037.0, 310.0, 100.0, 61.0, 32.0, 18.0, 14.0, 5.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447265625, -0.43395233154296875, -0.4206390380859375, -0.40732574462890625, -0.394012451171875, -0.38069915771484375, -0.3673858642578125, -0.35407257080078125, -0.34075927734375, -0.32744598388671875, -0.3141326904296875, -0.30081939697265625, -0.287506103515625, -0.27419281005859375, -0.2608795166015625, -0.24756622314453125, -0.2342529296875, -0.22093963623046875, -0.2076263427734375, -0.19431304931640625, -0.180999755859375, -0.16768646240234375, -0.1543731689453125, -0.14105987548828125, -0.12774658203125, -0.11443328857421875, -0.1011199951171875, -0.08780670166015625, -0.074493408203125, -0.06118011474609375, -0.0478668212890625, -0.03455352783203125, -0.021240234375, -0.00792694091796875, 0.0053863525390625, 0.01869964599609375, 0.032012939453125, 0.04532623291015625, 0.0586395263671875, 0.07195281982421875, 0.08526611328125, 0.09857940673828125, 0.1118927001953125, 0.12520599365234375, 0.138519287109375, 0.15183258056640625, 0.1651458740234375, 0.17845916748046875, 0.1917724609375, 0.20508575439453125, 0.2183990478515625, 0.23171234130859375, 0.245025634765625, 0.25833892822265625, 0.2716522216796875, 0.28496551513671875, 0.29827880859375, 0.31159210205078125, 0.3249053955078125, 0.33821868896484375, 0.351531982421875, 0.36484527587890625, 0.3781585693359375, 0.39147186279296875, 0.40478515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 19.0, 47.0, 112.0, 201.0, 251.0, 199.0, 109.0, 35.0, 13.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123575210571289, -3.0288658142089844, -2.9341564178466797, -2.839447021484375, -2.7447378635406494, -2.6500284671783447, -2.55531907081604, -2.4606096744537354, -2.3659005165100098, -2.271191120147705, -2.1764817237854004, -2.0817723274230957, -1.9870631694793701, -1.8923537731170654, -1.7976443767547607, -1.702934980392456, -1.6082255840301514, -1.5135161876678467, -1.4188069105148315, -1.3240975141525269, -1.2293882369995117, -1.134678840637207, -1.0399694442749023, -0.9452601075172424, -0.8505507707595825, -0.7558414340019226, -0.6611320972442627, -0.566422700881958, -0.4717133641242981, -0.3770040273666382, -0.2822946310043335, -0.18758529424667358, -0.09287571907043457, 0.0018336325883865356, 0.09654298424720764, 0.19125235080718994, 0.28596168756484985, 0.38067102432250977, 0.47538042068481445, 0.5700897574424744, 0.6647990942001343, 0.7595084309577942, 0.8542177677154541, 0.9489271640777588, 1.0436365604400635, 1.1383458375930786, 1.2330552339553833, 1.3277645111083984, 1.4224739074707031, 1.5171833038330078, 1.611892580986023, 1.7066019773483276, 1.8013112545013428, 1.8960206508636475, 1.9907300472259521, 2.085439443588257, 2.1801486015319824, 2.274857997894287, 2.369567394256592, 2.4642767906188965, 2.558985948562622, 2.6536953449249268, 2.7484047412872314, 2.843114137649536, 2.937823534011841]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 0.0, 1.0, 4.0, 9.0, 12.0, 12.0, 24.0, 16.0, 14.0, 25.0, 33.0, 38.0, 45.0, 39.0, 40.0, 33.0, 41.0, 57.0, 62.0, 57.0, 58.0, 55.0, 39.0, 43.0, 37.0, 30.0, 35.0, 33.0, 22.0, 17.0, 17.0, 11.0, 13.0, 2.0, 2.0, 11.0, 5.0, 1.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.506568193435669, -1.467463493347168, -1.428358793258667, -1.3892539739608765, -1.3501492738723755, -1.3110445737838745, -1.2719398736953735, -1.2328351736068726, -1.193730354309082, -1.154625654220581, -1.11552095413208, -1.0764161348342896, -1.0373114347457886, -0.9982067346572876, -0.9591020345687866, -0.9199973344802856, -0.8808926343917847, -0.8417879343032837, -0.8026831746101379, -0.763578474521637, -0.7244737148284912, -0.6853690147399902, -0.6462643146514893, -0.6071596145629883, -0.5680548548698425, -0.5289501547813416, -0.4898453950881958, -0.4507406949996948, -0.41163596510887146, -0.3725312352180481, -0.3334265351295471, -0.29432180523872375, -0.2552170753479004, -0.21611234545707703, -0.17700763046741486, -0.13790291547775269, -0.09879818558692932, -0.05969345569610596, -0.020588740706443787, 0.018515974283218384, 0.05762070417404175, 0.09672542661428452, 0.13583014905452728, 0.17493486404418945, 0.21403959393501282, 0.2531443238258362, 0.29224902391433716, 0.3313537538051605, 0.3704584836959839, 0.40956321358680725, 0.4486679434776306, 0.4877726435661316, 0.5268774032592773, 0.5659821033477783, 0.6050868034362793, 0.6441915035247803, 0.683296263217926, 0.722400963306427, 0.7615057229995728, 0.8006104230880737, 0.8397151231765747, 0.8788198828697205, 0.9179245829582214, 0.9570293426513672, 0.9961340427398682]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 14.0, 13.0, 13.0, 21.0, 29.0, 64.0, 98.0, 195.0, 440.0, 1167.0, 3764.0, 21258.0, 269014.0, 679436.0, 62124.0, 7748.0, 1895.0, 626.0, 279.0, 146.0, 76.0, 52.0, 29.0, 14.0, 8.0, 13.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6875, -1.6231689453125, -1.558837890625, -1.4945068359375, -1.43017578125, -1.3658447265625, -1.301513671875, -1.2371826171875, -1.1728515625, -1.1085205078125, -1.044189453125, -0.9798583984375, -0.91552734375, -0.8511962890625, -0.786865234375, -0.7225341796875, -0.658203125, -0.5938720703125, -0.529541015625, -0.4652099609375, -0.40087890625, -0.3365478515625, -0.272216796875, -0.2078857421875, -0.1435546875, -0.0792236328125, -0.014892578125, 0.0494384765625, 0.11376953125, 0.1781005859375, 0.242431640625, 0.3067626953125, 0.37109375, 0.4354248046875, 0.499755859375, 0.5640869140625, 0.62841796875, 0.6927490234375, 0.757080078125, 0.8214111328125, 0.8857421875, 0.9500732421875, 1.014404296875, 1.0787353515625, 1.14306640625, 1.2073974609375, 1.271728515625, 1.3360595703125, 1.400390625, 1.4647216796875, 1.529052734375, 1.5933837890625, 1.65771484375, 1.7220458984375, 1.786376953125, 1.8507080078125, 1.9150390625, 1.9793701171875, 2.043701171875, 2.1080322265625, 2.17236328125, 2.2366943359375, 2.301025390625, 2.3653564453125, 2.4296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 8.0, 20.0, 25.0, 27.0, 53.0, 59.0, 98.0, 121.0, 125.0, 117.0, 87.0, 85.0, 58.0, 32.0, 36.0, 15.0, 13.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8154296875, -0.7779388427734375, -0.740447998046875, -0.7029571533203125, -0.66546630859375, -0.6279754638671875, -0.590484619140625, -0.5529937744140625, -0.5155029296875, -0.4780120849609375, -0.440521240234375, -0.4030303955078125, -0.36553955078125, -0.3280487060546875, -0.290557861328125, -0.2530670166015625, -0.215576171875, -0.1780853271484375, -0.140594482421875, -0.1031036376953125, -0.06561279296875, -0.0281219482421875, 0.009368896484375, 0.0468597412109375, 0.0843505859375, 0.1218414306640625, 0.159332275390625, 0.1968231201171875, 0.23431396484375, 0.2718048095703125, 0.309295654296875, 0.3467864990234375, 0.38427734375, 0.4217681884765625, 0.459259033203125, 0.4967498779296875, 0.53424072265625, 0.5717315673828125, 0.609222412109375, 0.6467132568359375, 0.6842041015625, 0.7216949462890625, 0.759185791015625, 0.7966766357421875, 0.83416748046875, 0.8716583251953125, 0.909149169921875, 0.9466400146484375, 0.984130859375, 1.0216217041015625, 1.059112548828125, 1.0966033935546875, 1.13409423828125, 1.1715850830078125, 1.209075927734375, 1.2465667724609375, 1.2840576171875, 1.3215484619140625, 1.359039306640625, 1.3965301513671875, 1.43402099609375, 1.4715118408203125, 1.509002685546875, 1.5464935302734375, 1.583984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 16.0, 12.0, 25.0, 31.0, 75.0, 98.0, 214.0, 397.0, 974.0, 3080.0, 25944.0, 790592.0, 215118.0, 8664.0, 1891.0, 710.0, 275.0, 159.0, 79.0, 63.0, 38.0, 24.0, 21.0, 8.0, 7.0, 4.0, 6.0, 3.0, 6.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.956787109375, -1.87451171875, -1.792236328125, -1.7099609375, -1.627685546875, -1.54541015625, -1.463134765625, -1.380859375, -1.298583984375, -1.21630859375, -1.134033203125, -1.0517578125, -0.969482421875, -0.88720703125, -0.804931640625, -0.72265625, -0.640380859375, -0.55810546875, -0.475830078125, -0.3935546875, -0.311279296875, -0.22900390625, -0.146728515625, -0.064453125, 0.017822265625, 0.10009765625, 0.182373046875, 0.2646484375, 0.346923828125, 0.42919921875, 0.511474609375, 0.59375, 0.676025390625, 0.75830078125, 0.840576171875, 0.9228515625, 1.005126953125, 1.08740234375, 1.169677734375, 1.251953125, 1.334228515625, 1.41650390625, 1.498779296875, 1.5810546875, 1.663330078125, 1.74560546875, 1.827880859375, 1.91015625, 1.992431640625, 2.07470703125, 2.156982421875, 2.2392578125, 2.321533203125, 2.40380859375, 2.486083984375, 2.568359375, 2.650634765625, 2.73291015625, 2.815185546875, 2.8974609375, 2.979736328125, 3.06201171875, 3.144287109375, 3.2265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 4.0, 11.0, 6.0, 13.0, 17.0, 21.0, 29.0, 42.0, 29.0, 34.0, 44.0, 50.0, 52.0, 60.0, 51.0, 47.0, 50.0, 58.0, 54.0, 47.0, 42.0, 35.0, 34.0, 34.0, 29.0, 15.0, 25.0, 10.0, 10.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.064453125, -2.969146728515625, -2.87384033203125, -2.778533935546875, -2.6832275390625, -2.587921142578125, -2.49261474609375, -2.397308349609375, -2.302001953125, -2.206695556640625, -2.11138916015625, -2.016082763671875, -1.9207763671875, -1.825469970703125, -1.73016357421875, -1.634857177734375, -1.53955078125, -1.444244384765625, -1.34893798828125, -1.253631591796875, -1.1583251953125, -1.063018798828125, -0.96771240234375, -0.872406005859375, -0.777099609375, -0.681793212890625, -0.58648681640625, -0.491180419921875, -0.3958740234375, -0.300567626953125, -0.20526123046875, -0.109954833984375, -0.0146484375, 0.080657958984375, 0.17596435546875, 0.271270751953125, 0.3665771484375, 0.461883544921875, 0.55718994140625, 0.652496337890625, 0.747802734375, 0.843109130859375, 0.93841552734375, 1.033721923828125, 1.1290283203125, 1.224334716796875, 1.31964111328125, 1.414947509765625, 1.51025390625, 1.605560302734375, 1.70086669921875, 1.796173095703125, 1.8914794921875, 1.986785888671875, 2.08209228515625, 2.177398681640625, 2.272705078125, 2.368011474609375, 2.46331787109375, 2.558624267578125, 2.6539306640625, 2.749237060546875, 2.84454345703125, 2.939849853515625, 3.03515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 3.0, 8.0, 20.0, 32.0, 58.0, 115.0, 258.0, 886.0, 5250.0, 659123.0, 377256.0, 4256.0, 799.0, 250.0, 95.0, 60.0, 32.0, 19.0, 11.0, 2.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6328125, -2.563446044921875, -2.49407958984375, -2.424713134765625, -2.3553466796875, -2.285980224609375, -2.21661376953125, -2.147247314453125, -2.077880859375, -2.008514404296875, -1.93914794921875, -1.869781494140625, -1.8004150390625, -1.731048583984375, -1.66168212890625, -1.592315673828125, -1.52294921875, -1.453582763671875, -1.38421630859375, -1.314849853515625, -1.2454833984375, -1.176116943359375, -1.10675048828125, -1.037384033203125, -0.968017578125, -0.898651123046875, -0.82928466796875, -0.759918212890625, -0.6905517578125, -0.621185302734375, -0.55181884765625, -0.482452392578125, -0.4130859375, -0.343719482421875, -0.27435302734375, -0.204986572265625, -0.1356201171875, -0.066253662109375, 0.00311279296875, 0.072479248046875, 0.141845703125, 0.211212158203125, 0.28057861328125, 0.349945068359375, 0.4193115234375, 0.488677978515625, 0.55804443359375, 0.627410888671875, 0.69677734375, 0.766143798828125, 0.83551025390625, 0.904876708984375, 0.9742431640625, 1.043609619140625, 1.11297607421875, 1.182342529296875, 1.251708984375, 1.321075439453125, 1.39044189453125, 1.459808349609375, 1.5291748046875, 1.598541259765625, 1.66790771484375, 1.737274169921875, 1.806640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 10.0, 9.0, 18.0, 23.0, 33.0, 44.0, 43.0, 81.0, 123.0, 130.0, 126.0, 110.0, 78.0, 61.0, 31.0, 28.0, 18.0, 11.0, 8.0, 8.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.72747802734375e-05, -9.24132764339447e-05, -8.75517725944519e-05, -8.26902687549591e-05, -7.782876491546631e-05, -7.296726107597351e-05, -6.810575723648071e-05, -6.324425339698792e-05, -5.838274955749512e-05, -5.352124571800232e-05, -4.865974187850952e-05, -4.3798238039016724e-05, -3.8936734199523926e-05, -3.407523036003113e-05, -2.921372652053833e-05, -2.4352222681045532e-05, -1.9490718841552734e-05, -1.4629215002059937e-05, -9.767711162567139e-06, -4.906207323074341e-06, -4.470348358154297e-08, 4.816800355911255e-06, 9.678304195404053e-06, 1.453980803489685e-05, 1.940131187438965e-05, 2.4262815713882446e-05, 2.9124319553375244e-05, 3.398582339286804e-05, 3.884732723236084e-05, 4.370883107185364e-05, 4.8570334911346436e-05, 5.3431838750839233e-05, 5.829334259033203e-05, 6.315484642982483e-05, 6.801635026931763e-05, 7.287785410881042e-05, 7.773935794830322e-05, 8.260086178779602e-05, 8.746236562728882e-05, 9.232386946678162e-05, 9.718537330627441e-05, 0.00010204687714576721, 0.00010690838098526001, 0.00011176988482475281, 0.0001166313886642456, 0.0001214928925037384, 0.0001263543963432312, 0.000131215900182724, 0.0001360774040222168, 0.0001409389078617096, 0.0001458004117012024, 0.0001506619155406952, 0.000155523419380188, 0.00016038492321968079, 0.00016524642705917358, 0.00017010793089866638, 0.00017496943473815918, 0.00017983093857765198, 0.00018469244241714478, 0.00018955394625663757, 0.00019441545009613037, 0.00019927695393562317, 0.00020413845777511597, 0.00020899996161460876, 0.00021386146545410156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 16.0, 16.0, 25.0, 54.0, 103.0, 218.0, 443.0, 1077.0, 3932.0, 33341.0, 820903.0, 176241.0, 9016.0, 1905.0, 621.0, 298.0, 152.0, 66.0, 41.0, 19.0, 19.0, 8.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46875, -1.4317855834960938, -1.3948211669921875, -1.3578567504882812, -1.320892333984375, -1.2839279174804688, -1.2469635009765625, -1.2099990844726562, -1.17303466796875, -1.1360702514648438, -1.0991058349609375, -1.0621414184570312, -1.025177001953125, -0.9882125854492188, -0.9512481689453125, -0.9142837524414062, -0.8773193359375, -0.8403549194335938, -0.8033905029296875, -0.7664260864257812, -0.729461669921875, -0.6924972534179688, -0.6555328369140625, -0.6185684204101562, -0.58160400390625, -0.5446395874023438, -0.5076751708984375, -0.47071075439453125, -0.433746337890625, -0.39678192138671875, -0.3598175048828125, -0.32285308837890625, -0.285888671875, -0.24892425537109375, -0.2119598388671875, -0.17499542236328125, -0.138031005859375, -0.10106658935546875, -0.0641021728515625, -0.02713775634765625, 0.00982666015625, 0.04679107666015625, 0.0837554931640625, 0.12071990966796875, 0.157684326171875, 0.19464874267578125, 0.2316131591796875, 0.26857757568359375, 0.3055419921875, 0.34250640869140625, 0.3794708251953125, 0.41643524169921875, 0.453399658203125, 0.49036407470703125, 0.5273284912109375, 0.5642929077148438, 0.60125732421875, 0.6382217407226562, 0.6751861572265625, 0.7121505737304688, 0.749114990234375, 0.7860794067382812, 0.8230438232421875, 0.8600082397460938, 0.89697265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 17.0, 24.0, 35.0, 51.0, 63.0, 82.0, 97.0, 112.0, 97.0, 72.0, 79.0, 52.0, 55.0, 40.0, 32.0, 19.0, 7.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.294921875, -1.2647476196289062, -1.2345733642578125, -1.2043991088867188, -1.174224853515625, -1.1440505981445312, -1.1138763427734375, -1.0837020874023438, -1.05352783203125, -1.0233535766601562, -0.9931793212890625, -0.9630050659179688, -0.932830810546875, -0.9026565551757812, -0.8724822998046875, -0.8423080444335938, -0.8121337890625, -0.7819595336914062, -0.7517852783203125, -0.7216110229492188, -0.691436767578125, -0.6612625122070312, -0.6310882568359375, -0.6009140014648438, -0.57073974609375, -0.5405654907226562, -0.5103912353515625, -0.48021697998046875, -0.450042724609375, -0.41986846923828125, -0.3896942138671875, -0.35951995849609375, -0.329345703125, -0.29917144775390625, -0.2689971923828125, -0.23882293701171875, -0.208648681640625, -0.17847442626953125, -0.1483001708984375, -0.11812591552734375, -0.08795166015625, -0.05777740478515625, -0.0276031494140625, 0.00257110595703125, 0.032745361328125, 0.06291961669921875, 0.0930938720703125, 0.12326812744140625, 0.1534423828125, 0.18361663818359375, 0.2137908935546875, 0.24396514892578125, 0.274139404296875, 0.30431365966796875, 0.3344879150390625, 0.36466217041015625, 0.39483642578125, 0.42501068115234375, 0.4551849365234375, 0.48535919189453125, 0.515533447265625, 0.5457077026367188, 0.5758819580078125, 0.6060562133789062, 0.63623046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 14.0, 34.0, 144.0, 274.0, 304.0, 177.0, 45.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.9364013671875, -37.1484489440918, -36.360496520996094, -35.57254409790039, -34.78459167480469, -33.996639251708984, -33.20868682861328, -32.42073440551758, -31.632781982421875, -30.844829559326172, -30.05687713623047, -29.268924713134766, -28.480972290039062, -27.69301986694336, -26.905067443847656, -26.117115020751953, -25.329160690307617, -24.541208267211914, -23.75325584411621, -22.965303421020508, -22.177350997924805, -21.3893985748291, -20.601444244384766, -19.813491821289062, -19.02553939819336, -18.237586975097656, -17.449634552001953, -16.66168212890625, -15.873729705810547, -15.085777282714844, -14.297823905944824, -13.509871482849121, -12.721921920776367, -11.933969497680664, -11.146017074584961, -10.358064651489258, -9.570112228393555, -8.782159805297852, -7.994206428527832, -7.206254005432129, -6.418301582336426, -5.630349159240723, -4.8423967361450195, -4.054443836212158, -3.266491413116455, -2.478538990020752, -1.6905860900878906, -0.9026336669921875, -0.11468124389648438, 0.6732712984085083, 1.461223840713501, 2.249176502227783, 3.0371289253234863, 3.8250813484191895, 4.613034248352051, 5.400986671447754, 6.188939094543457, 6.97689151763916, 7.764843940734863, 8.552797317504883, 9.340749740600586, 10.128702163696289, 10.916654586791992, 11.704607009887695, 12.492559432983398]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 12.0, 6.0, 9.0, 13.0, 21.0, 25.0, 21.0, 32.0, 30.0, 39.0, 46.0, 49.0, 44.0, 58.0, 48.0, 62.0, 35.0, 54.0, 54.0, 55.0, 44.0, 26.0, 31.0, 35.0, 24.0, 28.0, 21.0, 14.0, 6.0, 13.0, 12.0, 6.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.606850624084473, -12.248764038085938, -11.890676498413086, -11.532588958740234, -11.1745023727417, -10.816415786743164, -10.458328247070312, -10.100240707397461, -9.742154121398926, -9.38406753540039, -9.025979995727539, -8.667892456054688, -8.309805870056152, -7.951718807220459, -7.593631744384766, -7.235544681549072, -6.877457618713379, -6.5193705558776855, -6.161283493041992, -5.803196430206299, -5.4451093673706055, -5.087022304534912, -4.728935241699219, -4.370848178863525, -4.012761116027832, -3.6546740531921387, -3.2965869903564453, -2.938499927520752, -2.5804128646850586, -2.2223258018493652, -1.8642387390136719, -1.5061516761779785, -1.1480655670166016, -0.7899785041809082, -0.43189144134521484, -0.07380437850952148, 0.2842826843261719, 0.6423697471618652, 1.0004568099975586, 1.358543872833252, 1.7166309356689453, 2.0747179985046387, 2.432805061340332, 2.7908921241760254, 3.1489791870117188, 3.507066249847412, 3.8651533126831055, 4.223240375518799, 4.581327438354492, 4.9394145011901855, 5.297501564025879, 5.655588626861572, 6.013675689697266, 6.371762752532959, 6.729849815368652, 7.087936878204346, 7.446023941040039, 7.804111003875732, 8.162198066711426, 8.520284652709961, 8.878372192382812, 9.236459732055664, 9.5945463180542, 9.952632904052734, 10.310720443725586]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 8.0, 9.0, 13.0, 17.0, 26.0, 34.0, 62.0, 134.0, 272.0, 549.0, 1356.0, 4251.0, 20049.0, 270610.0, 3837247.0, 47357.0, 8056.0, 2319.0, 887.0, 439.0, 201.0, 124.0, 81.0, 43.0, 35.0, 27.0, 26.0, 11.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.2699737548828125, -1.212799072265625, -1.1556243896484375, -1.09844970703125, -1.0412750244140625, -0.984100341796875, -0.9269256591796875, -0.8697509765625, -0.8125762939453125, -0.755401611328125, -0.6982269287109375, -0.64105224609375, -0.5838775634765625, -0.526702880859375, -0.4695281982421875, -0.412353515625, -0.3551788330078125, -0.298004150390625, -0.2408294677734375, -0.18365478515625, -0.1264801025390625, -0.069305419921875, -0.0121307373046875, 0.0450439453125, 0.1022186279296875, 0.159393310546875, 0.2165679931640625, 0.27374267578125, 0.3309173583984375, 0.388092041015625, 0.4452667236328125, 0.50244140625, 0.5596160888671875, 0.616790771484375, 0.6739654541015625, 0.73114013671875, 0.7883148193359375, 0.845489501953125, 0.9026641845703125, 0.9598388671875, 1.0170135498046875, 1.074188232421875, 1.1313629150390625, 1.18853759765625, 1.2457122802734375, 1.302886962890625, 1.3600616455078125, 1.417236328125, 1.4744110107421875, 1.531585693359375, 1.5887603759765625, 1.64593505859375, 1.7031097412109375, 1.760284423828125, 1.8174591064453125, 1.8746337890625, 1.9318084716796875, 1.988983154296875, 2.0461578369140625, 2.10333251953125, 2.1605072021484375, 2.217681884765625, 2.2748565673828125, 2.33203125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 10.0, 10.0, 22.0, 26.0, 52.0, 79.0, 123.0, 158.0, 150.0, 134.0, 99.0, 49.0, 39.0, 27.0, 12.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7418136596679688, -0.6960296630859375, -0.6502456665039062, -0.604461669921875, -0.5586776733398438, -0.5128936767578125, -0.46710968017578125, -0.42132568359375, -0.37554168701171875, -0.3297576904296875, -0.28397369384765625, -0.238189697265625, -0.19240570068359375, -0.1466217041015625, -0.10083770751953125, -0.0550537109375, -0.00926971435546875, 0.0365142822265625, 0.08229827880859375, 0.128082275390625, 0.17386627197265625, 0.2196502685546875, 0.26543426513671875, 0.31121826171875, 0.35700225830078125, 0.4027862548828125, 0.44857025146484375, 0.494354248046875, 0.5401382446289062, 0.5859222412109375, 0.6317062377929688, 0.677490234375, 0.7232742309570312, 0.7690582275390625, 0.8148422241210938, 0.860626220703125, 0.9064102172851562, 0.9521942138671875, 0.9979782104492188, 1.04376220703125, 1.0895462036132812, 1.1353302001953125, 1.1811141967773438, 1.226898193359375, 1.2726821899414062, 1.3184661865234375, 1.3642501831054688, 1.4100341796875, 1.4558181762695312, 1.5016021728515625, 1.5473861694335938, 1.593170166015625, 1.6389541625976562, 1.6847381591796875, 1.7305221557617188, 1.77630615234375, 1.8220901489257812, 1.8678741455078125, 1.9136581420898438, 1.959442138671875, 2.0052261352539062, 2.0510101318359375, 2.0967941284179688, 2.142578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 9.0, 12.0, 17.0, 31.0, 51.0, 57.0, 131.0, 229.0, 362.0, 785.0, 1522.0, 3052.0, 7082.0, 20078.0, 88205.0, 1975566.0, 1975105.0, 88699.0, 20076.0, 7032.0, 3110.0, 1462.0, 699.0, 383.0, 224.0, 133.0, 61.0, 42.0, 30.0, 16.0, 9.0, 10.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9677734375, -0.937530517578125, -0.90728759765625, -0.877044677734375, -0.8468017578125, -0.816558837890625, -0.78631591796875, -0.756072998046875, -0.725830078125, -0.695587158203125, -0.66534423828125, -0.635101318359375, -0.6048583984375, -0.574615478515625, -0.54437255859375, -0.514129638671875, -0.48388671875, -0.453643798828125, -0.42340087890625, -0.393157958984375, -0.3629150390625, -0.332672119140625, -0.30242919921875, -0.272186279296875, -0.241943359375, -0.211700439453125, -0.18145751953125, -0.151214599609375, -0.1209716796875, -0.090728759765625, -0.06048583984375, -0.030242919921875, 0.0, 0.030242919921875, 0.06048583984375, 0.090728759765625, 0.1209716796875, 0.151214599609375, 0.18145751953125, 0.211700439453125, 0.241943359375, 0.272186279296875, 0.30242919921875, 0.332672119140625, 0.3629150390625, 0.393157958984375, 0.42340087890625, 0.453643798828125, 0.48388671875, 0.514129638671875, 0.54437255859375, 0.574615478515625, 0.6048583984375, 0.635101318359375, 0.66534423828125, 0.695587158203125, 0.725830078125, 0.756072998046875, 0.78631591796875, 0.816558837890625, 0.8468017578125, 0.877044677734375, 0.90728759765625, 0.937530517578125, 0.9677734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 13.0, 12.0, 18.0, 31.0, 48.0, 67.0, 125.0, 245.0, 805.0, 2014.0, 296.0, 139.0, 96.0, 46.0, 29.0, 25.0, 17.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5640411376953125, -0.547027587890625, -0.5300140380859375, -0.51300048828125, -0.4959869384765625, -0.478973388671875, -0.4619598388671875, -0.4449462890625, -0.4279327392578125, -0.410919189453125, -0.3939056396484375, -0.37689208984375, -0.3598785400390625, -0.342864990234375, -0.3258514404296875, -0.308837890625, -0.2918243408203125, -0.274810791015625, -0.2577972412109375, -0.24078369140625, -0.2237701416015625, -0.206756591796875, -0.1897430419921875, -0.1727294921875, -0.1557159423828125, -0.138702392578125, -0.1216888427734375, -0.10467529296875, -0.0876617431640625, -0.070648193359375, -0.0536346435546875, -0.03662109375, -0.0196075439453125, -0.002593994140625, 0.0144195556640625, 0.03143310546875, 0.0484466552734375, 0.065460205078125, 0.0824737548828125, 0.0994873046875, 0.1165008544921875, 0.133514404296875, 0.1505279541015625, 0.16754150390625, 0.1845550537109375, 0.201568603515625, 0.2185821533203125, 0.235595703125, 0.2526092529296875, 0.269622802734375, 0.2866363525390625, 0.30364990234375, 0.3206634521484375, 0.337677001953125, 0.3546905517578125, 0.3717041015625, 0.3887176513671875, 0.405731201171875, 0.4227447509765625, 0.43975830078125, 0.4567718505859375, 0.473785400390625, 0.4907989501953125, 0.5078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 18.0, 18.0, 49.0, 111.0, 186.0, 237.0, 197.0, 110.0, 38.0, 23.0, 7.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.986946105957031, -6.846772193908691, -6.706598281860352, -6.566424369812012, -6.426250457763672, -6.286076545715332, -6.145902633666992, -6.005728721618652, -5.8655548095703125, -5.725380897521973, -5.585206985473633, -5.445033073425293, -5.304859161376953, -5.164685249328613, -5.024511337280273, -4.884337425231934, -4.744163513183594, -4.603989601135254, -4.463815689086914, -4.323641777038574, -4.183467864990234, -4.0432939529418945, -3.9031200408935547, -3.762946128845215, -3.622772693634033, -3.4825987815856934, -3.3424248695373535, -3.2022509574890137, -3.062077045440674, -2.921903133392334, -2.781729221343994, -2.6415553092956543, -2.5013813972473145, -2.3612074851989746, -2.2210335731506348, -2.080859661102295, -1.940685749053955, -1.8005118370056152, -1.660338044166565, -1.520164132118225, -1.3799902200698853, -1.2398163080215454, -1.0996423959732056, -0.9594685435295105, -0.8192946314811707, -0.6791207194328308, -0.5389468669891357, -0.3987729549407959, -0.25859904289245605, -0.1184251457452774, 0.021748751401901245, 0.1619226336479187, 0.30209654569625854, 0.4422704577445984, 0.5824443101882935, 0.7226182222366333, 0.8627921342849731, 1.002966046333313, 1.1431399583816528, 1.2833137512207031, 1.423487663269043, 1.5636615753173828, 1.7038354873657227, 1.8440093994140625, 1.9841833114624023]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 13.0, 15.0, 16.0, 21.0, 24.0, 36.0, 32.0, 54.0, 32.0, 43.0, 48.0, 51.0, 66.0, 54.0, 39.0, 56.0, 42.0, 47.0, 37.0, 34.0, 37.0, 29.0, 35.0, 21.0, 20.0, 13.0, 14.0, 12.0, 10.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.0708112716674805, -2.009063482284546, -1.9473155736923218, -1.8855677843093872, -1.823819875717163, -1.7620720863342285, -1.700324296951294, -1.6385763883590698, -1.5768285989761353, -1.5150808095932007, -1.4533329010009766, -1.391585111618042, -1.3298372030258179, -1.2680894136428833, -1.2063415050506592, -1.1445937156677246, -1.08284592628479, -1.0210981369018555, -0.9593502283096313, -0.8976024389266968, -0.8358545899391174, -0.7741067409515381, -0.7123588919639587, -0.6506110429763794, -0.5888631343841553, -0.5271152853965759, -0.46536746621131897, -0.4036196172237396, -0.34187179803848267, -0.2801239490509033, -0.21837610006332397, -0.15662828087806702, -0.09488046169281006, -0.03313262388110161, 0.028615213930606842, 0.09036305546760559, 0.15211088955402374, 0.2138587236404419, 0.27560657262802124, 0.3373543918132782, 0.39910224080085754, 0.4608500897884369, 0.5225979089736938, 0.5843457579612732, 0.6460936069488525, 0.7078413963317871, 0.7695893049240112, 0.8313370943069458, 0.8930849432945251, 0.9548327922821045, 1.016580581665039, 1.0783284902572632, 1.1400762796401978, 1.2018241882324219, 1.2635719776153564, 1.325319766998291, 1.3870676755905151, 1.4488154649734497, 1.5105633735656738, 1.5723111629486084, 1.6340590715408325, 1.695806860923767, 1.7575547695159912, 1.8193025588989258, 1.8810503482818604]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 21.0, 34.0, 106.0, 185.0, 524.0, 3244.0, 118542.0, 901316.0, 22502.0, 1526.0, 303.0, 126.0, 50.0, 27.0, 14.0, 11.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.9556884765625, -3.833251953125, -3.7108154296875, -3.58837890625, -3.4659423828125, -3.343505859375, -3.2210693359375, -3.0986328125, -2.9761962890625, -2.853759765625, -2.7313232421875, -2.60888671875, -2.4864501953125, -2.364013671875, -2.2415771484375, -2.119140625, -1.9967041015625, -1.874267578125, -1.7518310546875, -1.62939453125, -1.5069580078125, -1.384521484375, -1.2620849609375, -1.1396484375, -1.0172119140625, -0.894775390625, -0.7723388671875, -0.64990234375, -0.5274658203125, -0.405029296875, -0.2825927734375, -0.16015625, -0.0377197265625, 0.084716796875, 0.2071533203125, 0.32958984375, 0.4520263671875, 0.574462890625, 0.6968994140625, 0.8193359375, 0.9417724609375, 1.064208984375, 1.1866455078125, 1.30908203125, 1.4315185546875, 1.553955078125, 1.6763916015625, 1.798828125, 1.9212646484375, 2.043701171875, 2.1661376953125, 2.28857421875, 2.4110107421875, 2.533447265625, 2.6558837890625, 2.7783203125, 2.9007568359375, 3.023193359375, 3.1456298828125, 3.26806640625, 3.3905029296875, 3.512939453125, 3.6353759765625, 3.7578125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 10.0, 6.0, 24.0, 31.0, 56.0, 77.0, 108.0, 122.0, 129.0, 122.0, 100.0, 67.0, 56.0, 35.0, 22.0, 16.0, 5.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.532958984375, -0.49365234375, -0.454345703125, -0.4150390625, -0.375732421875, -0.33642578125, -0.297119140625, -0.2578125, -0.218505859375, -0.17919921875, -0.139892578125, -0.1005859375, -0.061279296875, -0.02197265625, 0.017333984375, 0.056640625, 0.095947265625, 0.13525390625, 0.174560546875, 0.2138671875, 0.253173828125, 0.29248046875, 0.331787109375, 0.37109375, 0.410400390625, 0.44970703125, 0.489013671875, 0.5283203125, 0.567626953125, 0.60693359375, 0.646240234375, 0.685546875, 0.724853515625, 0.76416015625, 0.803466796875, 0.8427734375, 0.882080078125, 0.92138671875, 0.960693359375, 1.0, 1.039306640625, 1.07861328125, 1.117919921875, 1.1572265625, 1.196533203125, 1.23583984375, 1.275146484375, 1.314453125, 1.353759765625, 1.39306640625, 1.432373046875, 1.4716796875, 1.510986328125, 1.55029296875, 1.589599609375, 1.62890625, 1.668212890625, 1.70751953125, 1.746826171875, 1.7861328125, 1.825439453125, 1.86474609375, 1.904052734375, 1.943359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 5.0, 16.0, 28.0, 46.0, 76.0, 137.0, 274.0, 583.0, 1454.0, 6251.0, 90242.0, 888397.0, 53781.0, 4898.0, 1255.0, 532.0, 249.0, 131.0, 74.0, 28.0, 26.0, 15.0, 7.0, 15.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.3260498046875, -2.238037109375, -2.1500244140625, -2.06201171875, -1.9739990234375, -1.885986328125, -1.7979736328125, -1.7099609375, -1.6219482421875, -1.533935546875, -1.4459228515625, -1.35791015625, -1.2698974609375, -1.181884765625, -1.0938720703125, -1.005859375, -0.9178466796875, -0.829833984375, -0.7418212890625, -0.65380859375, -0.5657958984375, -0.477783203125, -0.3897705078125, -0.3017578125, -0.2137451171875, -0.125732421875, -0.0377197265625, 0.05029296875, 0.1383056640625, 0.226318359375, 0.3143310546875, 0.40234375, 0.4903564453125, 0.578369140625, 0.6663818359375, 0.75439453125, 0.8424072265625, 0.930419921875, 1.0184326171875, 1.1064453125, 1.1944580078125, 1.282470703125, 1.3704833984375, 1.45849609375, 1.5465087890625, 1.634521484375, 1.7225341796875, 1.810546875, 1.8985595703125, 1.986572265625, 2.0745849609375, 2.16259765625, 2.2506103515625, 2.338623046875, 2.4266357421875, 2.5146484375, 2.6026611328125, 2.690673828125, 2.7786865234375, 2.86669921875, 2.9547119140625, 3.042724609375, 3.1307373046875, 3.21875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 11.0, 11.0, 14.0, 14.0, 19.0, 20.0, 21.0, 27.0, 24.0, 30.0, 29.0, 46.0, 56.0, 35.0, 40.0, 52.0, 55.0, 49.0, 46.0, 43.0, 41.0, 51.0, 26.0, 36.0, 32.0, 27.0, 19.0, 15.0, 20.0, 18.0, 6.0, 6.0, 9.0, 8.0, 8.0, 2.0, 9.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.162109375, -2.088897705078125, -2.01568603515625, -1.942474365234375, -1.8692626953125, -1.796051025390625, -1.72283935546875, -1.649627685546875, -1.576416015625, -1.503204345703125, -1.42999267578125, -1.356781005859375, -1.2835693359375, -1.210357666015625, -1.13714599609375, -1.063934326171875, -0.99072265625, -0.917510986328125, -0.84429931640625, -0.771087646484375, -0.6978759765625, -0.624664306640625, -0.55145263671875, -0.478240966796875, -0.405029296875, -0.331817626953125, -0.25860595703125, -0.185394287109375, -0.1121826171875, -0.038970947265625, 0.03424072265625, 0.107452392578125, 0.1806640625, 0.253875732421875, 0.32708740234375, 0.400299072265625, 0.4735107421875, 0.546722412109375, 0.61993408203125, 0.693145751953125, 0.766357421875, 0.839569091796875, 0.91278076171875, 0.985992431640625, 1.0592041015625, 1.132415771484375, 1.20562744140625, 1.278839111328125, 1.35205078125, 1.425262451171875, 1.49847412109375, 1.571685791015625, 1.6448974609375, 1.718109130859375, 1.79132080078125, 1.864532470703125, 1.937744140625, 2.010955810546875, 2.08416748046875, 2.157379150390625, 2.2305908203125, 2.303802490234375, 2.37701416015625, 2.450225830078125, 2.5234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 18.0, 13.0, 12.0, 27.0, 49.0, 63.0, 125.0, 184.0, 348.0, 752.0, 2169.0, 10639.0, 148943.0, 824895.0, 51845.0, 5788.0, 1439.0, 539.0, 271.0, 142.0, 107.0, 56.0, 30.0, 24.0, 16.0, 14.0, 9.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.994140625, -0.9651870727539062, -0.9362335205078125, -0.9072799682617188, -0.878326416015625, -0.8493728637695312, -0.8204193115234375, -0.7914657592773438, -0.76251220703125, -0.7335586547851562, -0.7046051025390625, -0.6756515502929688, -0.646697998046875, -0.6177444458007812, -0.5887908935546875, -0.5598373413085938, -0.5308837890625, -0.5019302368164062, -0.4729766845703125, -0.44402313232421875, -0.415069580078125, -0.38611602783203125, -0.3571624755859375, -0.32820892333984375, -0.29925537109375, -0.27030181884765625, -0.2413482666015625, -0.21239471435546875, -0.183441162109375, -0.15448760986328125, -0.1255340576171875, -0.09658050537109375, -0.067626953125, -0.03867340087890625, -0.0097198486328125, 0.01923370361328125, 0.048187255859375, 0.07714080810546875, 0.1060943603515625, 0.13504791259765625, 0.16400146484375, 0.19295501708984375, 0.2219085693359375, 0.25086212158203125, 0.279815673828125, 0.30876922607421875, 0.3377227783203125, 0.36667633056640625, 0.3956298828125, 0.42458343505859375, 0.4535369873046875, 0.48249053955078125, 0.511444091796875, 0.5403976440429688, 0.5693511962890625, 0.5983047485351562, 0.62725830078125, 0.6562118530273438, 0.6851654052734375, 0.7141189575195312, 0.743072509765625, 0.7720260620117188, 0.8009796142578125, 0.8299331665039062, 0.85888671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 0.0, 3.0, 10.0, 12.0, 5.0, 11.0, 19.0, 16.0, 29.0, 33.0, 36.0, 52.0, 69.0, 72.0, 90.0, 127.0, 91.0, 67.0, 55.0, 32.0, 40.0, 31.0, 24.0, 18.0, 14.0, 11.0, 7.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015234947204589844, -0.00014836899936199188, -0.00014438852667808533, -0.00014040805399417877, -0.00013642758131027222, -0.00013244710862636566, -0.0001284666359424591, -0.00012448616325855255, -0.000120505690574646, -0.00011652521789073944, -0.00011254474520683289, -0.00010856427252292633, -0.00010458379983901978, -0.00010060332715511322, -9.662285447120667e-05, -9.264238178730011e-05, -8.866190910339355e-05, -8.4681436419487e-05, -8.070096373558044e-05, -7.672049105167389e-05, -7.274001836776733e-05, -6.875954568386078e-05, -6.477907299995422e-05, -6.079860031604767e-05, -5.681812763214111e-05, -5.283765494823456e-05, -4.8857182264328e-05, -4.487670958042145e-05, -4.089623689651489e-05, -3.691576421260834e-05, -3.293529152870178e-05, -2.8954818844795227e-05, -2.4974346160888672e-05, -2.0993873476982117e-05, -1.701340079307556e-05, -1.3032928109169006e-05, -9.052455425262451e-06, -5.071982741355896e-06, -1.0915100574493408e-06, 2.8889626264572144e-06, 6.8694353103637695e-06, 1.0849907994270325e-05, 1.483038067817688e-05, 1.8810853362083435e-05, 2.279132604598999e-05, 2.6771798729896545e-05, 3.07522714138031e-05, 3.4732744097709656e-05, 3.871321678161621e-05, 4.2693689465522766e-05, 4.667416214942932e-05, 5.0654634833335876e-05, 5.463510751724243e-05, 5.861558020114899e-05, 6.259605288505554e-05, 6.65765255689621e-05, 7.055699825286865e-05, 7.453747093677521e-05, 7.851794362068176e-05, 8.249841630458832e-05, 8.647888898849487e-05, 9.045936167240143e-05, 9.443983435630798e-05, 9.842030704021454e-05, 0.0001024007797241211]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 4.0, 15.0, 23.0, 21.0, 41.0, 78.0, 146.0, 304.0, 714.0, 2494.0, 16699.0, 733939.0, 281985.0, 9293.0, 1676.0, 573.0, 270.0, 111.0, 59.0, 50.0, 20.0, 10.0, 14.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.5490188598632812, -1.5111236572265625, -1.4732284545898438, -1.435333251953125, -1.3974380493164062, -1.3595428466796875, -1.3216476440429688, -1.28375244140625, -1.2458572387695312, -1.2079620361328125, -1.1700668334960938, -1.132171630859375, -1.0942764282226562, -1.0563812255859375, -1.0184860229492188, -0.9805908203125, -0.9426956176757812, -0.9048004150390625, -0.8669052124023438, -0.829010009765625, -0.7911148071289062, -0.7532196044921875, -0.7153244018554688, -0.67742919921875, -0.6395339965820312, -0.6016387939453125, -0.5637435913085938, -0.525848388671875, -0.48795318603515625, -0.4500579833984375, -0.41216278076171875, -0.374267578125, -0.33637237548828125, -0.2984771728515625, -0.26058197021484375, -0.222686767578125, -0.18479156494140625, -0.1468963623046875, -0.10900115966796875, -0.07110595703125, -0.03321075439453125, 0.0046844482421875, 0.04257965087890625, 0.080474853515625, 0.11837005615234375, 0.1562652587890625, 0.19416046142578125, 0.2320556640625, 0.26995086669921875, 0.3078460693359375, 0.34574127197265625, 0.383636474609375, 0.42153167724609375, 0.4594268798828125, 0.49732208251953125, 0.53521728515625, 0.5731124877929688, 0.6110076904296875, 0.6489028930664062, 0.686798095703125, 0.7246932983398438, 0.7625885009765625, 0.8004837036132812, 0.83837890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 8.0, 9.0, 6.0, 11.0, 20.0, 42.0, 45.0, 74.0, 101.0, 126.0, 140.0, 114.0, 77.0, 76.0, 48.0, 31.0, 12.0, 13.0, 12.0, 6.0, 7.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5797271728515625, -0.551055908203125, -0.5223846435546875, -0.49371337890625, -0.4650421142578125, -0.436370849609375, -0.4076995849609375, -0.3790283203125, -0.3503570556640625, -0.321685791015625, -0.2930145263671875, -0.26434326171875, -0.2356719970703125, -0.207000732421875, -0.1783294677734375, -0.149658203125, -0.1209869384765625, -0.092315673828125, -0.0636444091796875, -0.03497314453125, -0.0063018798828125, 0.022369384765625, 0.0510406494140625, 0.0797119140625, 0.1083831787109375, 0.137054443359375, 0.1657257080078125, 0.19439697265625, 0.2230682373046875, 0.251739501953125, 0.2804107666015625, 0.30908203125, 0.3377532958984375, 0.366424560546875, 0.3950958251953125, 0.42376708984375, 0.4524383544921875, 0.481109619140625, 0.5097808837890625, 0.5384521484375, 0.5671234130859375, 0.595794677734375, 0.6244659423828125, 0.65313720703125, 0.6818084716796875, 0.710479736328125, 0.7391510009765625, 0.767822265625, 0.7964935302734375, 0.825164794921875, 0.8538360595703125, 0.88250732421875, 0.9111785888671875, 0.939849853515625, 0.9685211181640625, 0.9971923828125, 1.0258636474609375, 1.054534912109375, 1.0832061767578125, 1.11187744140625, 1.1405487060546875, 1.169219970703125, 1.1978912353515625, 1.2265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 24.0, 131.0, 534.0, 255.0, 48.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-66.69625854492188, -65.40594482421875, -64.11563110351562, -62.8253173828125, -61.535003662109375, -60.24468994140625, -58.954376220703125, -57.664058685302734, -56.37374496459961, -55.083431243896484, -53.79311752319336, -52.502803802490234, -51.21249008178711, -49.92217254638672, -48.631858825683594, -47.34154510498047, -46.051231384277344, -44.76091766357422, -43.470603942871094, -42.18029022216797, -40.889976501464844, -39.59966278076172, -38.309349060058594, -37.0190315246582, -35.728721618652344, -34.43840789794922, -33.148094177246094, -31.85778045654297, -30.56746482849121, -29.277151107788086, -27.98683738708496, -26.696521759033203, -25.406211853027344, -24.11589813232422, -22.825584411621094, -21.53527069091797, -20.24495506286621, -18.954641342163086, -17.66432762145996, -16.374011993408203, -15.083698272705078, -13.793384552001953, -12.503069877624512, -11.212756156921387, -9.922441482543945, -8.63212776184082, -7.341814041137695, -6.051499366760254, -4.761185646057129, -3.4708714485168457, -2.1805574893951416, -0.8902435302734375, 0.4000706672668457, 1.690384864807129, 2.980698585510254, 4.271013259887695, 5.56132698059082, 6.8516411781311035, 8.141955375671387, 9.432269096374512, 10.722583770751953, 12.012897491455078, 13.303211212158203, 14.593525886535645, 15.88383960723877]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 13.0, 13.0, 15.0, 11.0, 21.0, 20.0, 29.0, 29.0, 49.0, 43.0, 41.0, 44.0, 59.0, 63.0, 69.0, 59.0, 57.0, 32.0, 50.0, 45.0, 37.0, 32.0, 36.0, 30.0, 19.0, 14.0, 12.0, 12.0, 6.0, 4.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.336716651916504, -12.959380149841309, -12.582043647766113, -12.204707145690918, -11.827371597290039, -11.450035095214844, -11.072698593139648, -10.695362091064453, -10.318025588989258, -9.940689086914062, -9.563352584838867, -9.186016082763672, -8.808679580688477, -8.431344032287598, -8.054007530212402, -7.676671028137207, -7.299334526062012, -6.921998023986816, -6.544661521911621, -6.167325496673584, -5.789988994598389, -5.412652492523193, -5.035316467285156, -4.657979965209961, -4.280643463134766, -3.9033069610595703, -3.525970697402954, -3.148634433746338, -2.7712979316711426, -2.3939614295959473, -2.016625165939331, -1.6392889022827148, -1.2619514465332031, -0.8846150636672974, -0.5072786808013916, -0.12994229793548584, 0.24739408493041992, 0.6247304677963257, 1.0020668506622314, 1.3794031143188477, 1.756739616394043, 2.1340761184692383, 2.5114123821258545, 2.8887486457824707, 3.266085147857666, 3.6434216499328613, 4.020757675170898, 4.398094177246094, 4.775430679321289, 5.152767181396484, 5.53010368347168, 5.907439708709717, 6.284776210784912, 6.662112712860107, 7.0394487380981445, 7.41678524017334, 7.794121742248535, 8.17145824432373, 8.548794746398926, 8.926131248474121, 9.303466796875, 9.680803298950195, 10.05813980102539, 10.435476303100586, 10.812812805175781]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 17.0, 11.0, 24.0, 21.0, 46.0, 69.0, 142.0, 352.0, 1198.0, 7261.0, 128381.0, 3960459.0, 88344.0, 5888.0, 1228.0, 367.0, 164.0, 105.0, 62.0, 41.0, 30.0, 16.0, 15.0, 8.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7939453125, -1.738677978515625, -1.68341064453125, -1.628143310546875, -1.5728759765625, -1.517608642578125, -1.46234130859375, -1.407073974609375, -1.351806640625, -1.296539306640625, -1.24127197265625, -1.186004638671875, -1.1307373046875, -1.075469970703125, -1.02020263671875, -0.964935302734375, -0.90966796875, -0.854400634765625, -0.79913330078125, -0.743865966796875, -0.6885986328125, -0.633331298828125, -0.57806396484375, -0.522796630859375, -0.467529296875, -0.412261962890625, -0.35699462890625, -0.301727294921875, -0.2464599609375, -0.191192626953125, -0.13592529296875, -0.080657958984375, -0.025390625, 0.029876708984375, 0.08514404296875, 0.140411376953125, 0.1956787109375, 0.250946044921875, 0.30621337890625, 0.361480712890625, 0.416748046875, 0.472015380859375, 0.52728271484375, 0.582550048828125, 0.6378173828125, 0.693084716796875, 0.74835205078125, 0.803619384765625, 0.85888671875, 0.914154052734375, 0.96942138671875, 1.024688720703125, 1.0799560546875, 1.135223388671875, 1.19049072265625, 1.245758056640625, 1.301025390625, 1.356292724609375, 1.41156005859375, 1.466827392578125, 1.5220947265625, 1.577362060546875, 1.63262939453125, 1.687896728515625, 1.7431640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 20.0, 37.0, 62.0, 64.0, 78.0, 93.0, 123.0, 112.0, 103.0, 80.0, 64.0, 43.0, 36.0, 22.0, 19.0, 10.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43994140625, -0.41255950927734375, -0.3851776123046875, -0.35779571533203125, -0.330413818359375, -0.30303192138671875, -0.2756500244140625, -0.24826812744140625, -0.22088623046875, -0.19350433349609375, -0.1661224365234375, -0.13874053955078125, -0.111358642578125, -0.08397674560546875, -0.0565948486328125, -0.02921295166015625, -0.0018310546875, 0.02555084228515625, 0.0529327392578125, 0.08031463623046875, 0.107696533203125, 0.13507843017578125, 0.1624603271484375, 0.18984222412109375, 0.21722412109375, 0.24460601806640625, 0.2719879150390625, 0.29936981201171875, 0.326751708984375, 0.35413360595703125, 0.3815155029296875, 0.40889739990234375, 0.436279296875, 0.46366119384765625, 0.4910430908203125, 0.5184249877929688, 0.545806884765625, 0.5731887817382812, 0.6005706787109375, 0.6279525756835938, 0.65533447265625, 0.6827163696289062, 0.7100982666015625, 0.7374801635742188, 0.764862060546875, 0.7922439575195312, 0.8196258544921875, 0.8470077514648438, 0.8743896484375, 0.9017715454101562, 0.9291534423828125, 0.9565353393554688, 0.983917236328125, 1.0112991333007812, 1.0386810302734375, 1.0660629272460938, 1.09344482421875, 1.1208267211914062, 1.1482086181640625, 1.1755905151367188, 1.202972412109375, 1.2303543090820312, 1.2577362060546875, 1.2851181030273438, 1.3125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 4.0, 8.0, 13.0, 17.0, 20.0, 31.0, 50.0, 95.0, 174.0, 520.0, 1699.0, 8917.0, 84076.0, 3601610.0, 470500.0, 21860.0, 3349.0, 782.0, 259.0, 98.0, 66.0, 32.0, 22.0, 9.0, 12.0, 20.0, 4.0, 13.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1650238037109375, -1.123016357421875, -1.0810089111328125, -1.03900146484375, -0.9969940185546875, -0.954986572265625, -0.9129791259765625, -0.8709716796875, -0.8289642333984375, -0.786956787109375, -0.7449493408203125, -0.70294189453125, -0.6609344482421875, -0.618927001953125, -0.5769195556640625, -0.534912109375, -0.4929046630859375, -0.450897216796875, -0.4088897705078125, -0.36688232421875, -0.3248748779296875, -0.282867431640625, -0.2408599853515625, -0.1988525390625, -0.1568450927734375, -0.114837646484375, -0.0728302001953125, -0.03082275390625, 0.0111846923828125, 0.053192138671875, 0.0951995849609375, 0.13720703125, 0.1792144775390625, 0.221221923828125, 0.2632293701171875, 0.30523681640625, 0.3472442626953125, 0.389251708984375, 0.4312591552734375, 0.4732666015625, 0.5152740478515625, 0.557281494140625, 0.5992889404296875, 0.64129638671875, 0.6833038330078125, 0.725311279296875, 0.7673187255859375, 0.809326171875, 0.8513336181640625, 0.893341064453125, 0.9353485107421875, 0.97735595703125, 1.0193634033203125, 1.061370849609375, 1.1033782958984375, 1.1453857421875, 1.1873931884765625, 1.229400634765625, 1.2714080810546875, 1.31341552734375, 1.3554229736328125, 1.397430419921875, 1.4394378662109375, 1.4814453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 8.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 11.0, 16.0, 17.0, 23.0, 45.0, 64.0, 104.0, 181.0, 390.0, 720.0, 943.0, 689.0, 349.0, 215.0, 88.0, 62.0, 45.0, 18.0, 19.0, 10.0, 15.0, 6.0, 6.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.13671875, -1.1037750244140625, -1.070831298828125, -1.0378875732421875, -1.00494384765625, -0.9720001220703125, -0.939056396484375, -0.9061126708984375, -0.8731689453125, -0.8402252197265625, -0.807281494140625, -0.7743377685546875, -0.74139404296875, -0.7084503173828125, -0.675506591796875, -0.6425628662109375, -0.609619140625, -0.5766754150390625, -0.543731689453125, -0.5107879638671875, -0.47784423828125, -0.4449005126953125, -0.411956787109375, -0.3790130615234375, -0.3460693359375, -0.3131256103515625, -0.280181884765625, -0.2472381591796875, -0.21429443359375, -0.1813507080078125, -0.148406982421875, -0.1154632568359375, -0.08251953125, -0.0495758056640625, -0.016632080078125, 0.0163116455078125, 0.04925537109375, 0.0821990966796875, 0.115142822265625, 0.1480865478515625, 0.1810302734375, 0.2139739990234375, 0.246917724609375, 0.2798614501953125, 0.31280517578125, 0.3457489013671875, 0.378692626953125, 0.4116363525390625, 0.444580078125, 0.4775238037109375, 0.510467529296875, 0.5434112548828125, 0.57635498046875, 0.6092987060546875, 0.642242431640625, 0.6751861572265625, 0.7081298828125, 0.7410736083984375, 0.774017333984375, 0.8069610595703125, 0.83990478515625, 0.8728485107421875, 0.905792236328125, 0.9387359619140625, 0.9716796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 21.0, 115.0, 382.0, 340.0, 100.0, 23.0, 10.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.93694305419922, -25.345582962036133, -24.754220962524414, -24.162860870361328, -23.57149887084961, -22.980138778686523, -22.388778686523438, -21.79741668701172, -21.206056594848633, -20.614696502685547, -20.023334503173828, -19.431974411010742, -18.840612411499023, -18.249252319335938, -17.65789031982422, -17.066530227661133, -16.475170135498047, -15.883809089660645, -15.292448043823242, -14.701087951660156, -14.109726905822754, -13.518365859985352, -12.92700481414795, -12.335643768310547, -11.744281768798828, -11.152920722961426, -10.561559677124023, -9.970199584960938, -9.378838539123535, -8.787477493286133, -8.19611644744873, -7.604755878448486, -7.013395309448242, -6.42203426361084, -5.830673694610596, -5.239312648773193, -4.647952079772949, -4.056591033935547, -3.4652299880981445, -2.8738694190979004, -2.282508373260498, -1.6911475658416748, -1.099786639213562, -0.5084257125854492, 0.08293509483337402, 0.6742959022521973, 1.2656569480895996, 1.8570175170898438, 2.448378562927246, 3.0397393703460693, 3.6311001777648926, 4.222461223602295, 4.813821792602539, 5.405182838439941, 5.996543884277344, 6.587904453277588, 7.17926549911499, 7.770626544952393, 8.361987113952637, 8.953348159790039, 9.544709205627441, 10.136070251464844, 10.72743034362793, 11.318791389465332, 11.910152435302734]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 10.0, 18.0, 21.0, 24.0, 35.0, 44.0, 51.0, 48.0, 61.0, 70.0, 72.0, 70.0, 69.0, 58.0, 62.0, 58.0, 41.0, 28.0, 28.0, 33.0, 19.0, 25.0, 13.0, 7.0, 9.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.451959133148193, -7.267388343811035, -7.082817554473877, -6.898246765136719, -6.713675498962402, -6.529104709625244, -6.344533920288086, -6.159963130950928, -5.9753923416137695, -5.790821552276611, -5.606250762939453, -5.421679496765137, -5.2371087074279785, -5.05253791809082, -4.867967128753662, -4.683396339416504, -4.4988250732421875, -4.314254283905029, -4.129683494567871, -3.945112466812134, -3.7605414390563965, -3.5759706497192383, -3.39139986038208, -3.206829071044922, -3.0222580432891846, -2.8376872539520264, -2.653116226196289, -2.468545436859131, -2.2839746475219727, -2.0994036197662354, -1.9148328304290771, -1.7302619218826294, -1.5456905364990234, -1.3611196279525757, -1.176548719406128, -0.9919779300689697, -0.807407021522522, -0.6228361129760742, -0.438265323638916, -0.25369441509246826, -0.06912350654602051, 0.11544737219810486, 0.3000182509422302, 0.4845890998840332, 0.669160008430481, 0.8537309169769287, 1.038301706314087, 1.2228726148605347, 1.4074435234069824, 1.5920144319534302, 1.776585340499878, 1.9611561298370361, 2.1457271575927734, 2.3302979469299316, 2.51486873626709, 2.699439525604248, 2.8840105533599854, 3.0685813426971436, 3.253152370452881, 3.437723159790039, 3.6222939491271973, 3.8068649768829346, 3.9914357662200928, 4.17600679397583, 4.360577583312988]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 8.0, 11.0, 19.0, 19.0, 39.0, 58.0, 127.0, 233.0, 441.0, 1001.0, 2347.0, 6399.0, 20704.0, 84671.0, 422237.0, 400317.0, 79929.0, 19776.0, 5982.0, 2287.0, 963.0, 448.0, 233.0, 118.0, 74.0, 36.0, 28.0, 15.0, 10.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8667984008789062, -0.8346710205078125, -0.8025436401367188, -0.770416259765625, -0.7382888793945312, -0.7061614990234375, -0.6740341186523438, -0.64190673828125, -0.6097793579101562, -0.5776519775390625, -0.5455245971679688, -0.513397216796875, -0.48126983642578125, -0.4491424560546875, -0.41701507568359375, -0.3848876953125, -0.35276031494140625, -0.3206329345703125, -0.28850555419921875, -0.256378173828125, -0.22425079345703125, -0.1921234130859375, -0.15999603271484375, -0.12786865234375, -0.09574127197265625, -0.0636138916015625, -0.03148651123046875, 0.000640869140625, 0.03276824951171875, 0.0648956298828125, 0.09702301025390625, 0.129150390625, 0.16127777099609375, 0.1934051513671875, 0.22553253173828125, 0.257659912109375, 0.28978729248046875, 0.3219146728515625, 0.35404205322265625, 0.38616943359375, 0.41829681396484375, 0.4504241943359375, 0.48255157470703125, 0.514678955078125, 0.5468063354492188, 0.5789337158203125, 0.6110610961914062, 0.6431884765625, 0.6753158569335938, 0.7074432373046875, 0.7395706176757812, 0.771697998046875, 0.8038253784179688, 0.8359527587890625, 0.8680801391601562, 0.90020751953125, 0.9323348999023438, 0.9644622802734375, 0.9965896606445312, 1.028717041015625, 1.0608444213867188, 1.0929718017578125, 1.1250991821289062, 1.1572265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 9.0, 14.0, 27.0, 33.0, 40.0, 52.0, 70.0, 88.0, 87.0, 87.0, 84.0, 100.0, 76.0, 59.0, 50.0, 30.0, 20.0, 21.0, 18.0, 10.0, 7.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.44345855712890625, -0.4210968017578125, -0.39873504638671875, -0.376373291015625, -0.35401153564453125, -0.3316497802734375, -0.30928802490234375, -0.28692626953125, -0.26456451416015625, -0.2422027587890625, -0.21984100341796875, -0.197479248046875, -0.17511749267578125, -0.1527557373046875, -0.13039398193359375, -0.1080322265625, -0.08567047119140625, -0.0633087158203125, -0.04094696044921875, -0.018585205078125, 0.00377655029296875, 0.0261383056640625, 0.04850006103515625, 0.07086181640625, 0.09322357177734375, 0.1155853271484375, 0.13794708251953125, 0.160308837890625, 0.18267059326171875, 0.2050323486328125, 0.22739410400390625, 0.249755859375, 0.27211761474609375, 0.2944793701171875, 0.31684112548828125, 0.339202880859375, 0.36156463623046875, 0.3839263916015625, 0.40628814697265625, 0.42864990234375, 0.45101165771484375, 0.4733734130859375, 0.49573516845703125, 0.518096923828125, 0.5404586791992188, 0.5628204345703125, 0.5851821899414062, 0.6075439453125, 0.6299057006835938, 0.6522674560546875, 0.6746292114257812, 0.696990966796875, 0.7193527221679688, 0.7417144775390625, 0.7640762329101562, 0.78643798828125, 0.8087997436523438, 0.8311614990234375, 0.8535232543945312, 0.875885009765625, 0.8982467651367188, 0.9206085205078125, 0.9429702758789062, 0.96533203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 3.0, 6.0, 12.0, 12.0, 22.0, 47.0, 59.0, 90.0, 157.0, 226.0, 435.0, 971.0, 2611.0, 12903.0, 270134.0, 729619.0, 24980.0, 3779.0, 1190.0, 574.0, 270.0, 165.0, 91.0, 65.0, 42.0, 26.0, 18.0, 12.0, 8.0, 11.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.96875, -1.90118408203125, -1.8336181640625, -1.76605224609375, -1.698486328125, -1.63092041015625, -1.5633544921875, -1.49578857421875, -1.42822265625, -1.36065673828125, -1.2930908203125, -1.22552490234375, -1.157958984375, -1.09039306640625, -1.0228271484375, -0.95526123046875, -0.8876953125, -0.82012939453125, -0.7525634765625, -0.68499755859375, -0.617431640625, -0.54986572265625, -0.4822998046875, -0.41473388671875, -0.34716796875, -0.27960205078125, -0.2120361328125, -0.14447021484375, -0.076904296875, -0.00933837890625, 0.0582275390625, 0.12579345703125, 0.193359375, 0.26092529296875, 0.3284912109375, 0.39605712890625, 0.463623046875, 0.53118896484375, 0.5987548828125, 0.66632080078125, 0.73388671875, 0.80145263671875, 0.8690185546875, 0.93658447265625, 1.004150390625, 1.07171630859375, 1.1392822265625, 1.20684814453125, 1.2744140625, 1.34197998046875, 1.4095458984375, 1.47711181640625, 1.544677734375, 1.61224365234375, 1.6798095703125, 1.74737548828125, 1.81494140625, 1.88250732421875, 1.9500732421875, 2.01763916015625, 2.085205078125, 2.15277099609375, 2.2203369140625, 2.28790283203125, 2.35546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 3.0, 11.0, 5.0, 10.0, 11.0, 16.0, 29.0, 22.0, 30.0, 46.0, 45.0, 55.0, 75.0, 55.0, 59.0, 83.0, 66.0, 67.0, 66.0, 51.0, 40.0, 30.0, 30.0, 21.0, 14.0, 11.0, 9.0, 11.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.55194091796875, -2.4749755859375, -2.39801025390625, -2.321044921875, -2.24407958984375, -2.1671142578125, -2.09014892578125, -2.01318359375, -1.93621826171875, -1.8592529296875, -1.78228759765625, -1.705322265625, -1.62835693359375, -1.5513916015625, -1.47442626953125, -1.3974609375, -1.32049560546875, -1.2435302734375, -1.16656494140625, -1.089599609375, -1.01263427734375, -0.9356689453125, -0.85870361328125, -0.78173828125, -0.70477294921875, -0.6278076171875, -0.55084228515625, -0.473876953125, -0.39691162109375, -0.3199462890625, -0.24298095703125, -0.166015625, -0.08905029296875, -0.0120849609375, 0.06488037109375, 0.141845703125, 0.21881103515625, 0.2957763671875, 0.37274169921875, 0.44970703125, 0.52667236328125, 0.6036376953125, 0.68060302734375, 0.757568359375, 0.83453369140625, 0.9114990234375, 0.98846435546875, 1.0654296875, 1.14239501953125, 1.2193603515625, 1.29632568359375, 1.373291015625, 1.45025634765625, 1.5272216796875, 1.60418701171875, 1.68115234375, 1.75811767578125, 1.8350830078125, 1.91204833984375, 1.989013671875, 2.06597900390625, 2.1429443359375, 2.21990966796875, 2.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 17.0, 15.0, 15.0, 29.0, 32.0, 45.0, 61.0, 112.0, 204.0, 384.0, 796.0, 2170.0, 8496.0, 70970.0, 855171.0, 95393.0, 10274.0, 2452.0, 906.0, 409.0, 200.0, 122.0, 76.0, 49.0, 36.0, 24.0, 24.0, 13.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.927734375, -0.90008544921875, -0.8724365234375, -0.84478759765625, -0.817138671875, -0.78948974609375, -0.7618408203125, -0.73419189453125, -0.70654296875, -0.67889404296875, -0.6512451171875, -0.62359619140625, -0.595947265625, -0.56829833984375, -0.5406494140625, -0.51300048828125, -0.4853515625, -0.45770263671875, -0.4300537109375, -0.40240478515625, -0.374755859375, -0.34710693359375, -0.3194580078125, -0.29180908203125, -0.26416015625, -0.23651123046875, -0.2088623046875, -0.18121337890625, -0.153564453125, -0.12591552734375, -0.0982666015625, -0.07061767578125, -0.04296875, -0.01531982421875, 0.0123291015625, 0.03997802734375, 0.067626953125, 0.09527587890625, 0.1229248046875, 0.15057373046875, 0.17822265625, 0.20587158203125, 0.2335205078125, 0.26116943359375, 0.288818359375, 0.31646728515625, 0.3441162109375, 0.37176513671875, 0.3994140625, 0.42706298828125, 0.4547119140625, 0.48236083984375, 0.510009765625, 0.53765869140625, 0.5653076171875, 0.59295654296875, 0.62060546875, 0.64825439453125, 0.6759033203125, 0.70355224609375, 0.731201171875, 0.75885009765625, 0.7864990234375, 0.81414794921875, 0.841796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 11.0, 11.0, 10.0, 16.0, 17.0, 18.0, 22.0, 30.0, 39.0, 51.0, 56.0, 93.0, 138.0, 138.0, 69.0, 39.0, 41.0, 29.0, 25.0, 21.0, 15.0, 9.0, 12.0, 10.0, 11.0, 12.0, 7.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074075698852539, -0.00010391976684331894, -0.00010043196380138397, -9.6944160759449e-05, -9.345635771751404e-05, -8.996855467557907e-05, -8.64807516336441e-05, -8.299294859170914e-05, -7.950514554977417e-05, -7.60173425078392e-05, -7.252953946590424e-05, -6.904173642396927e-05, -6.55539333820343e-05, -6.206613034009933e-05, -5.857832729816437e-05, -5.50905242562294e-05, -5.1602721214294434e-05, -4.8114918172359467e-05, -4.46271151304245e-05, -4.113931208848953e-05, -3.7651509046554565e-05, -3.41637060046196e-05, -3.067590296268463e-05, -2.7188099920749664e-05, -2.3700296878814697e-05, -2.021249383687973e-05, -1.6724690794944763e-05, -1.3236887753009796e-05, -9.749084711074829e-06, -6.261281669139862e-06, -2.773478627204895e-06, 7.14324414730072e-07, 4.202127456665039e-06, 7.689930498600006e-06, 1.1177733540534973e-05, 1.466553658246994e-05, 1.8153339624404907e-05, 2.1641142666339874e-05, 2.512894570827484e-05, 2.861674875020981e-05, 3.2104551792144775e-05, 3.559235483407974e-05, 3.908015787601471e-05, 4.2567960917949677e-05, 4.6055763959884644e-05, 4.954356700181961e-05, 5.303137004375458e-05, 5.6519173085689545e-05, 6.000697612762451e-05, 6.349477916955948e-05, 6.698258221149445e-05, 7.047038525342941e-05, 7.395818829536438e-05, 7.744599133729935e-05, 8.093379437923431e-05, 8.442159742116928e-05, 8.790940046310425e-05, 9.139720350503922e-05, 9.488500654697418e-05, 9.837280958890915e-05, 0.00010186061263084412, 0.00010534841567277908, 0.00010883621871471405, 0.00011232402175664902, 0.00011581182479858398]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 11.0, 16.0, 20.0, 28.0, 44.0, 72.0, 119.0, 215.0, 344.0, 693.0, 1547.0, 4688.0, 24072.0, 366903.0, 609371.0, 31467.0, 5467.0, 1764.0, 725.0, 391.0, 202.0, 128.0, 65.0, 55.0, 41.0, 22.0, 24.0, 14.0, 9.0, 10.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76025390625, -0.7349624633789062, -0.7096710205078125, -0.6843795776367188, -0.659088134765625, -0.6337966918945312, -0.6085052490234375, -0.5832138061523438, -0.55792236328125, -0.5326309204101562, -0.5073394775390625, -0.48204803466796875, -0.456756591796875, -0.43146514892578125, -0.4061737060546875, -0.38088226318359375, -0.3555908203125, -0.33029937744140625, -0.3050079345703125, -0.27971649169921875, -0.254425048828125, -0.22913360595703125, -0.2038421630859375, -0.17855072021484375, -0.15325927734375, -0.12796783447265625, -0.1026763916015625, -0.07738494873046875, -0.052093505859375, -0.02680206298828125, -0.0015106201171875, 0.02378082275390625, 0.049072265625, 0.07436370849609375, 0.0996551513671875, 0.12494659423828125, 0.150238037109375, 0.17552947998046875, 0.2008209228515625, 0.22611236572265625, 0.25140380859375, 0.27669525146484375, 0.3019866943359375, 0.32727813720703125, 0.352569580078125, 0.37786102294921875, 0.4031524658203125, 0.42844390869140625, 0.4537353515625, 0.47902679443359375, 0.5043182373046875, 0.5296096801757812, 0.554901123046875, 0.5801925659179688, 0.6054840087890625, 0.6307754516601562, 0.65606689453125, 0.6813583374023438, 0.7066497802734375, 0.7319412231445312, 0.757232666015625, 0.7825241088867188, 0.8078155517578125, 0.8331069946289062, 0.8583984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 12.0, 8.0, 11.0, 16.0, 15.0, 31.0, 32.0, 45.0, 48.0, 56.0, 85.0, 109.0, 91.0, 88.0, 73.0, 64.0, 57.0, 31.0, 23.0, 28.0, 14.0, 10.0, 14.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64208984375, -0.6233901977539062, -0.6046905517578125, -0.5859909057617188, -0.567291259765625, -0.5485916137695312, -0.5298919677734375, -0.5111923217773438, -0.49249267578125, -0.47379302978515625, -0.4550933837890625, -0.43639373779296875, -0.417694091796875, -0.39899444580078125, -0.3802947998046875, -0.36159515380859375, -0.3428955078125, -0.32419586181640625, -0.3054962158203125, -0.28679656982421875, -0.268096923828125, -0.24939727783203125, -0.2306976318359375, -0.21199798583984375, -0.19329833984375, -0.17459869384765625, -0.1558990478515625, -0.13719940185546875, -0.118499755859375, -0.09980010986328125, -0.0811004638671875, -0.06240081787109375, -0.043701171875, -0.02500152587890625, -0.0063018798828125, 0.01239776611328125, 0.031097412109375, 0.04979705810546875, 0.0684967041015625, 0.08719635009765625, 0.10589599609375, 0.12459564208984375, 0.1432952880859375, 0.16199493408203125, 0.180694580078125, 0.19939422607421875, 0.2180938720703125, 0.23679351806640625, 0.2554931640625, 0.27419281005859375, 0.2928924560546875, 0.31159210205078125, 0.330291748046875, 0.34899139404296875, 0.3676910400390625, 0.38639068603515625, 0.40509033203125, 0.42378997802734375, 0.4424896240234375, 0.46118927001953125, 0.479888916015625, 0.49858856201171875, 0.5172882080078125, 0.5359878540039062, 0.5546875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 17.0, 37.0, 131.0, 337.0, 315.0, 107.0, 25.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.143689155578613, -14.53260326385498, -13.921518325805664, -13.310432434082031, -12.699346542358398, -12.088261604309082, -11.47717571258545, -10.866090774536133, -10.2550048828125, -9.643918991088867, -9.03283405303955, -8.421748161315918, -7.810662746429443, -7.199577331542969, -6.588491439819336, -5.977406024932861, -5.366320610046387, -4.755235195159912, -4.1441497802734375, -3.5330638885498047, -2.92197847366333, -2.3108930587768555, -1.6998074054718018, -1.088721752166748, -0.47763633728027344, 0.13344919681549072, 0.7445347309112549, 1.355620265007019, 1.9667057991027832, 2.577791213989258, 3.1888768672943115, 3.7999625205993652, 4.411046981811523, 5.022132396697998, 5.633217811584473, 6.2443037033081055, 6.85538911819458, 7.466474533081055, 8.077560424804688, 8.68864631652832, 9.299731254577637, 9.91081714630127, 10.521902084350586, 11.132987976074219, 11.744073867797852, 12.355158805847168, 12.9662446975708, 13.577329635620117, 14.18841552734375, 14.799501419067383, 15.4105863571167, 16.021671295166016, 16.63275718688965, 17.24384307861328, 17.854928970336914, 18.466014862060547, 19.077098846435547, 19.68818473815918, 20.299270629882812, 20.910354614257812, 21.521440505981445, 22.132526397705078, 22.74361228942871, 23.354698181152344, 23.965784072875977]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 8.0, 10.0, 16.0, 17.0, 22.0, 41.0, 29.0, 47.0, 54.0, 79.0, 80.0, 76.0, 91.0, 66.0, 53.0, 63.0, 48.0, 49.0, 35.0, 31.0, 23.0, 14.0, 11.0, 10.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.03976058959961, -13.715754508972168, -13.391748428344727, -13.067742347717285, -12.743736267089844, -12.419730186462402, -12.095724105834961, -11.77171802520752, -11.447711944580078, -11.123705863952637, -10.799699783325195, -10.475693702697754, -10.151687622070312, -9.827681541442871, -9.50367546081543, -9.179669380187988, -8.855663299560547, -8.531657218933105, -8.207651138305664, -7.883645057678223, -7.559638977050781, -7.23563289642334, -6.911626815795898, -6.587620735168457, -6.263615608215332, -5.939609527587891, -5.615603446960449, -5.291597366333008, -4.967591285705566, -4.643585205078125, -4.319579124450684, -3.9955732822418213, -3.671566963195801, -3.3475608825683594, -3.023554801940918, -2.6995487213134766, -2.375542640686035, -2.0515365600585938, -1.7275307178497314, -1.40352463722229, -1.0795185565948486, -0.7555124759674072, -0.4315064549446106, -0.10750043392181396, 0.21650564670562744, 0.5405117273330688, 0.8645176887512207, 1.188523769378662, 1.5125298500061035, 1.836535930633545, 2.1605420112609863, 2.4845480918884277, 2.808554172515869, 3.1325602531433105, 3.456566095352173, 3.7805721759796143, 4.104578018188477, 4.428584098815918, 4.752590179443359, 5.076596260070801, 5.400602340698242, 5.724608421325684, 6.048614501953125, 6.372620582580566, 6.696626663208008]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 12.0, 13.0, 16.0, 28.0, 61.0, 84.0, 138.0, 225.0, 694.0, 19039.0, 4167372.0, 5598.0, 489.0, 191.0, 125.0, 62.0, 37.0, 25.0, 12.0, 13.0, 8.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.90301513671875, -3.7786865234375, -3.65435791015625, -3.530029296875, -3.40570068359375, -3.2813720703125, -3.15704345703125, -3.03271484375, -2.90838623046875, -2.7840576171875, -2.65972900390625, -2.535400390625, -2.41107177734375, -2.2867431640625, -2.16241455078125, -2.0380859375, -1.91375732421875, -1.7894287109375, -1.66510009765625, -1.540771484375, -1.41644287109375, -1.2921142578125, -1.16778564453125, -1.04345703125, -0.91912841796875, -0.7947998046875, -0.67047119140625, -0.546142578125, -0.42181396484375, -0.2974853515625, -0.17315673828125, -0.048828125, 0.07550048828125, 0.1998291015625, 0.32415771484375, 0.448486328125, 0.57281494140625, 0.6971435546875, 0.82147216796875, 0.94580078125, 1.07012939453125, 1.1944580078125, 1.31878662109375, 1.443115234375, 1.56744384765625, 1.6917724609375, 1.81610107421875, 1.9404296875, 2.06475830078125, 2.1890869140625, 2.31341552734375, 2.437744140625, 2.56207275390625, 2.6864013671875, 2.81072998046875, 2.93505859375, 3.05938720703125, 3.1837158203125, 3.30804443359375, 3.432373046875, 3.55670166015625, 3.6810302734375, 3.80535888671875, 3.9296875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 5.0, 4.0, 11.0, 9.0, 22.0, 22.0, 24.0, 28.0, 39.0, 32.0, 35.0, 56.0, 50.0, 69.0, 54.0, 55.0, 55.0, 47.0, 50.0, 52.0, 48.0, 34.0, 39.0, 25.0, 24.0, 22.0, 15.0, 12.0, 13.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42822265625, -0.41544342041015625, -0.4026641845703125, -0.38988494873046875, -0.377105712890625, -0.36432647705078125, -0.3515472412109375, -0.33876800537109375, -0.32598876953125, -0.31320953369140625, -0.3004302978515625, -0.28765106201171875, -0.274871826171875, -0.26209259033203125, -0.2493133544921875, -0.23653411865234375, -0.2237548828125, -0.21097564697265625, -0.1981964111328125, -0.18541717529296875, -0.172637939453125, -0.15985870361328125, -0.1470794677734375, -0.13430023193359375, -0.12152099609375, -0.10874176025390625, -0.0959625244140625, -0.08318328857421875, -0.070404052734375, -0.05762481689453125, -0.0448455810546875, -0.03206634521484375, -0.019287109375, -0.00650787353515625, 0.0062713623046875, 0.01905059814453125, 0.031829833984375, 0.04460906982421875, 0.0573883056640625, 0.07016754150390625, 0.08294677734375, 0.09572601318359375, 0.1085052490234375, 0.12128448486328125, 0.134063720703125, 0.14684295654296875, 0.1596221923828125, 0.17240142822265625, 0.1851806640625, 0.19795989990234375, 0.2107391357421875, 0.22351837158203125, 0.236297607421875, 0.24907684326171875, 0.2618560791015625, 0.27463531494140625, 0.28741455078125, 0.30019378662109375, 0.3129730224609375, 0.32575225830078125, 0.338531494140625, 0.35131072998046875, 0.3640899658203125, 0.37686920166015625, 0.3896484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 1.0, 6.0, 18.0, 19.0, 36.0, 80.0, 128.0, 249.0, 693.0, 1721.0, 4794.0, 18498.0, 132011.0, 2746952.0, 1204224.0, 66262.0, 12369.0, 3709.0, 1391.0, 595.0, 265.0, 107.0, 52.0, 36.0, 12.0, 17.0, 10.0, 9.0, 8.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6396484375, -0.6149063110351562, -0.5901641845703125, -0.5654220581054688, -0.540679931640625, -0.5159378051757812, -0.4911956787109375, -0.46645355224609375, -0.44171142578125, -0.41696929931640625, -0.3922271728515625, -0.36748504638671875, -0.342742919921875, -0.31800079345703125, -0.2932586669921875, -0.26851654052734375, -0.2437744140625, -0.21903228759765625, -0.1942901611328125, -0.16954803466796875, -0.144805908203125, -0.12006378173828125, -0.0953216552734375, -0.07057952880859375, -0.04583740234375, -0.02109527587890625, 0.0036468505859375, 0.02838897705078125, 0.053131103515625, 0.07787322998046875, 0.1026153564453125, 0.12735748291015625, 0.152099609375, 0.17684173583984375, 0.2015838623046875, 0.22632598876953125, 0.251068115234375, 0.27581024169921875, 0.3005523681640625, 0.32529449462890625, 0.35003662109375, 0.37477874755859375, 0.3995208740234375, 0.42426300048828125, 0.449005126953125, 0.47374725341796875, 0.4984893798828125, 0.5232315063476562, 0.5479736328125, 0.5727157592773438, 0.5974578857421875, 0.6222000122070312, 0.646942138671875, 0.6716842651367188, 0.6964263916015625, 0.7211685180664062, 0.74591064453125, 0.7706527709960938, 0.7953948974609375, 0.8201370239257812, 0.844879150390625, 0.8696212768554688, 0.8943634033203125, 0.9191055297851562, 0.94384765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 4.0, 16.0, 27.0, 29.0, 48.0, 85.0, 136.0, 209.0, 322.0, 595.0, 750.0, 681.0, 457.0, 263.0, 155.0, 86.0, 52.0, 41.0, 27.0, 14.0, 17.0, 6.0, 12.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6582107543945312, -0.6352691650390625, -0.6123275756835938, -0.589385986328125, -0.5664443969726562, -0.5435028076171875, -0.5205612182617188, -0.49761962890625, -0.47467803955078125, -0.4517364501953125, -0.42879486083984375, -0.405853271484375, -0.38291168212890625, -0.3599700927734375, -0.33702850341796875, -0.3140869140625, -0.29114532470703125, -0.2682037353515625, -0.24526214599609375, -0.222320556640625, -0.19937896728515625, -0.1764373779296875, -0.15349578857421875, -0.13055419921875, -0.10761260986328125, -0.0846710205078125, -0.06172943115234375, -0.038787841796875, -0.01584625244140625, 0.0070953369140625, 0.03003692626953125, 0.052978515625, 0.07592010498046875, 0.0988616943359375, 0.12180328369140625, 0.144744873046875, 0.16768646240234375, 0.1906280517578125, 0.21356964111328125, 0.23651123046875, 0.25945281982421875, 0.2823944091796875, 0.30533599853515625, 0.328277587890625, 0.35121917724609375, 0.3741607666015625, 0.39710235595703125, 0.4200439453125, 0.44298553466796875, 0.4659271240234375, 0.48886871337890625, 0.511810302734375, 0.5347518920898438, 0.5576934814453125, 0.5806350708007812, 0.60357666015625, 0.6265182495117188, 0.6494598388671875, 0.6724014282226562, 0.695343017578125, 0.7182846069335938, 0.7412261962890625, 0.7641677856445312, 0.787109375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 9.0, 18.0, 33.0, 71.0, 121.0, 170.0, 188.0, 152.0, 101.0, 61.0, 24.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.263106346130371, -7.059935092926025, -6.8567633628845215, -6.653592109680176, -6.45042085647583, -6.247249603271484, -6.0440778732299805, -5.840906620025635, -5.637735366821289, -5.434564113616943, -5.2313923835754395, -5.028221130371094, -4.825049877166748, -4.621878623962402, -4.418706893920898, -4.215535640716553, -4.012363910675049, -3.809192419052124, -3.6060211658477783, -3.4028496742248535, -3.199678421020508, -2.996506929397583, -2.793335437774658, -2.5901641845703125, -2.3869926929473877, -2.183821201324463, -1.9806499481201172, -1.7774784564971924, -1.5743070840835571, -1.3711357116699219, -1.167964220046997, -0.9647928476333618, -0.7616214752197266, -0.5584501028060913, -0.3552786707878113, -0.15210723876953125, 0.051064133644104004, 0.25423550605773926, 0.45740699768066406, 0.6605783700942993, 0.8637497425079346, 1.0669211149215698, 1.270092487335205, 1.4732639789581299, 1.6764353513717651, 1.8796067237854004, 2.082778215408325, 2.28594970703125, 2.4891209602355957, 2.6922924518585205, 2.895463705062866, 3.098635196685791, 3.3018064498901367, 3.5049779415130615, 3.7081494331359863, 3.911320686340332, 4.114492416381836, 4.317663669586182, 4.5208353996276855, 4.724006652832031, 4.927177906036377, 5.130349159240723, 5.333520889282227, 5.536692142486572, 5.739863395690918]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 12.0, 9.0, 11.0, 21.0, 24.0, 35.0, 24.0, 41.0, 37.0, 52.0, 55.0, 67.0, 64.0, 56.0, 57.0, 75.0, 52.0, 46.0, 44.0, 36.0, 35.0, 26.0, 22.0, 27.0, 9.0, 11.0, 16.0, 8.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.642759323120117, -4.523218154907227, -4.403676509857178, -4.284135341644287, -4.1645941734313965, -4.045053005218506, -3.925511360168457, -3.8059701919555664, -3.686429023742676, -3.566887617111206, -3.4473464488983154, -3.3278050422668457, -3.208263874053955, -3.0887224674224854, -2.9691810607910156, -2.849639892578125, -2.7300984859466553, -2.6105570793151855, -2.491015911102295, -2.371474504470825, -2.2519333362579346, -2.132391929626465, -2.012850761413574, -1.8933093547821045, -1.7737680673599243, -1.6542267799377441, -1.534685492515564, -1.4151442050933838, -1.295602798461914, -1.1760616302490234, -1.0565202236175537, -0.9369789361953735, -0.8174374103546143, -0.6978961229324341, -0.5783548355102539, -0.45881348848342896, -0.3392722010612488, -0.2197309136390686, -0.10018956661224365, 0.019351720809936523, 0.1388930082321167, 0.2584342956542969, 0.37797561287879944, 0.497516930103302, 0.6170582175254822, 0.7365995049476624, 0.8561408519744873, 0.9756821393966675, 1.0952234268188477, 1.2147647142410278, 1.334306001663208, 1.4538474082946777, 1.5733885765075684, 1.692929983139038, 1.8124712705612183, 1.9320125579833984, 2.051553726196289, 2.171095132827759, 2.2906363010406494, 2.410177707672119, 2.5297188758850098, 2.6492602825164795, 2.768801689147949, 2.88834285736084, 3.0078842639923096]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 9.0, 11.0, 8.0, 10.0, 19.0, 33.0, 27.0, 59.0, 98.0, 171.0, 251.0, 484.0, 850.0, 1613.0, 3381.0, 7295.0, 17736.0, 49553.0, 164758.0, 463811.0, 232218.0, 65803.0, 22846.0, 9140.0, 4043.0, 1943.0, 1012.0, 547.0, 305.0, 188.0, 101.0, 74.0, 55.0, 27.0, 18.0, 11.0, 19.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.55908203125, -0.5380859375, -0.51708984375, -0.49609375, -0.47509765625, -0.4541015625, -0.43310546875, -0.412109375, -0.39111328125, -0.3701171875, -0.34912109375, -0.328125, -0.30712890625, -0.2861328125, -0.26513671875, -0.244140625, -0.22314453125, -0.2021484375, -0.18115234375, -0.16015625, -0.13916015625, -0.1181640625, -0.09716796875, -0.076171875, -0.05517578125, -0.0341796875, -0.01318359375, 0.0078125, 0.02880859375, 0.0498046875, 0.07080078125, 0.091796875, 0.11279296875, 0.1337890625, 0.15478515625, 0.17578125, 0.19677734375, 0.2177734375, 0.23876953125, 0.259765625, 0.28076171875, 0.3017578125, 0.32275390625, 0.34375, 0.36474609375, 0.3857421875, 0.40673828125, 0.427734375, 0.44873046875, 0.4697265625, 0.49072265625, 0.51171875, 0.53271484375, 0.5537109375, 0.57470703125, 0.595703125, 0.61669921875, 0.6376953125, 0.65869140625, 0.6796875, 0.70068359375, 0.7216796875, 0.74267578125, 0.763671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 6.0, 14.0, 24.0, 25.0, 26.0, 26.0, 45.0, 48.0, 51.0, 60.0, 63.0, 71.0, 62.0, 55.0, 51.0, 62.0, 58.0, 37.0, 39.0, 38.0, 34.0, 17.0, 19.0, 7.0, 10.0, 10.0, 4.0, 2.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.459228515625, -0.44503021240234375, -0.4308319091796875, -0.41663360595703125, -0.402435302734375, -0.38823699951171875, -0.3740386962890625, -0.35984039306640625, -0.34564208984375, -0.33144378662109375, -0.3172454833984375, -0.30304718017578125, -0.288848876953125, -0.27465057373046875, -0.2604522705078125, -0.24625396728515625, -0.2320556640625, -0.21785736083984375, -0.2036590576171875, -0.18946075439453125, -0.175262451171875, -0.16106414794921875, -0.1468658447265625, -0.13266754150390625, -0.11846923828125, -0.10427093505859375, -0.0900726318359375, -0.07587432861328125, -0.061676025390625, -0.04747772216796875, -0.0332794189453125, -0.01908111572265625, -0.0048828125, 0.00931549072265625, 0.0235137939453125, 0.03771209716796875, 0.051910400390625, 0.06610870361328125, 0.0803070068359375, 0.09450531005859375, 0.10870361328125, 0.12290191650390625, 0.1371002197265625, 0.15129852294921875, 0.165496826171875, 0.17969512939453125, 0.1938934326171875, 0.20809173583984375, 0.2222900390625, 0.23648834228515625, 0.2506866455078125, 0.26488494873046875, 0.279083251953125, 0.29328155517578125, 0.3074798583984375, 0.32167816162109375, 0.33587646484375, 0.35007476806640625, 0.3642730712890625, 0.37847137451171875, 0.392669677734375, 0.40686798095703125, 0.4210662841796875, 0.43526458740234375, 0.449462890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 8.0, 8.0, 7.0, 22.0, 17.0, 38.0, 57.0, 84.0, 127.0, 269.0, 545.0, 1369.0, 4961.0, 34705.0, 623730.0, 353335.0, 23174.0, 3869.0, 1191.0, 462.0, 222.0, 121.0, 62.0, 45.0, 33.0, 19.0, 15.0, 13.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.4949493408203125, -1.444976806640625, -1.3950042724609375, -1.34503173828125, -1.2950592041015625, -1.245086669921875, -1.1951141357421875, -1.1451416015625, -1.0951690673828125, -1.045196533203125, -0.9952239990234375, -0.94525146484375, -0.8952789306640625, -0.845306396484375, -0.7953338623046875, -0.745361328125, -0.6953887939453125, -0.645416259765625, -0.5954437255859375, -0.54547119140625, -0.4954986572265625, -0.445526123046875, -0.3955535888671875, -0.3455810546875, -0.2956085205078125, -0.245635986328125, -0.1956634521484375, -0.14569091796875, -0.0957183837890625, -0.045745849609375, 0.0042266845703125, 0.05419921875, 0.1041717529296875, 0.154144287109375, 0.2041168212890625, 0.25408935546875, 0.3040618896484375, 0.354034423828125, 0.4040069580078125, 0.4539794921875, 0.5039520263671875, 0.553924560546875, 0.6038970947265625, 0.65386962890625, 0.7038421630859375, 0.753814697265625, 0.8037872314453125, 0.853759765625, 0.9037322998046875, 0.953704833984375, 1.0036773681640625, 1.05364990234375, 1.1036224365234375, 1.153594970703125, 1.2035675048828125, 1.2535400390625, 1.3035125732421875, 1.353485107421875, 1.4034576416015625, 1.45343017578125, 1.5034027099609375, 1.553375244140625, 1.6033477783203125, 1.6533203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 6.0, 11.0, 15.0, 12.0, 19.0, 16.0, 16.0, 23.0, 20.0, 35.0, 40.0, 31.0, 39.0, 38.0, 40.0, 46.0, 38.0, 37.0, 42.0, 38.0, 33.0, 54.0, 33.0, 26.0, 27.0, 23.0, 31.0, 28.0, 24.0, 12.0, 29.0, 15.0, 18.0, 14.0, 10.0, 8.0, 3.0, 4.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.373046875, -1.3340301513671875, -1.295013427734375, -1.2559967041015625, -1.21697998046875, -1.1779632568359375, -1.138946533203125, -1.0999298095703125, -1.0609130859375, -1.0218963623046875, -0.982879638671875, -0.9438629150390625, -0.90484619140625, -0.8658294677734375, -0.826812744140625, -0.7877960205078125, -0.748779296875, -0.7097625732421875, -0.670745849609375, -0.6317291259765625, -0.59271240234375, -0.5536956787109375, -0.514678955078125, -0.4756622314453125, -0.4366455078125, -0.3976287841796875, -0.358612060546875, -0.3195953369140625, -0.28057861328125, -0.2415618896484375, -0.202545166015625, -0.1635284423828125, -0.12451171875, -0.0854949951171875, -0.046478271484375, -0.0074615478515625, 0.03155517578125, 0.0705718994140625, 0.109588623046875, 0.1486053466796875, 0.1876220703125, 0.2266387939453125, 0.265655517578125, 0.3046722412109375, 0.34368896484375, 0.3827056884765625, 0.421722412109375, 0.4607391357421875, 0.499755859375, 0.5387725830078125, 0.577789306640625, 0.6168060302734375, 0.65582275390625, 0.6948394775390625, 0.733856201171875, 0.7728729248046875, 0.8118896484375, 0.8509063720703125, 0.889923095703125, 0.9289398193359375, 0.96795654296875, 1.0069732666015625, 1.045989990234375, 1.0850067138671875, 1.1240234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 12.0, 21.0, 29.0, 49.0, 87.0, 163.0, 432.0, 1394.0, 9782.0, 830160.0, 199232.0, 5466.0, 1028.0, 331.0, 144.0, 81.0, 39.0, 25.0, 17.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.35546875, -1.30853271484375, -1.2615966796875, -1.21466064453125, -1.167724609375, -1.12078857421875, -1.0738525390625, -1.02691650390625, -0.97998046875, -0.93304443359375, -0.8861083984375, -0.83917236328125, -0.792236328125, -0.74530029296875, -0.6983642578125, -0.65142822265625, -0.6044921875, -0.55755615234375, -0.5106201171875, -0.46368408203125, -0.416748046875, -0.36981201171875, -0.3228759765625, -0.27593994140625, -0.22900390625, -0.18206787109375, -0.1351318359375, -0.08819580078125, -0.041259765625, 0.00567626953125, 0.0526123046875, 0.09954833984375, 0.146484375, 0.19342041015625, 0.2403564453125, 0.28729248046875, 0.334228515625, 0.38116455078125, 0.4281005859375, 0.47503662109375, 0.52197265625, 0.56890869140625, 0.6158447265625, 0.66278076171875, 0.709716796875, 0.75665283203125, 0.8035888671875, 0.85052490234375, 0.8974609375, 0.94439697265625, 0.9913330078125, 1.03826904296875, 1.085205078125, 1.13214111328125, 1.1790771484375, 1.22601318359375, 1.27294921875, 1.31988525390625, 1.3668212890625, 1.41375732421875, 1.460693359375, 1.50762939453125, 1.5545654296875, 1.60150146484375, 1.6484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 8.0, 15.0, 21.0, 31.0, 24.0, 62.0, 127.0, 212.0, 211.0, 97.0, 52.0, 42.0, 24.0, 18.0, 9.0, 5.0, 4.0, 8.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001881122589111328, -0.00018220767378807068, -0.00017630308866500854, -0.0001703985035419464, -0.00016449391841888428, -0.00015858933329582214, -0.00015268474817276, -0.00014678016304969788, -0.00014087557792663574, -0.0001349709928035736, -0.00012906640768051147, -0.00012316182255744934, -0.00011725723743438721, -0.00011135265231132507, -0.00010544806718826294, -9.95434820652008e-05, -9.363889694213867e-05, -8.773431181907654e-05, -8.18297266960144e-05, -7.592514157295227e-05, -7.002055644989014e-05, -6.4115971326828e-05, -5.821138620376587e-05, -5.2306801080703735e-05, -4.64022159576416e-05, -4.049763083457947e-05, -3.4593045711517334e-05, -2.86884605884552e-05, -2.2783875465393066e-05, -1.6879290342330933e-05, -1.0974705219268799e-05, -5.070120096206665e-06, 8.344650268554688e-07, 6.7390501499176025e-06, 1.2643635272979736e-05, 1.854822039604187e-05, 2.4452805519104004e-05, 3.0357390642166138e-05, 3.626197576522827e-05, 4.2166560888290405e-05, 4.807114601135254e-05, 5.397573113441467e-05, 5.988031625747681e-05, 6.578490138053894e-05, 7.168948650360107e-05, 7.759407162666321e-05, 8.349865674972534e-05, 8.940324187278748e-05, 9.530782699584961e-05, 0.00010121241211891174, 0.00010711699724197388, 0.00011302158236503601, 0.00011892616748809814, 0.00012483075261116028, 0.0001307353377342224, 0.00013663992285728455, 0.00014254450798034668, 0.0001484490931034088, 0.00015435367822647095, 0.00016025826334953308, 0.00016616284847259521, 0.00017206743359565735, 0.00017797201871871948, 0.00018387660384178162, 0.00018978118896484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 8.0, 15.0, 37.0, 55.0, 85.0, 133.0, 319.0, 1013.0, 4872.0, 53938.0, 939274.0, 42952.0, 4236.0, 944.0, 331.0, 130.0, 89.0, 41.0, 21.0, 18.0, 9.0, 10.0, 8.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1220703125, -1.0875091552734375, -1.052947998046875, -1.0183868408203125, -0.98382568359375, -0.9492645263671875, -0.914703369140625, -0.8801422119140625, -0.8455810546875, -0.8110198974609375, -0.776458740234375, -0.7418975830078125, -0.70733642578125, -0.6727752685546875, -0.638214111328125, -0.6036529541015625, -0.569091796875, -0.5345306396484375, -0.499969482421875, -0.4654083251953125, -0.43084716796875, -0.3962860107421875, -0.361724853515625, -0.3271636962890625, -0.2926025390625, -0.2580413818359375, -0.223480224609375, -0.1889190673828125, -0.15435791015625, -0.1197967529296875, -0.085235595703125, -0.0506744384765625, -0.01611328125, 0.0184478759765625, 0.053009033203125, 0.0875701904296875, 0.12213134765625, 0.1566925048828125, 0.191253662109375, 0.2258148193359375, 0.2603759765625, 0.2949371337890625, 0.329498291015625, 0.3640594482421875, 0.39862060546875, 0.4331817626953125, 0.467742919921875, 0.5023040771484375, 0.536865234375, 0.5714263916015625, 0.605987548828125, 0.6405487060546875, 0.67510986328125, 0.7096710205078125, 0.744232177734375, 0.7787933349609375, 0.8133544921875, 0.8479156494140625, 0.882476806640625, 0.9170379638671875, 0.95159912109375, 0.9861602783203125, 1.020721435546875, 1.0552825927734375, 1.08984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 7.0, 12.0, 12.0, 33.0, 43.0, 55.0, 118.0, 128.0, 182.0, 141.0, 112.0, 59.0, 37.0, 20.0, 16.0, 9.0, 3.0, 5.0, 3.0, 0.0, 9.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98486328125, -0.960479736328125, -0.93609619140625, -0.911712646484375, -0.8873291015625, -0.862945556640625, -0.83856201171875, -0.814178466796875, -0.789794921875, -0.765411376953125, -0.74102783203125, -0.716644287109375, -0.6922607421875, -0.667877197265625, -0.64349365234375, -0.619110107421875, -0.5947265625, -0.570343017578125, -0.54595947265625, -0.521575927734375, -0.4971923828125, -0.472808837890625, -0.44842529296875, -0.424041748046875, -0.399658203125, -0.375274658203125, -0.35089111328125, -0.326507568359375, -0.3021240234375, -0.277740478515625, -0.25335693359375, -0.228973388671875, -0.20458984375, -0.180206298828125, -0.15582275390625, -0.131439208984375, -0.1070556640625, -0.082672119140625, -0.05828857421875, -0.033905029296875, -0.009521484375, 0.014862060546875, 0.03924560546875, 0.063629150390625, 0.0880126953125, 0.112396240234375, 0.13677978515625, 0.161163330078125, 0.185546875, 0.209930419921875, 0.23431396484375, 0.258697509765625, 0.2830810546875, 0.307464599609375, 0.33184814453125, 0.356231689453125, 0.380615234375, 0.404998779296875, 0.42938232421875, 0.453765869140625, 0.4781494140625, 0.502532958984375, 0.52691650390625, 0.551300048828125, 0.57568359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 50.0, 610.0, 296.0, 33.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.84895324707031, -62.61444091796875, -61.37992858886719, -60.14541244506836, -58.9109001159668, -57.676387786865234, -56.44187545776367, -55.20736312866211, -53.97284698486328, -52.73833465576172, -51.503822326660156, -50.26930618286133, -49.034793853759766, -47.8002815246582, -46.56576919555664, -45.33125686645508, -44.096744537353516, -42.86223220825195, -41.62771987915039, -40.39320373535156, -39.15869140625, -37.92417907714844, -36.689666748046875, -35.45515441894531, -34.22064208984375, -32.98612976074219, -31.751615524291992, -30.51710319519043, -29.282588958740234, -28.048076629638672, -26.81356430053711, -25.579051971435547, -24.344532012939453, -23.11001968383789, -21.875505447387695, -20.640993118286133, -19.406478881835938, -18.171966552734375, -16.937454223632812, -15.702940940856934, -14.468427658081055, -13.233914375305176, -11.999401092529297, -10.764888763427734, -9.530375480651855, -8.295862197875977, -7.061349391937256, -5.826836585998535, -4.592323303222656, -3.3578102588653564, -2.1232972145080566, -0.8887841701507568, 0.34572887420654297, 1.5802421569824219, 2.8147549629211426, 4.049267768859863, 5.283781051635742, 6.518294334411621, 7.752807140350342, 8.987319946289062, 10.221833229064941, 11.45634651184082, 12.690858840942383, 13.925372123718262, 15.15988540649414]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 7.0, 9.0, 5.0, 10.0, 5.0, 11.0, 22.0, 15.0, 19.0, 39.0, 19.0, 33.0, 37.0, 34.0, 33.0, 58.0, 44.0, 61.0, 62.0, 51.0, 73.0, 43.0, 34.0, 45.0, 31.0, 30.0, 20.0, 24.0, 24.0, 13.0, 20.0, 11.0, 14.0, 10.0, 9.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.476282596588135, -6.281581401824951, -6.086880207061768, -5.892179012298584, -5.6974778175354, -5.502776622772217, -5.308074951171875, -5.113373756408691, -4.918672561645508, -4.723971366882324, -4.529270172119141, -4.334568977355957, -4.139867782592773, -3.94516658782959, -3.750465154647827, -3.5557639598846436, -3.361063003540039, -3.1663618087768555, -2.971660614013672, -2.7769594192504883, -2.5822582244873047, -2.387557029724121, -2.1928555965423584, -1.9981544017791748, -1.8034532070159912, -1.6087520122528076, -1.414050817489624, -1.2193495035171509, -1.0246483087539673, -0.8299471139907837, -0.6352458000183105, -0.44054460525512695, -0.24584388732910156, -0.05114266276359558, 0.1435585618019104, 0.33825981616973877, 0.5329610109329224, 0.727662205696106, 0.9223635196685791, 1.1170647144317627, 1.3117659091949463, 1.5064671039581299, 1.7011682987213135, 1.8958696126937866, 2.0905709266662598, 2.2852721214294434, 2.479973316192627, 2.6746745109558105, 2.869375705718994, 3.0640769004821777, 3.2587780952453613, 3.453479290008545, 3.6481804847717285, 3.842881679534912, 4.037583351135254, 4.2322845458984375, 4.426985740661621, 4.621686935424805, 4.816388130187988, 5.011089324951172, 5.2057905197143555, 5.400491714477539, 5.595192909240723, 5.789894104003906, 5.98459529876709]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 3.0, 11.0, 7.0, 21.0, 27.0, 43.0, 81.0, 185.0, 455.0, 2005.0, 15524.0, 605888.0, 3498860.0, 64604.0, 5054.0, 935.0, 273.0, 131.0, 67.0, 41.0, 22.0, 18.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93310546875, -0.8975448608398438, -0.8619842529296875, -0.8264236450195312, -0.790863037109375, -0.7553024291992188, -0.7197418212890625, -0.6841812133789062, -0.64862060546875, -0.6130599975585938, -0.5774993896484375, -0.5419387817382812, -0.506378173828125, -0.47081756591796875, -0.4352569580078125, -0.39969635009765625, -0.3641357421875, -0.32857513427734375, -0.2930145263671875, -0.25745391845703125, -0.221893310546875, -0.18633270263671875, -0.1507720947265625, -0.11521148681640625, -0.07965087890625, -0.04409027099609375, -0.0085296630859375, 0.02703094482421875, 0.062591552734375, 0.09815216064453125, 0.1337127685546875, 0.16927337646484375, 0.204833984375, 0.24039459228515625, 0.2759552001953125, 0.31151580810546875, 0.347076416015625, 0.38263702392578125, 0.4181976318359375, 0.45375823974609375, 0.48931884765625, 0.5248794555664062, 0.5604400634765625, 0.5960006713867188, 0.631561279296875, 0.6671218872070312, 0.7026824951171875, 0.7382431030273438, 0.7738037109375, 0.8093643188476562, 0.8449249267578125, 0.8804855346679688, 0.916046142578125, 0.9516067504882812, 0.9871673583984375, 1.0227279663085938, 1.05828857421875, 1.0938491821289062, 1.1294097900390625, 1.1649703979492188, 1.200531005859375, 1.2360916137695312, 1.2716522216796875, 1.3072128295898438, 1.3427734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 14.0, 9.0, 22.0, 44.0, 40.0, 46.0, 68.0, 59.0, 66.0, 67.0, 86.0, 73.0, 74.0, 56.0, 56.0, 42.0, 37.0, 32.0, 31.0, 13.0, 14.0, 11.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.59619140625, -0.5814704895019531, -0.5667495727539062, -0.5520286560058594, -0.5373077392578125, -0.5225868225097656, -0.5078659057617188, -0.4931449890136719, -0.478424072265625, -0.4637031555175781, -0.44898223876953125, -0.4342613220214844, -0.4195404052734375, -0.4048194885253906, -0.39009857177734375, -0.3753776550292969, -0.36065673828125, -0.3459358215332031, -0.33121490478515625, -0.3164939880371094, -0.3017730712890625, -0.2870521545410156, -0.27233123779296875, -0.2576103210449219, -0.242889404296875, -0.22816848754882812, -0.21344757080078125, -0.19872665405273438, -0.1840057373046875, -0.16928482055664062, -0.15456390380859375, -0.13984298706054688, -0.1251220703125, -0.11040115356445312, -0.09568023681640625, -0.08095932006835938, -0.0662384033203125, -0.051517486572265625, -0.03679656982421875, -0.022075653076171875, -0.007354736328125, 0.007366180419921875, 0.02208709716796875, 0.036808013916015625, 0.0515289306640625, 0.06624984741210938, 0.08097076416015625, 0.09569168090820312, 0.11041259765625, 0.12513351440429688, 0.13985443115234375, 0.15457534790039062, 0.1692962646484375, 0.18401718139648438, 0.19873809814453125, 0.21345901489257812, 0.228179931640625, 0.24290084838867188, 0.25762176513671875, 0.2723426818847656, 0.2870635986328125, 0.3017845153808594, 0.31650543212890625, 0.3312263488769531, 0.345947265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 16.0, 18.0, 22.0, 46.0, 54.0, 83.0, 134.0, 226.0, 582.0, 2345.0, 24411.0, 1466103.0, 2658334.0, 37096.0, 3546.0, 743.0, 232.0, 109.0, 74.0, 37.0, 28.0, 15.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4873046875, -1.447174072265625, -1.40704345703125, -1.366912841796875, -1.3267822265625, -1.286651611328125, -1.24652099609375, -1.206390380859375, -1.166259765625, -1.126129150390625, -1.08599853515625, -1.045867919921875, -1.0057373046875, -0.965606689453125, -0.92547607421875, -0.885345458984375, -0.84521484375, -0.805084228515625, -0.76495361328125, -0.724822998046875, -0.6846923828125, -0.644561767578125, -0.60443115234375, -0.564300537109375, -0.524169921875, -0.484039306640625, -0.44390869140625, -0.403778076171875, -0.3636474609375, -0.323516845703125, -0.28338623046875, -0.243255615234375, -0.203125, -0.162994384765625, -0.12286376953125, -0.082733154296875, -0.0426025390625, -0.002471923828125, 0.03765869140625, 0.077789306640625, 0.117919921875, 0.158050537109375, 0.19818115234375, 0.238311767578125, 0.2784423828125, 0.318572998046875, 0.35870361328125, 0.398834228515625, 0.43896484375, 0.479095458984375, 0.51922607421875, 0.559356689453125, 0.5994873046875, 0.639617919921875, 0.67974853515625, 0.719879150390625, 0.760009765625, 0.800140380859375, 0.84027099609375, 0.880401611328125, 0.9205322265625, 0.960662841796875, 1.00079345703125, 1.040924072265625, 1.0810546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 10.0, 15.0, 18.0, 37.0, 69.0, 112.0, 253.0, 528.0, 992.0, 934.0, 506.0, 264.0, 142.0, 69.0, 42.0, 27.0, 23.0, 12.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.365386962890625, -1.33038330078125, -1.295379638671875, -1.2603759765625, -1.225372314453125, -1.19036865234375, -1.155364990234375, -1.120361328125, -1.085357666015625, -1.05035400390625, -1.015350341796875, -0.9803466796875, -0.945343017578125, -0.91033935546875, -0.875335693359375, -0.84033203125, -0.805328369140625, -0.77032470703125, -0.735321044921875, -0.7003173828125, -0.665313720703125, -0.63031005859375, -0.595306396484375, -0.560302734375, -0.525299072265625, -0.49029541015625, -0.455291748046875, -0.4202880859375, -0.385284423828125, -0.35028076171875, -0.315277099609375, -0.2802734375, -0.245269775390625, -0.21026611328125, -0.175262451171875, -0.1402587890625, -0.105255126953125, -0.07025146484375, -0.035247802734375, -0.000244140625, 0.034759521484375, 0.06976318359375, 0.104766845703125, 0.1397705078125, 0.174774169921875, 0.20977783203125, 0.244781494140625, 0.27978515625, 0.314788818359375, 0.34979248046875, 0.384796142578125, 0.4197998046875, 0.454803466796875, 0.48980712890625, 0.524810791015625, 0.559814453125, 0.594818115234375, 0.62982177734375, 0.664825439453125, 0.6998291015625, 0.734832763671875, 0.76983642578125, 0.804840087890625, 0.83984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 13.0, 10.0, 26.0, 35.0, 73.0, 112.0, 169.0, 204.0, 160.0, 88.0, 42.0, 28.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.139776229858398, -6.878053188323975, -6.616330623626709, -6.354607582092285, -6.0928850173950195, -5.831161975860596, -5.569438934326172, -5.307716369628906, -5.045993328094482, -4.784270286560059, -4.522547721862793, -4.260824680328369, -3.9991018772125244, -3.7373790740966797, -3.475656032562256, -3.213933229446411, -2.9522104263305664, -2.6904876232147217, -2.428764820098877, -2.167041778564453, -1.9053189754486084, -1.6435961723327637, -1.3818732500076294, -1.1201503276824951, -0.8584275245666504, -0.5967046618461609, -0.3349817991256714, -0.07325893640518188, 0.18846392631530762, 0.45018672943115234, 0.7119096517562866, 0.9736325740814209, 1.2353553771972656, 1.4970781803131104, 1.7588011026382446, 2.020524024963379, 2.2822468280792236, 2.5439696311950684, 2.805692672729492, 3.067415475845337, 3.3291382789611816, 3.5908610820770264, 3.852583885192871, 4.114306926727295, 4.376029968261719, 4.637752532958984, 4.899475574493408, 5.161198616027832, 5.422921180725098, 5.6846442222595215, 5.946366786956787, 6.208089828491211, 6.469812393188477, 6.7315354347229, 6.993258476257324, 7.25498104095459, 7.516704082489014, 7.7784271240234375, 8.040149688720703, 8.301872253417969, 8.56359577178955, 8.825318336486816, 9.087040901184082, 9.348764419555664, 9.61048698425293]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 13.0, 13.0, 6.0, 21.0, 25.0, 30.0, 31.0, 53.0, 45.0, 45.0, 65.0, 59.0, 48.0, 54.0, 52.0, 53.0, 49.0, 53.0, 39.0, 53.0, 35.0, 23.0, 33.0, 20.0, 11.0, 16.0, 14.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.302152633666992, -4.156752586364746, -4.0113525390625, -3.865952968597412, -3.720552921295166, -3.57515287399292, -3.429753065109253, -3.284353256225586, -3.13895320892334, -2.9935531616210938, -2.8481533527374268, -2.7027535438537598, -2.5573534965515137, -2.4119534492492676, -2.2665536403656006, -2.1211538314819336, -1.9757537841796875, -1.830353856086731, -1.6849539279937744, -1.5395539999008179, -1.3941540718078613, -1.2487541437149048, -1.1033542156219482, -0.9579542875289917, -0.8125543594360352, -0.6671544313430786, -0.5217545032501221, -0.3763545751571655, -0.23095464706420898, -0.08555471897125244, 0.0598452091217041, 0.20524513721466064, 0.3506450653076172, 0.49604499340057373, 0.6414449214935303, 0.7868448495864868, 0.9322447776794434, 1.0776447057724, 1.2230446338653564, 1.368444561958313, 1.5138444900512695, 1.659244418144226, 1.8046443462371826, 1.9500442743301392, 2.0954442024230957, 2.240844249725342, 2.386244058609009, 2.531643867492676, 2.677043914794922, 2.822443962097168, 2.967843770980835, 3.113243579864502, 3.258643627166748, 3.404043674468994, 3.549443483352661, 3.694843292236328, 3.840243339538574, 3.9856433868408203, 4.131043434143066, 4.276443004608154, 4.4218430519104, 4.5672430992126465, 4.712642669677734, 4.8580427169799805, 5.003442764282227]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 6.0, 15.0, 23.0, 28.0, 39.0, 81.0, 110.0, 178.0, 340.0, 634.0, 1176.0, 2464.0, 5841.0, 15658.0, 44788.0, 133596.0, 367881.0, 311035.0, 106542.0, 36131.0, 12758.0, 4793.0, 2109.0, 972.0, 567.0, 301.0, 168.0, 112.0, 70.0, 46.0, 24.0, 15.0, 14.0, 6.0, 5.0, 9.0, 2.0, 0.0, 0.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6025390625, -0.5816879272460938, -0.5608367919921875, -0.5399856567382812, -0.519134521484375, -0.49828338623046875, -0.4774322509765625, -0.45658111572265625, -0.43572998046875, -0.41487884521484375, -0.3940277099609375, -0.37317657470703125, -0.352325439453125, -0.33147430419921875, -0.3106231689453125, -0.28977203369140625, -0.2689208984375, -0.24806976318359375, -0.2272186279296875, -0.20636749267578125, -0.185516357421875, -0.16466522216796875, -0.1438140869140625, -0.12296295166015625, -0.10211181640625, -0.08126068115234375, -0.0604095458984375, -0.03955841064453125, -0.018707275390625, 0.00214385986328125, 0.0229949951171875, 0.04384613037109375, 0.064697265625, 0.08554840087890625, 0.1063995361328125, 0.12725067138671875, 0.148101806640625, 0.16895294189453125, 0.1898040771484375, 0.21065521240234375, 0.23150634765625, 0.25235748291015625, 0.2732086181640625, 0.29405975341796875, 0.314910888671875, 0.33576202392578125, 0.3566131591796875, 0.37746429443359375, 0.3983154296875, 0.41916656494140625, 0.4400177001953125, 0.46086883544921875, 0.481719970703125, 0.5025711059570312, 0.5234222412109375, 0.5442733764648438, 0.56512451171875, 0.5859756469726562, 0.6068267822265625, 0.6276779174804688, 0.648529052734375, 0.6693801879882812, 0.6902313232421875, 0.7110824584960938, 0.73193359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 2.0, 6.0, 4.0, 17.0, 17.0, 20.0, 26.0, 33.0, 61.0, 62.0, 46.0, 67.0, 72.0, 77.0, 63.0, 77.0, 66.0, 55.0, 64.0, 41.0, 29.0, 22.0, 16.0, 15.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5428619384765625, -0.528106689453125, -0.5133514404296875, -0.49859619140625, -0.4838409423828125, -0.469085693359375, -0.4543304443359375, -0.4395751953125, -0.4248199462890625, -0.410064697265625, -0.3953094482421875, -0.38055419921875, -0.3657989501953125, -0.351043701171875, -0.3362884521484375, -0.321533203125, -0.3067779541015625, -0.292022705078125, -0.2772674560546875, -0.26251220703125, -0.2477569580078125, -0.233001708984375, -0.2182464599609375, -0.2034912109375, -0.1887359619140625, -0.173980712890625, -0.1592254638671875, -0.14447021484375, -0.1297149658203125, -0.114959716796875, -0.1002044677734375, -0.08544921875, -0.0706939697265625, -0.055938720703125, -0.0411834716796875, -0.02642822265625, -0.0116729736328125, 0.003082275390625, 0.0178375244140625, 0.0325927734375, 0.0473480224609375, 0.062103271484375, 0.0768585205078125, 0.09161376953125, 0.1063690185546875, 0.121124267578125, 0.1358795166015625, 0.150634765625, 0.1653900146484375, 0.180145263671875, 0.1949005126953125, 0.20965576171875, 0.2244110107421875, 0.239166259765625, 0.2539215087890625, 0.2686767578125, 0.2834320068359375, 0.298187255859375, 0.3129425048828125, 0.32769775390625, 0.3424530029296875, 0.357208251953125, 0.3719635009765625, 0.38671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 4.0, 3.0, 7.0, 10.0, 17.0, 21.0, 33.0, 47.0, 44.0, 84.0, 107.0, 171.0, 225.0, 350.0, 535.0, 885.0, 1668.0, 3315.0, 8943.0, 35826.0, 240720.0, 650801.0, 78874.0, 15372.0, 5052.0, 2317.0, 1112.0, 652.0, 445.0, 282.0, 173.0, 130.0, 93.0, 65.0, 37.0, 30.0, 27.0, 17.0, 19.0, 7.0, 7.0, 6.0, 5.0, 2.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.095703125, -1.0594482421875, -1.023193359375, -0.9869384765625, -0.95068359375, -0.9144287109375, -0.878173828125, -0.8419189453125, -0.8056640625, -0.7694091796875, -0.733154296875, -0.6968994140625, -0.66064453125, -0.6243896484375, -0.588134765625, -0.5518798828125, -0.515625, -0.4793701171875, -0.443115234375, -0.4068603515625, -0.37060546875, -0.3343505859375, -0.298095703125, -0.2618408203125, -0.2255859375, -0.1893310546875, -0.153076171875, -0.1168212890625, -0.08056640625, -0.0443115234375, -0.008056640625, 0.0281982421875, 0.064453125, 0.1007080078125, 0.136962890625, 0.1732177734375, 0.20947265625, 0.2457275390625, 0.281982421875, 0.3182373046875, 0.3544921875, 0.3907470703125, 0.427001953125, 0.4632568359375, 0.49951171875, 0.5357666015625, 0.572021484375, 0.6082763671875, 0.64453125, 0.6807861328125, 0.717041015625, 0.7532958984375, 0.78955078125, 0.8258056640625, 0.862060546875, 0.8983154296875, 0.9345703125, 0.9708251953125, 1.007080078125, 1.0433349609375, 1.07958984375, 1.1158447265625, 1.152099609375, 1.1883544921875, 1.224609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 8.0, 5.0, 5.0, 13.0, 21.0, 22.0, 30.0, 25.0, 23.0, 33.0, 41.0, 47.0, 44.0, 62.0, 68.0, 46.0, 59.0, 51.0, 54.0, 45.0, 37.0, 38.0, 38.0, 27.0, 25.0, 25.0, 16.0, 10.0, 15.0, 11.0, 11.0, 13.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.4554290771484375, -1.404998779296875, -1.3545684814453125, -1.30413818359375, -1.2537078857421875, -1.203277587890625, -1.1528472900390625, -1.1024169921875, -1.0519866943359375, -1.001556396484375, -0.9511260986328125, -0.90069580078125, -0.8502655029296875, -0.799835205078125, -0.7494049072265625, -0.698974609375, -0.6485443115234375, -0.598114013671875, -0.5476837158203125, -0.49725341796875, -0.4468231201171875, -0.396392822265625, -0.3459625244140625, -0.2955322265625, -0.2451019287109375, -0.194671630859375, -0.1442413330078125, -0.09381103515625, -0.0433807373046875, 0.007049560546875, 0.0574798583984375, 0.10791015625, 0.1583404541015625, 0.208770751953125, 0.2592010498046875, 0.30963134765625, 0.3600616455078125, 0.410491943359375, 0.4609222412109375, 0.5113525390625, 0.5617828369140625, 0.612213134765625, 0.6626434326171875, 0.71307373046875, 0.7635040283203125, 0.813934326171875, 0.8643646240234375, 0.914794921875, 0.9652252197265625, 1.015655517578125, 1.0660858154296875, 1.11651611328125, 1.1669464111328125, 1.217376708984375, 1.2678070068359375, 1.3182373046875, 1.3686676025390625, 1.419097900390625, 1.4695281982421875, 1.51995849609375, 1.5703887939453125, 1.620819091796875, 1.6712493896484375, 1.7216796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 10.0, 3.0, 9.0, 10.0, 20.0, 45.0, 69.0, 106.0, 177.0, 338.0, 571.0, 1348.0, 3349.0, 11146.0, 151237.0, 845982.0, 25188.0, 5150.0, 1955.0, 887.0, 403.0, 220.0, 133.0, 68.0, 63.0, 30.0, 11.0, 8.0, 5.0, 3.0, 6.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.068878173828125, -1.03228759765625, -0.995697021484375, -0.9591064453125, -0.922515869140625, -0.88592529296875, -0.849334716796875, -0.812744140625, -0.776153564453125, -0.73956298828125, -0.702972412109375, -0.6663818359375, -0.629791259765625, -0.59320068359375, -0.556610107421875, -0.52001953125, -0.483428955078125, -0.44683837890625, -0.410247802734375, -0.3736572265625, -0.337066650390625, -0.30047607421875, -0.263885498046875, -0.227294921875, -0.190704345703125, -0.15411376953125, -0.117523193359375, -0.0809326171875, -0.044342041015625, -0.00775146484375, 0.028839111328125, 0.0654296875, 0.102020263671875, 0.13861083984375, 0.175201416015625, 0.2117919921875, 0.248382568359375, 0.28497314453125, 0.321563720703125, 0.358154296875, 0.394744873046875, 0.43133544921875, 0.467926025390625, 0.5045166015625, 0.541107177734375, 0.57769775390625, 0.614288330078125, 0.65087890625, 0.687469482421875, 0.72406005859375, 0.760650634765625, 0.7972412109375, 0.833831787109375, 0.87042236328125, 0.907012939453125, 0.943603515625, 0.980194091796875, 1.01678466796875, 1.053375244140625, 1.0899658203125, 1.126556396484375, 1.16314697265625, 1.199737548828125, 1.236328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 18.0, 34.0, 40.0, 60.0, 78.0, 200.0, 246.0, 99.0, 63.0, 43.0, 38.0, 20.0, 15.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002491474151611328, -0.0002399645745754242, -0.00023078173398971558, -0.00022159889340400696, -0.00021241605281829834, -0.00020323321223258972, -0.0001940503716468811, -0.00018486753106117249, -0.00017568469047546387, -0.00016650184988975525, -0.00015731900930404663, -0.000148136168718338, -0.0001389533281326294, -0.00012977048754692078, -0.00012058764696121216, -0.00011140480637550354, -0.00010222196578979492, -9.30391252040863e-05, -8.385628461837769e-05, -7.467344403266907e-05, -6.549060344696045e-05, -5.630776286125183e-05, -4.712492227554321e-05, -3.7942081689834595e-05, -2.8759241104125977e-05, -1.957640051841736e-05, -1.039355993270874e-05, -1.210719347000122e-06, 7.972121238708496e-06, 1.7154961824417114e-05, 2.6337802410125732e-05, 3.552064299583435e-05, 4.470348358154297e-05, 5.388632416725159e-05, 6.30691647529602e-05, 7.225200533866882e-05, 8.143484592437744e-05, 9.061768651008606e-05, 9.980052709579468e-05, 0.0001089833676815033, 0.00011816620826721191, 0.00012734904885292053, 0.00013653188943862915, 0.00014571473002433777, 0.0001548975706100464, 0.000164080411195755, 0.00017326325178146362, 0.00018244609236717224, 0.00019162893295288086, 0.00020081177353858948, 0.0002099946141242981, 0.00021917745471000671, 0.00022836029529571533, 0.00023754313588142395, 0.00024672597646713257, 0.0002559088170528412, 0.0002650916576385498, 0.0002742744982242584, 0.00028345733880996704, 0.00029264017939567566, 0.0003018230199813843, 0.0003110058605670929, 0.0003201887011528015, 0.00032937154173851013, 0.00033855438232421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 7.0, 13.0, 7.0, 13.0, 16.0, 17.0, 30.0, 36.0, 53.0, 72.0, 97.0, 166.0, 282.0, 513.0, 1003.0, 1990.0, 4443.0, 11864.0, 56574.0, 840325.0, 104353.0, 16072.0, 5535.0, 2357.0, 1211.0, 569.0, 335.0, 172.0, 106.0, 88.0, 57.0, 43.0, 39.0, 22.0, 14.0, 14.0, 13.0, 6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84033203125, -0.8128890991210938, -0.7854461669921875, -0.7580032348632812, -0.730560302734375, -0.7031173706054688, -0.6756744384765625, -0.6482315063476562, -0.62078857421875, -0.5933456420898438, -0.5659027099609375, -0.5384597778320312, -0.511016845703125, -0.48357391357421875, -0.4561309814453125, -0.42868804931640625, -0.4012451171875, -0.37380218505859375, -0.3463592529296875, -0.31891632080078125, -0.291473388671875, -0.26403045654296875, -0.2365875244140625, -0.20914459228515625, -0.18170166015625, -0.15425872802734375, -0.1268157958984375, -0.09937286376953125, -0.071929931640625, -0.04448699951171875, -0.0170440673828125, 0.01039886474609375, 0.037841796875, 0.06528472900390625, 0.0927276611328125, 0.12017059326171875, 0.147613525390625, 0.17505645751953125, 0.2024993896484375, 0.22994232177734375, 0.25738525390625, 0.28482818603515625, 0.3122711181640625, 0.33971405029296875, 0.367156982421875, 0.39459991455078125, 0.4220428466796875, 0.44948577880859375, 0.4769287109375, 0.5043716430664062, 0.5318145751953125, 0.5592575073242188, 0.586700439453125, 0.6141433715820312, 0.6415863037109375, 0.6690292358398438, 0.69647216796875, 0.7239151000976562, 0.7513580322265625, 0.7788009643554688, 0.806243896484375, 0.8336868286132812, 0.8611297607421875, 0.8885726928710938, 0.916015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 5.0, 7.0, 5.0, 5.0, 10.0, 11.0, 6.0, 15.0, 21.0, 30.0, 54.0, 81.0, 110.0, 144.0, 145.0, 99.0, 73.0, 41.0, 26.0, 22.0, 11.0, 5.0, 11.0, 10.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.85107421875, -0.8272781372070312, -0.8034820556640625, -0.7796859741210938, -0.755889892578125, -0.7320938110351562, -0.7082977294921875, -0.6845016479492188, -0.66070556640625, -0.6369094848632812, -0.6131134033203125, -0.5893173217773438, -0.565521240234375, -0.5417251586914062, -0.5179290771484375, -0.49413299560546875, -0.4703369140625, -0.44654083251953125, -0.4227447509765625, -0.39894866943359375, -0.375152587890625, -0.35135650634765625, -0.3275604248046875, -0.30376434326171875, -0.27996826171875, -0.25617218017578125, -0.2323760986328125, -0.20858001708984375, -0.184783935546875, -0.16098785400390625, -0.1371917724609375, -0.11339569091796875, -0.089599609375, -0.06580352783203125, -0.0420074462890625, -0.01821136474609375, 0.005584716796875, 0.02938079833984375, 0.0531768798828125, 0.07697296142578125, 0.10076904296875, 0.12456512451171875, 0.1483612060546875, 0.17215728759765625, 0.195953369140625, 0.21974945068359375, 0.2435455322265625, 0.26734161376953125, 0.2911376953125, 0.31493377685546875, 0.3387298583984375, 0.36252593994140625, 0.386322021484375, 0.41011810302734375, 0.4339141845703125, 0.45771026611328125, 0.48150634765625, 0.5053024291992188, 0.5290985107421875, 0.5528945922851562, 0.576690673828125, 0.6004867553710938, 0.6242828369140625, 0.6480789184570312, 0.671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 27.0, 84.0, 133.0, 271.0, 173.0, 121.0, 55.0, 33.0, 26.0, 19.0, 8.0, 9.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.606428146362305, -16.19607162475586, -15.785715103149414, -15.375358581542969, -14.965002059936523, -14.554645538330078, -14.144289016723633, -13.733932495117188, -13.323575973510742, -12.913219451904297, -12.502862930297852, -12.092506408691406, -11.682149887084961, -11.271793365478516, -10.86143684387207, -10.451080322265625, -10.040722846984863, -9.630366325378418, -9.220009803771973, -8.809653282165527, -8.399296760559082, -7.988940238952637, -7.578583240509033, -7.168226718902588, -6.757870197296143, -6.347513675689697, -5.937157154083252, -5.526800155639648, -5.116443634033203, -4.706087112426758, -4.2957305908203125, -3.885374069213867, -3.475017547607422, -3.0646610260009766, -2.6543045043945312, -2.243947744369507, -1.8335912227630615, -1.4232347011566162, -1.0128779411315918, -0.6025214195251465, -0.19216489791870117, 0.21819168329238892, 0.628548264503479, 1.0389049053192139, 1.4492614269256592, 1.8596179485321045, 2.269974708557129, 2.680331230163574, 3.0906877517700195, 3.501044273376465, 3.91140079498291, 4.3217573165893555, 4.732113838195801, 5.142470359802246, 5.55282735824585, 5.963183879852295, 6.37354040145874, 6.7838969230651855, 7.194253444671631, 7.604610443115234, 8.01496696472168, 8.425323486328125, 8.83568000793457, 9.246036529541016, 9.656393051147461]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 10.0, 10.0, 16.0, 12.0, 15.0, 23.0, 28.0, 32.0, 29.0, 46.0, 41.0, 47.0, 46.0, 67.0, 86.0, 73.0, 69.0, 57.0, 37.0, 37.0, 33.0, 20.0, 27.0, 19.0, 26.0, 15.0, 17.0, 7.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.614406585693359, -6.366888999938965, -6.11937141418457, -5.871853828430176, -5.624336242675781, -5.376818656921387, -5.129300594329834, -4.8817830085754395, -4.634265422821045, -4.38674783706665, -4.139230251312256, -3.8917124271392822, -3.6441948413848877, -3.396677255630493, -3.1491594314575195, -2.901641845703125, -2.6541242599487305, -2.406606674194336, -2.1590890884399414, -1.9115712642669678, -1.6640536785125732, -1.4165360927581787, -1.1690183877944946, -0.9215006828308105, -0.673983097076416, -0.4264654517173767, -0.1789478063583374, 0.0685698390007019, 0.3160874843597412, 0.5636050701141357, 0.8111227750778198, 1.058640480041504, 1.3061580657958984, 1.553675651550293, 1.801193356513977, 2.048711061477661, 2.2962286472320557, 2.54374623298645, 2.791264057159424, 3.0387816429138184, 3.286299228668213, 3.5338168144226074, 3.781334400177002, 4.0288519859313965, 4.276370048522949, 4.523887634277344, 4.771405220031738, 5.018922805786133, 5.266440391540527, 5.513957977294922, 5.761475563049316, 6.008993148803711, 6.2565107345581055, 6.5040283203125, 6.751546382904053, 6.999063968658447, 7.246581554412842, 7.494099140167236, 7.741616725921631, 7.989134311676025, 8.236652374267578, 8.484169960021973, 8.731687545776367, 8.979205131530762, 9.226722717285156]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 12.0, 13.0, 21.0, 32.0, 57.0, 64.0, 105.0, 162.0, 323.0, 573.0, 1245.0, 3641.0, 16943.0, 218534.0, 3489923.0, 429698.0, 24863.0, 4806.0, 1583.0, 669.0, 371.0, 185.0, 113.0, 98.0, 70.0, 51.0, 31.0, 22.0, 18.0, 6.0, 12.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8251953125, -0.7982254028320312, -0.7712554931640625, -0.7442855834960938, -0.717315673828125, -0.6903457641601562, -0.6633758544921875, -0.6364059448242188, -0.60943603515625, -0.5824661254882812, -0.5554962158203125, -0.5285263061523438, -0.501556396484375, -0.47458648681640625, -0.4476165771484375, -0.42064666748046875, -0.3936767578125, -0.36670684814453125, -0.3397369384765625, -0.31276702880859375, -0.285797119140625, -0.25882720947265625, -0.2318572998046875, -0.20488739013671875, -0.17791748046875, -0.15094757080078125, -0.1239776611328125, -0.09700775146484375, -0.070037841796875, -0.04306793212890625, -0.0160980224609375, 0.01087188720703125, 0.037841796875, 0.06481170654296875, 0.0917816162109375, 0.11875152587890625, 0.145721435546875, 0.17269134521484375, 0.1996612548828125, 0.22663116455078125, 0.25360107421875, 0.28057098388671875, 0.3075408935546875, 0.33451080322265625, 0.361480712890625, 0.38845062255859375, 0.4154205322265625, 0.44239044189453125, 0.4693603515625, 0.49633026123046875, 0.5233001708984375, 0.5502700805664062, 0.577239990234375, 0.6042098999023438, 0.6311798095703125, 0.6581497192382812, 0.68511962890625, 0.7120895385742188, 0.7390594482421875, 0.7660293579101562, 0.792999267578125, 0.8199691772460938, 0.8469390869140625, 0.8739089965820312, 0.90087890625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 16.0, 13.0, 26.0, 16.0, 36.0, 35.0, 36.0, 46.0, 51.0, 46.0, 59.0, 64.0, 68.0, 64.0, 56.0, 60.0, 35.0, 42.0, 44.0, 27.0, 31.0, 25.0, 14.0, 18.0, 14.0, 7.0, 6.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.434326171875, -0.4220161437988281, -0.40970611572265625, -0.3973960876464844, -0.3850860595703125, -0.3727760314941406, -0.36046600341796875, -0.3481559753417969, -0.335845947265625, -0.3235359191894531, -0.31122589111328125, -0.2989158630371094, -0.2866058349609375, -0.2742958068847656, -0.26198577880859375, -0.24967575073242188, -0.23736572265625, -0.22505569458007812, -0.21274566650390625, -0.20043563842773438, -0.1881256103515625, -0.17581558227539062, -0.16350555419921875, -0.15119552612304688, -0.138885498046875, -0.12657546997070312, -0.11426544189453125, -0.10195541381835938, -0.0896453857421875, -0.07733535766601562, -0.06502532958984375, -0.052715301513671875, -0.0404052734375, -0.028095245361328125, -0.01578521728515625, -0.003475189208984375, 0.0088348388671875, 0.021144866943359375, 0.03345489501953125, 0.045764923095703125, 0.058074951171875, 0.07038497924804688, 0.08269500732421875, 0.09500503540039062, 0.1073150634765625, 0.11962509155273438, 0.13193511962890625, 0.14424514770507812, 0.15655517578125, 0.16886520385742188, 0.18117523193359375, 0.19348526000976562, 0.2057952880859375, 0.21810531616210938, 0.23041534423828125, 0.24272537231445312, 0.255035400390625, 0.2673454284667969, 0.27965545654296875, 0.2919654846191406, 0.3042755126953125, 0.3165855407714844, 0.32889556884765625, 0.3412055969238281, 0.353515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 8.0, 9.0, 8.0, 5.0, 9.0, 12.0, 22.0, 17.0, 22.0, 33.0, 56.0, 53.0, 69.0, 108.0, 140.0, 196.0, 392.0, 642.0, 1329.0, 3991.0, 16924.0, 131959.0, 3168104.0, 814110.0, 43649.0, 7614.0, 2354.0, 984.0, 512.0, 299.0, 171.0, 140.0, 79.0, 60.0, 46.0, 34.0, 41.0, 16.0, 14.0, 10.0, 11.0, 11.0, 4.0, 2.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.95458984375, -0.9263229370117188, -0.8980560302734375, -0.8697891235351562, -0.841522216796875, -0.8132553100585938, -0.7849884033203125, -0.7567214965820312, -0.72845458984375, -0.7001876831054688, -0.6719207763671875, -0.6436538696289062, -0.615386962890625, -0.5871200561523438, -0.5588531494140625, -0.5305862426757812, -0.5023193359375, -0.47405242919921875, -0.4457855224609375, -0.41751861572265625, -0.389251708984375, -0.36098480224609375, -0.3327178955078125, -0.30445098876953125, -0.27618408203125, -0.24791717529296875, -0.2196502685546875, -0.19138336181640625, -0.163116455078125, -0.13484954833984375, -0.1065826416015625, -0.07831573486328125, -0.050048828125, -0.02178192138671875, 0.0064849853515625, 0.03475189208984375, 0.063018798828125, 0.09128570556640625, 0.1195526123046875, 0.14781951904296875, 0.17608642578125, 0.20435333251953125, 0.2326202392578125, 0.26088714599609375, 0.289154052734375, 0.31742095947265625, 0.3456878662109375, 0.37395477294921875, 0.4022216796875, 0.43048858642578125, 0.4587554931640625, 0.48702239990234375, 0.515289306640625, 0.5435562133789062, 0.5718231201171875, 0.6000900268554688, 0.62835693359375, 0.6566238403320312, 0.6848907470703125, 0.7131576538085938, 0.741424560546875, 0.7696914672851562, 0.7979583740234375, 0.8262252807617188, 0.8544921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 6.0, 17.0, 24.0, 31.0, 53.0, 88.0, 114.0, 191.0, 422.0, 692.0, 855.0, 671.0, 385.0, 206.0, 107.0, 69.0, 42.0, 24.0, 21.0, 16.0, 8.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7796554565429688, -0.7512054443359375, -0.7227554321289062, -0.694305419921875, -0.6658554077148438, -0.6374053955078125, -0.6089553833007812, -0.58050537109375, -0.5520553588867188, -0.5236053466796875, -0.49515533447265625, -0.466705322265625, -0.43825531005859375, -0.4098052978515625, -0.38135528564453125, -0.3529052734375, -0.32445526123046875, -0.2960052490234375, -0.26755523681640625, -0.239105224609375, -0.21065521240234375, -0.1822052001953125, -0.15375518798828125, -0.12530517578125, -0.09685516357421875, -0.0684051513671875, -0.03995513916015625, -0.011505126953125, 0.01694488525390625, 0.0453948974609375, 0.07384490966796875, 0.102294921875, 0.13074493408203125, 0.1591949462890625, 0.18764495849609375, 0.216094970703125, 0.24454498291015625, 0.2729949951171875, 0.30144500732421875, 0.32989501953125, 0.35834503173828125, 0.3867950439453125, 0.41524505615234375, 0.443695068359375, 0.47214508056640625, 0.5005950927734375, 0.5290451049804688, 0.5574951171875, 0.5859451293945312, 0.6143951416015625, 0.6428451538085938, 0.671295166015625, 0.6997451782226562, 0.7281951904296875, 0.7566452026367188, 0.78509521484375, 0.8135452270507812, 0.8419952392578125, 0.8704452514648438, 0.898895263671875, 0.9273452758789062, 0.9557952880859375, 0.9842453002929688, 1.0126953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 27.0, 44.0, 114.0, 220.0, 277.0, 178.0, 71.0, 22.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.320428848266602, -14.93005084991455, -14.539671897888184, -14.149293899536133, -13.758914947509766, -13.368536949157715, -12.978158950805664, -12.587779998779297, -12.197402000427246, -11.807024002075195, -11.416645050048828, -11.026267051696777, -10.635889053344727, -10.24551010131836, -9.855132102966309, -9.464754104614258, -9.07437515258789, -8.68399715423584, -8.293618202209473, -7.903240203857422, -7.512861728668213, -7.122483253479004, -6.732105255126953, -6.341726779937744, -5.951348304748535, -5.560969829559326, -5.170591354370117, -4.780213356018066, -4.389834880828857, -3.9994564056396484, -3.6090781688690186, -3.2186999320983887, -2.8283205032348633, -2.4379420280456543, -2.0475637912750244, -1.657185435295105, -1.2668070793151855, -0.8764287233352661, -0.4860503673553467, -0.0956721305847168, 0.2947063446044922, 0.6850847005844116, 1.075463056564331, 1.4658414125442505, 1.85621976852417, 2.246598243713379, 2.636976480484009, 3.0273547172546387, 3.4177331924438477, 3.8081116676330566, 4.198490142822266, 4.588868141174316, 4.979246616363525, 5.369625091552734, 5.760003089904785, 6.150381565093994, 6.540760040283203, 6.931138515472412, 7.321516990661621, 7.711894989013672, 8.102273941040039, 8.49265193939209, 8.88302993774414, 9.273408889770508, 9.663786888122559]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 8.0, 8.0, 12.0, 17.0, 28.0, 20.0, 19.0, 27.0, 42.0, 40.0, 45.0, 38.0, 61.0, 61.0, 57.0, 66.0, 56.0, 47.0, 42.0, 36.0, 43.0, 35.0, 29.0, 25.0, 21.0, 31.0, 10.0, 13.0, 14.0, 10.0, 7.0, 7.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021277666091919, -2.9093739986419678, -2.7974705696105957, -2.6855669021606445, -2.5736632347106934, -2.461759567260742, -2.34985613822937, -2.237952470779419, -2.126049041748047, -2.0141453742980957, -1.902241826057434, -1.7903382778167725, -1.6784346103668213, -1.5665310621261597, -1.454627513885498, -1.3427238464355469, -1.2308201789855957, -1.118916630744934, -1.007012963294983, -0.8951094150543213, -0.7832058072090149, -0.6713021993637085, -0.5593986511230469, -0.4474950432777405, -0.3355914354324341, -0.22368784248828888, -0.11178424954414368, 0.00011932849884033203, 0.11202293634414673, 0.22392654418945312, 0.33583009243011475, 0.44773370027542114, 0.5596370697021484, 0.6715406775474548, 0.7834442853927612, 0.8953478336334229, 1.007251501083374, 1.1191550493240356, 1.2310585975646973, 1.3429622650146484, 1.45486581325531, 1.5667693614959717, 1.6786730289459229, 1.7905765771865845, 1.902480125427246, 2.0143837928771973, 2.1262874603271484, 2.2381908893585205, 2.3500945568084717, 2.461998224258423, 2.573901653289795, 2.685805320739746, 2.7977089881896973, 2.9096126556396484, 3.0215160846710205, 3.1334197521209717, 3.2453231811523438, 3.357226848602295, 3.469130277633667, 3.581033945083618, 3.6929376125335693, 3.8048410415649414, 3.9167447090148926, 4.028648376464844, 4.140552043914795]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 11.0, 22.0, 29.0, 40.0, 49.0, 84.0, 123.0, 187.0, 379.0, 743.0, 1331.0, 2931.0, 6909.0, 19605.0, 63940.0, 255206.0, 487436.0, 147210.0, 40028.0, 12851.0, 4887.0, 2155.0, 1061.0, 537.0, 298.0, 169.0, 103.0, 84.0, 53.0, 28.0, 12.0, 18.0, 8.0, 2.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7665328979492188, -0.7420501708984375, -0.7175674438476562, -0.693084716796875, -0.6686019897460938, -0.6441192626953125, -0.6196365356445312, -0.59515380859375, -0.5706710815429688, -0.5461883544921875, -0.5217056274414062, -0.497222900390625, -0.47274017333984375, -0.4482574462890625, -0.42377471923828125, -0.3992919921875, -0.37480926513671875, -0.3503265380859375, -0.32584381103515625, -0.301361083984375, -0.27687835693359375, -0.2523956298828125, -0.22791290283203125, -0.20343017578125, -0.17894744873046875, -0.1544647216796875, -0.12998199462890625, -0.105499267578125, -0.08101654052734375, -0.0565338134765625, -0.03205108642578125, -0.007568359375, 0.01691436767578125, 0.0413970947265625, 0.06587982177734375, 0.090362548828125, 0.11484527587890625, 0.1393280029296875, 0.16381072998046875, 0.18829345703125, 0.21277618408203125, 0.2372589111328125, 0.26174163818359375, 0.286224365234375, 0.31070709228515625, 0.3351898193359375, 0.35967254638671875, 0.3841552734375, 0.40863800048828125, 0.4331207275390625, 0.45760345458984375, 0.482086181640625, 0.5065689086914062, 0.5310516357421875, 0.5555343627929688, 0.58001708984375, 0.6044998168945312, 0.6289825439453125, 0.6534652709960938, 0.677947998046875, 0.7024307250976562, 0.7269134521484375, 0.7513961791992188, 0.77587890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 9.0, 14.0, 20.0, 28.0, 26.0, 34.0, 54.0, 60.0, 53.0, 49.0, 56.0, 59.0, 65.0, 61.0, 52.0, 45.0, 41.0, 52.0, 33.0, 30.0, 29.0, 22.0, 19.0, 14.0, 10.0, 11.0, 9.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.46044921875, -0.4480133056640625, -0.435577392578125, -0.4231414794921875, -0.41070556640625, -0.3982696533203125, -0.385833740234375, -0.3733978271484375, -0.3609619140625, -0.3485260009765625, -0.336090087890625, -0.3236541748046875, -0.31121826171875, -0.2987823486328125, -0.286346435546875, -0.2739105224609375, -0.261474609375, -0.2490386962890625, -0.236602783203125, -0.2241668701171875, -0.21173095703125, -0.1992950439453125, -0.186859130859375, -0.1744232177734375, -0.1619873046875, -0.1495513916015625, -0.137115478515625, -0.1246795654296875, -0.11224365234375, -0.0998077392578125, -0.087371826171875, -0.0749359130859375, -0.0625, -0.0500640869140625, -0.037628173828125, -0.0251922607421875, -0.01275634765625, -0.0003204345703125, 0.012115478515625, 0.0245513916015625, 0.0369873046875, 0.0494232177734375, 0.061859130859375, 0.0742950439453125, 0.08673095703125, 0.0991668701171875, 0.111602783203125, 0.1240386962890625, 0.136474609375, 0.1489105224609375, 0.161346435546875, 0.1737823486328125, 0.18621826171875, 0.1986541748046875, 0.211090087890625, 0.2235260009765625, 0.2359619140625, 0.2483978271484375, 0.260833740234375, 0.2732696533203125, 0.28570556640625, 0.2981414794921875, 0.310577392578125, 0.3230133056640625, 0.33544921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 7.0, 4.0, 12.0, 21.0, 24.0, 38.0, 44.0, 88.0, 135.0, 207.0, 301.0, 525.0, 926.0, 1893.0, 5239.0, 21482.0, 156512.0, 746278.0, 92202.0, 15036.0, 3878.0, 1631.0, 800.0, 454.0, 287.0, 165.0, 98.0, 81.0, 54.0, 40.0, 26.0, 18.0, 7.0, 8.0, 4.0, 7.0, 1.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255859375, -1.2145233154296875, -1.173187255859375, -1.1318511962890625, -1.09051513671875, -1.0491790771484375, -1.007843017578125, -0.9665069580078125, -0.9251708984375, -0.8838348388671875, -0.842498779296875, -0.8011627197265625, -0.75982666015625, -0.7184906005859375, -0.677154541015625, -0.6358184814453125, -0.594482421875, -0.5531463623046875, -0.511810302734375, -0.4704742431640625, -0.42913818359375, -0.3878021240234375, -0.346466064453125, -0.3051300048828125, -0.2637939453125, -0.2224578857421875, -0.181121826171875, -0.1397857666015625, -0.09844970703125, -0.0571136474609375, -0.015777587890625, 0.0255584716796875, 0.06689453125, 0.1082305908203125, 0.149566650390625, 0.1909027099609375, 0.23223876953125, 0.2735748291015625, 0.314910888671875, 0.3562469482421875, 0.3975830078125, 0.4389190673828125, 0.480255126953125, 0.5215911865234375, 0.56292724609375, 0.6042633056640625, 0.645599365234375, 0.6869354248046875, 0.728271484375, 0.7696075439453125, 0.810943603515625, 0.8522796630859375, 0.89361572265625, 0.9349517822265625, 0.976287841796875, 1.0176239013671875, 1.0589599609375, 1.1002960205078125, 1.141632080078125, 1.1829681396484375, 1.22430419921875, 1.2656402587890625, 1.306976318359375, 1.3483123779296875, 1.3896484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 1.0, 5.0, 6.0, 9.0, 11.0, 11.0, 11.0, 14.0, 16.0, 30.0, 26.0, 22.0, 32.0, 37.0, 47.0, 40.0, 42.0, 49.0, 39.0, 45.0, 42.0, 36.0, 46.0, 39.0, 38.0, 46.0, 40.0, 18.0, 25.0, 24.0, 14.0, 16.0, 21.0, 21.0, 18.0, 8.0, 12.0, 9.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.033203125, -0.9966278076171875, -0.960052490234375, -0.9234771728515625, -0.88690185546875, -0.8503265380859375, -0.813751220703125, -0.7771759033203125, -0.7406005859375, -0.7040252685546875, -0.667449951171875, -0.6308746337890625, -0.59429931640625, -0.5577239990234375, -0.521148681640625, -0.4845733642578125, -0.447998046875, -0.4114227294921875, -0.374847412109375, -0.3382720947265625, -0.30169677734375, -0.2651214599609375, -0.228546142578125, -0.1919708251953125, -0.1553955078125, -0.1188201904296875, -0.082244873046875, -0.0456695556640625, -0.00909423828125, 0.0274810791015625, 0.064056396484375, 0.1006317138671875, 0.13720703125, 0.1737823486328125, 0.210357666015625, 0.2469329833984375, 0.28350830078125, 0.3200836181640625, 0.356658935546875, 0.3932342529296875, 0.4298095703125, 0.4663848876953125, 0.502960205078125, 0.5395355224609375, 0.57611083984375, 0.6126861572265625, 0.649261474609375, 0.6858367919921875, 0.722412109375, 0.7589874267578125, 0.795562744140625, 0.8321380615234375, 0.86871337890625, 0.9052886962890625, 0.941864013671875, 0.9784393310546875, 1.0150146484375, 1.0515899658203125, 1.088165283203125, 1.1247406005859375, 1.16131591796875, 1.1978912353515625, 1.234466552734375, 1.2710418701171875, 1.3076171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 6.0, 10.0, 13.0, 19.0, 26.0, 35.0, 62.0, 76.0, 128.0, 283.0, 499.0, 1125.0, 2945.0, 9366.0, 38919.0, 279065.0, 640107.0, 56694.0, 12566.0, 3713.0, 1387.0, 665.0, 322.0, 176.0, 103.0, 62.0, 55.0, 44.0, 21.0, 16.0, 12.0, 6.0, 11.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5625, -0.5438232421875, -0.525146484375, -0.5064697265625, -0.48779296875, -0.4691162109375, -0.450439453125, -0.4317626953125, -0.4130859375, -0.3944091796875, -0.375732421875, -0.3570556640625, -0.33837890625, -0.3197021484375, -0.301025390625, -0.2823486328125, -0.263671875, -0.2449951171875, -0.226318359375, -0.2076416015625, -0.18896484375, -0.1702880859375, -0.151611328125, -0.1329345703125, -0.1142578125, -0.0955810546875, -0.076904296875, -0.0582275390625, -0.03955078125, -0.0208740234375, -0.002197265625, 0.0164794921875, 0.03515625, 0.0538330078125, 0.072509765625, 0.0911865234375, 0.10986328125, 0.1285400390625, 0.147216796875, 0.1658935546875, 0.1845703125, 0.2032470703125, 0.221923828125, 0.2406005859375, 0.25927734375, 0.2779541015625, 0.296630859375, 0.3153076171875, 0.333984375, 0.3526611328125, 0.371337890625, 0.3900146484375, 0.40869140625, 0.4273681640625, 0.446044921875, 0.4647216796875, 0.4833984375, 0.5020751953125, 0.520751953125, 0.5394287109375, 0.55810546875, 0.5767822265625, 0.595458984375, 0.6141357421875, 0.6328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 3.0, 3.0, 6.0, 9.0, 4.0, 14.0, 7.0, 26.0, 30.0, 43.0, 65.0, 99.0, 153.0, 189.0, 94.0, 69.0, 46.0, 27.0, 12.0, 17.0, 14.0, 10.0, 8.0, 13.0, 4.0, 8.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018846988677978516, -0.00018309615552425385, -0.00017772242426872253, -0.00017234869301319122, -0.0001669749617576599, -0.0001616012305021286, -0.0001562274992465973, -0.00015085376799106598, -0.00014548003673553467, -0.00014010630548000336, -0.00013473257422447205, -0.00012935884296894073, -0.00012398511171340942, -0.00011861138045787811, -0.0001132376492023468, -0.00010786391794681549, -0.00010249018669128418, -9.711645543575287e-05, -9.174272418022156e-05, -8.636899292469025e-05, -8.099526166915894e-05, -7.562153041362762e-05, -7.024779915809631e-05, -6.4874067902565e-05, -5.950033664703369e-05, -5.412660539150238e-05, -4.875287413597107e-05, -4.337914288043976e-05, -3.800541162490845e-05, -3.2631680369377136e-05, -2.7257949113845825e-05, -2.1884217858314514e-05, -1.6510486602783203e-05, -1.1136755347251892e-05, -5.763024091720581e-06, -3.8929283618927e-07, 4.984438419342041e-06, 1.0358169674873352e-05, 1.5731900930404663e-05, 2.1105632185935974e-05, 2.6479363441467285e-05, 3.1853094696998596e-05, 3.722682595252991e-05, 4.260055720806122e-05, 4.797428846359253e-05, 5.334801971912384e-05, 5.872175097465515e-05, 6.409548223018646e-05, 6.946921348571777e-05, 7.484294474124908e-05, 8.02166759967804e-05, 8.55904072523117e-05, 9.096413850784302e-05, 9.633786976337433e-05, 0.00010171160101890564, 0.00010708533227443695, 0.00011245906352996826, 0.00011783279478549957, 0.00012320652604103088, 0.0001285802572965622, 0.0001339539885520935, 0.00013932771980762482, 0.00014470145106315613, 0.00015007518231868744, 0.00015544891357421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 1.0, 6.0, 13.0, 16.0, 17.0, 42.0, 52.0, 96.0, 144.0, 271.0, 441.0, 854.0, 1730.0, 4599.0, 14422.0, 57570.0, 576923.0, 324486.0, 47315.0, 12079.0, 3933.0, 1592.0, 828.0, 424.0, 266.0, 149.0, 100.0, 60.0, 42.0, 18.0, 23.0, 11.0, 6.0, 6.0, 9.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.62451171875, -0.6066360473632812, -0.5887603759765625, -0.5708847045898438, -0.553009033203125, -0.5351333618164062, -0.5172576904296875, -0.49938201904296875, -0.48150634765625, -0.46363067626953125, -0.4457550048828125, -0.42787933349609375, -0.410003662109375, -0.39212799072265625, -0.3742523193359375, -0.35637664794921875, -0.3385009765625, -0.32062530517578125, -0.3027496337890625, -0.28487396240234375, -0.266998291015625, -0.24912261962890625, -0.2312469482421875, -0.21337127685546875, -0.19549560546875, -0.17761993408203125, -0.1597442626953125, -0.14186859130859375, -0.123992919921875, -0.10611724853515625, -0.0882415771484375, -0.07036590576171875, -0.052490234375, -0.03461456298828125, -0.0167388916015625, 0.00113677978515625, 0.019012451171875, 0.03688812255859375, 0.0547637939453125, 0.07263946533203125, 0.09051513671875, 0.10839080810546875, 0.1262664794921875, 0.14414215087890625, 0.162017822265625, 0.17989349365234375, 0.1977691650390625, 0.21564483642578125, 0.2335205078125, 0.25139617919921875, 0.2692718505859375, 0.28714752197265625, 0.305023193359375, 0.32289886474609375, 0.3407745361328125, 0.35865020751953125, 0.37652587890625, 0.39440155029296875, 0.4122772216796875, 0.43015289306640625, 0.448028564453125, 0.46590423583984375, 0.4837799072265625, 0.5016555786132812, 0.51953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 8.0, 13.0, 11.0, 16.0, 25.0, 30.0, 33.0, 43.0, 54.0, 76.0, 76.0, 89.0, 88.0, 66.0, 61.0, 48.0, 52.0, 25.0, 20.0, 19.0, 18.0, 21.0, 15.0, 9.0, 3.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2841148376464844, -0.27379608154296875, -0.2634773254394531, -0.2531585693359375, -0.24283981323242188, -0.23252105712890625, -0.22220230102539062, -0.211883544921875, -0.20156478881835938, -0.19124603271484375, -0.18092727661132812, -0.1706085205078125, -0.16028976440429688, -0.14997100830078125, -0.13965225219726562, -0.12933349609375, -0.11901473999023438, -0.10869598388671875, -0.09837722778320312, -0.0880584716796875, -0.07773971557617188, -0.06742095947265625, -0.057102203369140625, -0.046783447265625, -0.036464691162109375, -0.02614593505859375, -0.015827178955078125, -0.0055084228515625, 0.004810333251953125, 0.01512908935546875, 0.025447845458984375, 0.0357666015625, 0.046085357666015625, 0.05640411376953125, 0.06672286987304688, 0.0770416259765625, 0.08736038208007812, 0.09767913818359375, 0.10799789428710938, 0.118316650390625, 0.12863540649414062, 0.13895416259765625, 0.14927291870117188, 0.1595916748046875, 0.16991043090820312, 0.18022918701171875, 0.19054794311523438, 0.20086669921875, 0.21118545532226562, 0.22150421142578125, 0.23182296752929688, 0.2421417236328125, 0.2524604797363281, 0.26277923583984375, 0.2730979919433594, 0.283416748046875, 0.2937355041503906, 0.30405426025390625, 0.3143730163574219, 0.3246917724609375, 0.3350105285644531, 0.34532928466796875, 0.3556480407714844, 0.365966796875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 22.0, 47.0, 106.0, 253.0, 298.0, 133.0, 73.0, 28.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.409189224243164, -15.999808311462402, -15.59042739868164, -15.181046485900879, -14.771665573120117, -14.362284660339355, -13.952903747558594, -13.543523788452148, -13.13414192199707, -12.724761009216309, -12.315380096435547, -11.905999183654785, -11.496618270874023, -11.087237358093262, -10.6778564453125, -10.268476486206055, -9.859095573425293, -9.449714660644531, -9.04033374786377, -8.630952835083008, -8.221571922302246, -7.812191009521484, -7.402810573577881, -6.993429660797119, -6.584048748016357, -6.174667835235596, -5.765286922454834, -5.3559064865112305, -4.946525573730469, -4.537144660949707, -4.127763748168945, -3.7183828353881836, -3.309001922607422, -2.89962100982666, -2.4902400970458984, -2.080859422683716, -1.671478509902954, -1.2620975971221924, -0.8527169227600098, -0.44333600997924805, -0.03395509719848633, 0.3754257559776306, 0.7848066091537476, 1.1941874027252197, 1.6035683155059814, 2.012949228286743, 2.422329902648926, 2.8317108154296875, 3.241091728210449, 3.650472640991211, 4.059853553771973, 4.469234466552734, 4.878615379333496, 5.287996292114258, 5.697376728057861, 6.106757640838623, 6.516138553619385, 6.9255194664001465, 7.334900379180908, 7.744280815124512, 8.153661727905273, 8.563042640686035, 8.972423553466797, 9.381804466247559, 9.79118537902832]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 2.0, 10.0, 14.0, 18.0, 16.0, 11.0, 18.0, 22.0, 23.0, 26.0, 31.0, 34.0, 39.0, 59.0, 49.0, 68.0, 74.0, 66.0, 58.0, 38.0, 26.0, 35.0, 35.0, 41.0, 24.0, 24.0, 21.0, 13.0, 22.0, 15.0, 10.0, 8.0, 6.0, 11.0, 5.0, 3.0, 6.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.722186088562012, -5.552452087402344, -5.382718086242676, -5.212984085083008, -5.043250560760498, -4.87351655960083, -4.703782558441162, -4.534048557281494, -4.364314556121826, -4.194580554962158, -4.02484655380249, -3.8551127910614014, -3.6853787899017334, -3.5156450271606445, -3.3459110260009766, -3.1761770248413086, -3.0064432621002197, -2.8367092609405518, -2.666975498199463, -2.497241497039795, -2.327507495880127, -2.157773494720459, -1.9880397319793701, -1.8183057308197021, -1.6485718488693237, -1.4788379669189453, -1.3091039657592773, -1.139370083808899, -0.9696361422538757, -0.7999022006988525, -0.6301683187484741, -0.46043431758880615, -0.29070043563842773, -0.12096650898456573, 0.048767417669296265, 0.21850132942199707, 0.38823527097702026, 0.5579692125320435, 0.7277030944824219, 0.8974370956420898, 1.0671709775924683, 1.2369048595428467, 1.4066388607025146, 1.576372742652893, 1.7461066246032715, 1.9158406257629395, 2.0855746269226074, 2.2553086280822754, 2.4250423908233643, 2.5947763919830322, 2.764510154724121, 2.934244155883789, 3.103978157043457, 3.273712158203125, 3.443445920944214, 3.613179922103882, 3.7829136848449707, 3.9526476860046387, 4.122381687164307, 4.292115211486816, 4.461849212646484, 4.631583213806152, 4.80131721496582, 4.971051216125488, 5.140785217285156]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 13.0, 13.0, 26.0, 31.0, 51.0, 91.0, 120.0, 198.0, 346.0, 635.0, 1378.0, 3350.0, 11011.0, 69451.0, 2472489.0, 1570796.0, 48703.0, 9396.0, 3211.0, 1369.0, 662.0, 379.0, 209.0, 101.0, 70.0, 56.0, 39.0, 20.0, 15.0, 4.0, 9.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88525390625, -0.8575286865234375, -0.829803466796875, -0.8020782470703125, -0.77435302734375, -0.7466278076171875, -0.718902587890625, -0.6911773681640625, -0.6634521484375, -0.6357269287109375, -0.608001708984375, -0.5802764892578125, -0.55255126953125, -0.5248260498046875, -0.497100830078125, -0.4693756103515625, -0.441650390625, -0.4139251708984375, -0.386199951171875, -0.3584747314453125, -0.33074951171875, -0.3030242919921875, -0.275299072265625, -0.2475738525390625, -0.2198486328125, -0.1921234130859375, -0.164398193359375, -0.1366729736328125, -0.10894775390625, -0.0812225341796875, -0.053497314453125, -0.0257720947265625, 0.001953125, 0.0296783447265625, 0.057403564453125, 0.0851287841796875, 0.11285400390625, 0.1405792236328125, 0.168304443359375, 0.1960296630859375, 0.2237548828125, 0.2514801025390625, 0.279205322265625, 0.3069305419921875, 0.33465576171875, 0.3623809814453125, 0.390106201171875, 0.4178314208984375, 0.445556640625, 0.4732818603515625, 0.501007080078125, 0.5287322998046875, 0.55645751953125, 0.5841827392578125, 0.611907958984375, 0.6396331787109375, 0.6673583984375, 0.6950836181640625, 0.722808837890625, 0.7505340576171875, 0.77825927734375, 0.8059844970703125, 0.833709716796875, 0.8614349365234375, 0.88916015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 7.0, 10.0, 13.0, 10.0, 8.0, 13.0, 24.0, 32.0, 44.0, 48.0, 64.0, 49.0, 73.0, 55.0, 73.0, 60.0, 56.0, 74.0, 33.0, 40.0, 40.0, 31.0, 28.0, 22.0, 21.0, 16.0, 12.0, 15.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43701171875, -0.4247589111328125, -0.412506103515625, -0.4002532958984375, -0.38800048828125, -0.3757476806640625, -0.363494873046875, -0.3512420654296875, -0.3389892578125, -0.3267364501953125, -0.314483642578125, -0.3022308349609375, -0.28997802734375, -0.2777252197265625, -0.265472412109375, -0.2532196044921875, -0.240966796875, -0.2287139892578125, -0.216461181640625, -0.2042083740234375, -0.19195556640625, -0.1797027587890625, -0.167449951171875, -0.1551971435546875, -0.1429443359375, -0.1306915283203125, -0.118438720703125, -0.1061859130859375, -0.09393310546875, -0.0816802978515625, -0.069427490234375, -0.0571746826171875, -0.044921875, -0.0326690673828125, -0.020416259765625, -0.0081634521484375, 0.00408935546875, 0.0163421630859375, 0.028594970703125, 0.0408477783203125, 0.0531005859375, 0.0653533935546875, 0.077606201171875, 0.0898590087890625, 0.10211181640625, 0.1143646240234375, 0.126617431640625, 0.1388702392578125, 0.151123046875, 0.1633758544921875, 0.175628662109375, 0.1878814697265625, 0.20013427734375, 0.2123870849609375, 0.224639892578125, 0.2368927001953125, 0.2491455078125, 0.2613983154296875, 0.273651123046875, 0.2859039306640625, 0.29815673828125, 0.3104095458984375, 0.322662353515625, 0.3349151611328125, 0.34716796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 3.0, 0.0, 9.0, 13.0, 9.0, 25.0, 36.0, 33.0, 48.0, 55.0, 96.0, 125.0, 189.0, 387.0, 1070.0, 5029.0, 115147.0, 4042422.0, 25213.0, 2844.0, 736.0, 297.0, 140.0, 84.0, 66.0, 44.0, 37.0, 22.0, 23.0, 17.0, 12.0, 6.0, 10.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.01605224609375, -1.9364013671875, -1.85675048828125, -1.777099609375, -1.69744873046875, -1.6177978515625, -1.53814697265625, -1.45849609375, -1.37884521484375, -1.2991943359375, -1.21954345703125, -1.139892578125, -1.06024169921875, -0.9805908203125, -0.90093994140625, -0.8212890625, -0.74163818359375, -0.6619873046875, -0.58233642578125, -0.502685546875, -0.42303466796875, -0.3433837890625, -0.26373291015625, -0.18408203125, -0.10443115234375, -0.0247802734375, 0.05487060546875, 0.134521484375, 0.21417236328125, 0.2938232421875, 0.37347412109375, 0.453125, 0.53277587890625, 0.6124267578125, 0.69207763671875, 0.771728515625, 0.85137939453125, 0.9310302734375, 1.01068115234375, 1.09033203125, 1.16998291015625, 1.2496337890625, 1.32928466796875, 1.408935546875, 1.48858642578125, 1.5682373046875, 1.64788818359375, 1.7275390625, 1.80718994140625, 1.8868408203125, 1.96649169921875, 2.046142578125, 2.12579345703125, 2.2054443359375, 2.28509521484375, 2.36474609375, 2.44439697265625, 2.5240478515625, 2.60369873046875, 2.683349609375, 2.76300048828125, 2.8426513671875, 2.92230224609375, 3.001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 13.0, 24.0, 64.0, 141.0, 315.0, 991.0, 1354.0, 692.0, 247.0, 102.0, 43.0, 31.0, 26.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.45703125, -1.4119110107421875, -1.366790771484375, -1.3216705322265625, -1.27655029296875, -1.2314300537109375, -1.186309814453125, -1.1411895751953125, -1.0960693359375, -1.0509490966796875, -1.005828857421875, -0.9607086181640625, -0.91558837890625, -0.8704681396484375, -0.825347900390625, -0.7802276611328125, -0.735107421875, -0.6899871826171875, -0.644866943359375, -0.5997467041015625, -0.55462646484375, -0.5095062255859375, -0.464385986328125, -0.4192657470703125, -0.3741455078125, -0.3290252685546875, -0.283905029296875, -0.2387847900390625, -0.19366455078125, -0.1485443115234375, -0.103424072265625, -0.0583038330078125, -0.01318359375, 0.0319366455078125, 0.077056884765625, 0.1221771240234375, 0.16729736328125, 0.2124176025390625, 0.257537841796875, 0.3026580810546875, 0.3477783203125, 0.3928985595703125, 0.438018798828125, 0.4831390380859375, 0.52825927734375, 0.5733795166015625, 0.618499755859375, 0.6636199951171875, 0.708740234375, 0.7538604736328125, 0.798980712890625, 0.8441009521484375, 0.88922119140625, 0.9343414306640625, 0.979461669921875, 1.0245819091796875, 1.0697021484375, 1.1148223876953125, 1.159942626953125, 1.2050628662109375, 1.25018310546875, 1.2953033447265625, 1.340423583984375, 1.3855438232421875, 1.4306640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 22.0, 52.0, 136.0, 218.0, 248.0, 160.0, 69.0, 28.0, 24.0, 9.0, 9.0, 4.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.272615432739258, -13.828376770019531, -13.384138107299805, -12.939899444580078, -12.495661735534668, -12.051423072814941, -11.607184410095215, -11.162945747375488, -10.718707084655762, -10.274468421936035, -9.830229759216309, -9.385992050170898, -8.941753387451172, -8.497514724731445, -8.053276062011719, -7.609037399291992, -7.164799213409424, -6.720560550689697, -6.276322364807129, -5.832083702087402, -5.387845039367676, -4.943606376647949, -4.499368190765381, -4.055129528045654, -3.610891103744507, -3.1666526794433594, -2.722414016723633, -2.2781755924224854, -1.8339370489120483, -1.3896985054016113, -0.9454600811004639, -0.5012214183807373, -0.056982994079589844, 0.3872555196285248, 0.8314940333366394, 1.2757325172424316, 1.7199710607528687, 2.1642096042633057, 2.608448028564453, 3.0526866912841797, 3.496925115585327, 3.9411635398864746, 4.385402202606201, 4.8296403884887695, 5.273879051208496, 5.718117713928223, 6.162356376647949, 6.606595039367676, 7.050833225250244, 7.495071887969971, 7.939310073852539, 8.383548736572266, 8.827787399291992, 9.272026062011719, 9.716264724731445, 10.160503387451172, 10.604741096496582, 11.048979759216309, 11.493218421936035, 11.937456130981445, 12.381694793701172, 12.825933456420898, 13.270172119140625, 13.714410781860352, 14.158649444580078]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 9.0, 11.0, 28.0, 32.0, 23.0, 44.0, 61.0, 61.0, 68.0, 72.0, 70.0, 57.0, 64.0, 51.0, 48.0, 58.0, 52.0, 41.0, 30.0, 20.0, 18.0, 18.0, 12.0, 14.0, 10.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.908550262451172, -5.744234561920166, -5.579919338226318, -5.4156036376953125, -5.251288414001465, -5.086972713470459, -4.922657489776611, -4.7583417892456055, -4.594026565551758, -4.429710865020752, -4.265395641326904, -4.101079940795898, -3.936764717102051, -3.772449016571045, -3.608133554458618, -3.4438180923461914, -3.2795023918151855, -3.115186929702759, -2.950871467590332, -2.7865560054779053, -2.6222405433654785, -2.4579248428344727, -2.293609380722046, -2.129293918609619, -1.9649784564971924, -1.8006629943847656, -1.6363475322723389, -1.4720319509506226, -1.3077164888381958, -1.143401026725769, -0.9790855050086975, -0.814769983291626, -0.6504545211791992, -0.4861390292644501, -0.3218235373497009, -0.15750804543495178, 0.006807446479797363, 0.17112290859222412, 0.33543843030929565, 0.4997539520263672, 0.664069414138794, 0.8283848762512207, 0.9927003979682922, 1.1570159196853638, 1.3213313817977905, 1.4856468439102173, 1.6499624252319336, 1.8142778873443604, 1.978593349456787, 2.142908811569214, 2.3072242736816406, 2.4715397357940674, 2.635855197906494, 2.8001708984375, 2.9644863605499268, 3.1288018226623535, 3.2931172847747803, 3.457432746887207, 3.621748208999634, 3.7860636711120605, 3.9503793716430664, 4.114694595336914, 4.27901029586792, 4.443325996398926, 4.607641220092773]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 13.0, 10.0, 20.0, 16.0, 28.0, 54.0, 87.0, 130.0, 239.0, 467.0, 1182.0, 3495.0, 13951.0, 80478.0, 527507.0, 357683.0, 49304.0, 9439.0, 2649.0, 883.0, 381.0, 213.0, 119.0, 64.0, 46.0, 31.0, 14.0, 13.0, 14.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1314239501953125, -1.100738525390625, -1.0700531005859375, -1.03936767578125, -1.0086822509765625, -0.977996826171875, -0.9473114013671875, -0.9166259765625, -0.8859405517578125, -0.855255126953125, -0.8245697021484375, -0.79388427734375, -0.7631988525390625, -0.732513427734375, -0.7018280029296875, -0.671142578125, -0.6404571533203125, -0.609771728515625, -0.5790863037109375, -0.54840087890625, -0.5177154541015625, -0.487030029296875, -0.4563446044921875, -0.4256591796875, -0.3949737548828125, -0.364288330078125, -0.3336029052734375, -0.30291748046875, -0.2722320556640625, -0.241546630859375, -0.2108612060546875, -0.18017578125, -0.1494903564453125, -0.118804931640625, -0.0881195068359375, -0.05743408203125, -0.0267486572265625, 0.003936767578125, 0.0346221923828125, 0.0653076171875, 0.0959930419921875, 0.126678466796875, 0.1573638916015625, 0.18804931640625, 0.2187347412109375, 0.249420166015625, 0.2801055908203125, 0.310791015625, 0.3414764404296875, 0.372161865234375, 0.4028472900390625, 0.43353271484375, 0.4642181396484375, 0.494903564453125, 0.5255889892578125, 0.5562744140625, 0.5869598388671875, 0.617645263671875, 0.6483306884765625, 0.67901611328125, 0.7097015380859375, 0.740386962890625, 0.7710723876953125, 0.8017578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 8.0, 15.0, 19.0, 17.0, 43.0, 39.0, 64.0, 61.0, 61.0, 79.0, 81.0, 88.0, 65.0, 69.0, 66.0, 42.0, 35.0, 27.0, 16.0, 24.0, 24.0, 12.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.685546875, -0.6688613891601562, -0.6521759033203125, -0.6354904174804688, -0.618804931640625, -0.6021194458007812, -0.5854339599609375, -0.5687484741210938, -0.55206298828125, -0.5353775024414062, -0.5186920166015625, -0.5020065307617188, -0.485321044921875, -0.46863555908203125, -0.4519500732421875, -0.43526458740234375, -0.4185791015625, -0.40189361572265625, -0.3852081298828125, -0.36852264404296875, -0.351837158203125, -0.33515167236328125, -0.3184661865234375, -0.30178070068359375, -0.28509521484375, -0.26840972900390625, -0.2517242431640625, -0.23503875732421875, -0.218353271484375, -0.20166778564453125, -0.1849822998046875, -0.16829681396484375, -0.151611328125, -0.13492584228515625, -0.1182403564453125, -0.10155487060546875, -0.084869384765625, -0.06818389892578125, -0.0514984130859375, -0.03481292724609375, -0.01812744140625, -0.00144195556640625, 0.0152435302734375, 0.03192901611328125, 0.048614501953125, 0.06529998779296875, 0.0819854736328125, 0.09867095947265625, 0.1153564453125, 0.13204193115234375, 0.1487274169921875, 0.16541290283203125, 0.182098388671875, 0.19878387451171875, 0.2154693603515625, 0.23215484619140625, 0.24884033203125, 0.26552581787109375, 0.2822113037109375, 0.29889678955078125, 0.315582275390625, 0.33226776123046875, 0.3489532470703125, 0.36563873291015625, 0.38232421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 1.0, 6.0, 7.0, 8.0, 10.0, 15.0, 13.0, 23.0, 44.0, 36.0, 49.0, 72.0, 116.0, 155.0, 270.0, 483.0, 896.0, 1790.0, 4404.0, 12393.0, 42621.0, 189055.0, 603522.0, 142063.0, 33331.0, 10018.0, 3624.0, 1486.0, 772.0, 427.0, 263.0, 177.0, 113.0, 75.0, 48.0, 52.0, 28.0, 21.0, 17.0, 10.0, 8.0, 5.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.654296875, -0.6312637329101562, -0.6082305908203125, -0.5851974487304688, -0.562164306640625, -0.5391311645507812, -0.5160980224609375, -0.49306488037109375, -0.47003173828125, -0.44699859619140625, -0.4239654541015625, -0.40093231201171875, -0.377899169921875, -0.35486602783203125, -0.3318328857421875, -0.30879974365234375, -0.2857666015625, -0.26273345947265625, -0.2397003173828125, -0.21666717529296875, -0.193634033203125, -0.17060089111328125, -0.1475677490234375, -0.12453460693359375, -0.10150146484375, -0.07846832275390625, -0.0554351806640625, -0.03240203857421875, -0.009368896484375, 0.01366424560546875, 0.0366973876953125, 0.05973052978515625, 0.082763671875, 0.10579681396484375, 0.1288299560546875, 0.15186309814453125, 0.174896240234375, 0.19792938232421875, 0.2209625244140625, 0.24399566650390625, 0.26702880859375, 0.29006195068359375, 0.3130950927734375, 0.33612823486328125, 0.359161376953125, 0.38219451904296875, 0.4052276611328125, 0.42826080322265625, 0.4512939453125, 0.47432708740234375, 0.4973602294921875, 0.5203933715820312, 0.543426513671875, 0.5664596557617188, 0.5894927978515625, 0.6125259399414062, 0.63555908203125, 0.6585922241210938, 0.6816253662109375, 0.7046585083007812, 0.727691650390625, 0.7507247924804688, 0.7737579345703125, 0.7967910766601562, 0.81982421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 6.0, 4.0, 10.0, 18.0, 12.0, 19.0, 18.0, 17.0, 25.0, 35.0, 30.0, 39.0, 39.0, 57.0, 53.0, 41.0, 64.0, 49.0, 60.0, 50.0, 54.0, 47.0, 39.0, 45.0, 34.0, 30.0, 23.0, 25.0, 16.0, 10.0, 11.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.685394287109375, -1.63739013671875, -1.589385986328125, -1.5413818359375, -1.493377685546875, -1.44537353515625, -1.397369384765625, -1.349365234375, -1.301361083984375, -1.25335693359375, -1.205352783203125, -1.1573486328125, -1.109344482421875, -1.06134033203125, -1.013336181640625, -0.96533203125, -0.917327880859375, -0.86932373046875, -0.821319580078125, -0.7733154296875, -0.725311279296875, -0.67730712890625, -0.629302978515625, -0.581298828125, -0.533294677734375, -0.48529052734375, -0.437286376953125, -0.3892822265625, -0.341278076171875, -0.29327392578125, -0.245269775390625, -0.197265625, -0.149261474609375, -0.10125732421875, -0.053253173828125, -0.0052490234375, 0.042755126953125, 0.09075927734375, 0.138763427734375, 0.186767578125, 0.234771728515625, 0.28277587890625, 0.330780029296875, 0.3787841796875, 0.426788330078125, 0.47479248046875, 0.522796630859375, 0.57080078125, 0.618804931640625, 0.66680908203125, 0.714813232421875, 0.7628173828125, 0.810821533203125, 0.85882568359375, 0.906829833984375, 0.954833984375, 1.002838134765625, 1.05084228515625, 1.098846435546875, 1.1468505859375, 1.194854736328125, 1.24285888671875, 1.290863037109375, 1.3388671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 7.0, 12.0, 25.0, 35.0, 56.0, 98.0, 179.0, 303.0, 589.0, 1114.0, 2452.0, 5731.0, 15666.0, 47698.0, 201767.0, 614899.0, 110279.0, 29846.0, 10101.0, 3994.0, 1773.0, 835.0, 465.0, 241.0, 143.0, 71.0, 44.0, 43.0, 17.0, 16.0, 11.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.340576171875, -0.3309288024902344, -0.32128143310546875, -0.3116340637207031, -0.3019866943359375, -0.2923393249511719, -0.28269195556640625, -0.2730445861816406, -0.263397216796875, -0.2537498474121094, -0.24410247802734375, -0.23445510864257812, -0.2248077392578125, -0.21516036987304688, -0.20551300048828125, -0.19586563110351562, -0.18621826171875, -0.17657089233398438, -0.16692352294921875, -0.15727615356445312, -0.1476287841796875, -0.13798141479492188, -0.12833404541015625, -0.11868667602539062, -0.109039306640625, -0.09939193725585938, -0.08974456787109375, -0.08009719848632812, -0.0704498291015625, -0.060802459716796875, -0.05115509033203125, -0.041507720947265625, -0.0318603515625, -0.022212982177734375, -0.01256561279296875, -0.002918243408203125, 0.0067291259765625, 0.016376495361328125, 0.02602386474609375, 0.035671234130859375, 0.045318603515625, 0.054965972900390625, 0.06461334228515625, 0.07426071166992188, 0.0839080810546875, 0.09355545043945312, 0.10320281982421875, 0.11285018920898438, 0.12249755859375, 0.13214492797851562, 0.14179229736328125, 0.15143966674804688, 0.1610870361328125, 0.17073440551757812, 0.18038177490234375, 0.19002914428710938, 0.199676513671875, 0.20932388305664062, 0.21897125244140625, 0.22861862182617188, 0.2382659912109375, 0.24791336059570312, 0.25756072998046875, 0.2672080993652344, 0.27685546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 10.0, 14.0, 18.0, 21.0, 41.0, 30.0, 63.0, 76.0, 81.0, 96.0, 110.0, 100.0, 76.0, 51.0, 45.0, 28.0, 19.0, 21.0, 10.0, 13.0, 11.0, 6.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.623434066772461e-05, -7.368624210357666e-05, -7.113814353942871e-05, -6.859004497528076e-05, -6.604194641113281e-05, -6.349384784698486e-05, -6.0945749282836914e-05, -5.8397650718688965e-05, -5.5849552154541016e-05, -5.3301453590393066e-05, -5.075335502624512e-05, -4.820525646209717e-05, -4.565715789794922e-05, -4.310905933380127e-05, -4.056096076965332e-05, -3.801286220550537e-05, -3.546476364135742e-05, -3.291666507720947e-05, -3.0368566513061523e-05, -2.7820467948913574e-05, -2.5272369384765625e-05, -2.2724270820617676e-05, -2.0176172256469727e-05, -1.7628073692321777e-05, -1.5079975128173828e-05, -1.2531876564025879e-05, -9.98377799987793e-06, -7.4356794357299805e-06, -4.887580871582031e-06, -2.339482307434082e-06, 2.086162567138672e-07, 2.7567148208618164e-06, 5.304813385009766e-06, 7.852911949157715e-06, 1.0401010513305664e-05, 1.2949109077453613e-05, 1.5497207641601562e-05, 1.8045306205749512e-05, 2.059340476989746e-05, 2.314150333404541e-05, 2.568960189819336e-05, 2.823770046234131e-05, 3.078579902648926e-05, 3.333389759063721e-05, 3.5881996154785156e-05, 3.8430094718933105e-05, 4.0978193283081055e-05, 4.3526291847229004e-05, 4.607439041137695e-05, 4.86224889755249e-05, 5.117058753967285e-05, 5.37186861038208e-05, 5.626678466796875e-05, 5.88148832321167e-05, 6.136298179626465e-05, 6.39110803604126e-05, 6.645917892456055e-05, 6.90072774887085e-05, 7.155537605285645e-05, 7.41034746170044e-05, 7.665157318115234e-05, 7.919967174530029e-05, 8.174777030944824e-05, 8.429586887359619e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 21.0, 29.0, 31.0, 31.0, 58.0, 76.0, 133.0, 199.0, 289.0, 439.0, 664.0, 1187.0, 2263.0, 4110.0, 8506.0, 19791.0, 50939.0, 162382.0, 557980.0, 153882.0, 48913.0, 18925.0, 8309.0, 3987.0, 2137.0, 1214.0, 749.0, 484.0, 285.0, 158.0, 108.0, 73.0, 49.0, 43.0, 36.0, 18.0, 14.0, 5.0, 7.0, 2.0, 5.0, 4.0, 4.0, 1.0], "bins": [-0.3251953125, -0.3167438507080078, -0.3082923889160156, -0.29984092712402344, -0.29138946533203125, -0.28293800354003906, -0.2744865417480469, -0.2660350799560547, -0.2575836181640625, -0.2491321563720703, -0.24068069458007812, -0.23222923278808594, -0.22377777099609375, -0.21532630920410156, -0.20687484741210938, -0.1984233856201172, -0.189971923828125, -0.1815204620361328, -0.17306900024414062, -0.16461753845214844, -0.15616607666015625, -0.14771461486816406, -0.13926315307617188, -0.1308116912841797, -0.1223602294921875, -0.11390876770019531, -0.10545730590820312, -0.09700584411621094, -0.08855438232421875, -0.08010292053222656, -0.07165145874023438, -0.06319999694824219, -0.05474853515625, -0.04629707336425781, -0.037845611572265625, -0.029394149780273438, -0.02094268798828125, -0.012491226196289062, -0.004039764404296875, 0.0044116973876953125, 0.0128631591796875, 0.021314620971679688, 0.029766082763671875, 0.03821754455566406, 0.04666900634765625, 0.05512046813964844, 0.06357192993164062, 0.07202339172363281, 0.080474853515625, 0.08892631530761719, 0.09737777709960938, 0.10582923889160156, 0.11428070068359375, 0.12273216247558594, 0.13118362426757812, 0.1396350860595703, 0.1480865478515625, 0.1565380096435547, 0.16498947143554688, 0.17344093322753906, 0.18189239501953125, 0.19034385681152344, 0.19879531860351562, 0.2072467803955078, 0.2156982421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 2.0, 7.0, 7.0, 10.0, 17.0, 16.0, 19.0, 22.0, 30.0, 44.0, 47.0, 53.0, 74.0, 82.0, 88.0, 83.0, 70.0, 65.0, 54.0, 41.0, 34.0, 27.0, 14.0, 18.0, 7.0, 11.0, 10.0, 7.0, 8.0, 5.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.24727630615234375, -0.2391815185546875, -0.23108673095703125, -0.222991943359375, -0.21489715576171875, -0.2068023681640625, -0.19870758056640625, -0.19061279296875, -0.18251800537109375, -0.1744232177734375, -0.16632843017578125, -0.158233642578125, -0.15013885498046875, -0.1420440673828125, -0.13394927978515625, -0.1258544921875, -0.11775970458984375, -0.1096649169921875, -0.10157012939453125, -0.093475341796875, -0.08538055419921875, -0.0772857666015625, -0.06919097900390625, -0.06109619140625, -0.05300140380859375, -0.0449066162109375, -0.03681182861328125, -0.028717041015625, -0.02062225341796875, -0.0125274658203125, -0.00443267822265625, 0.003662109375, 0.01175689697265625, 0.0198516845703125, 0.02794647216796875, 0.036041259765625, 0.04413604736328125, 0.0522308349609375, 0.06032562255859375, 0.06842041015625, 0.07651519775390625, 0.0846099853515625, 0.09270477294921875, 0.100799560546875, 0.10889434814453125, 0.1169891357421875, 0.12508392333984375, 0.1331787109375, 0.14127349853515625, 0.1493682861328125, 0.15746307373046875, 0.165557861328125, 0.17365264892578125, 0.1817474365234375, 0.18984222412109375, 0.19793701171875, 0.20603179931640625, 0.2141265869140625, 0.22222137451171875, 0.230316162109375, 0.23841094970703125, 0.2465057373046875, 0.25460052490234375, 0.2626953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 12.0, 23.0, 42.0, 112.0, 147.0, 285.0, 196.0, 76.0, 42.0, 23.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.224206924438477, -9.921184539794922, -9.618163108825684, -9.315140724182129, -9.01211929321289, -8.709096908569336, -8.406075477600098, -8.103053092956543, -7.800031661987305, -7.497009754180908, -7.193987846374512, -6.890965938568115, -6.587944030761719, -6.284922122955322, -5.981900215148926, -5.678877830505371, -5.375855922698975, -5.072834014892578, -4.769812107086182, -4.466790199279785, -4.163768291473389, -3.860746383666992, -3.5577242374420166, -3.25470232963562, -2.9516804218292236, -2.648658514022827, -2.3456366062164307, -2.042614459991455, -1.7395926713943481, -1.4365707635879517, -1.1335487365722656, -0.8305268287658691, -0.5275049209594727, -0.22448298335075378, 0.07853895425796509, 0.38156092166900635, 0.6845828294754028, 0.9876047372817993, 1.2906267642974854, 1.5936486721038818, 1.8966705799102783, 2.199692487716675, 2.5027143955230713, 2.805736541748047, 3.1087584495544434, 3.41178035736084, 3.7148022651672363, 4.017824172973633, 4.320846080780029, 4.623867988586426, 4.926889896392822, 5.229911804199219, 5.532933712005615, 5.835955619812012, 6.138978004455566, 6.441999435424805, 6.745021820068359, 7.048043727874756, 7.351065635681152, 7.654087543487549, 7.957109451293945, 8.2601318359375, 8.563153266906738, 8.866175651550293, 9.169197082519531]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 10.0, 10.0, 6.0, 14.0, 11.0, 23.0, 19.0, 27.0, 28.0, 40.0, 39.0, 34.0, 44.0, 52.0, 69.0, 101.0, 77.0, 66.0, 48.0, 35.0, 30.0, 27.0, 24.0, 22.0, 26.0, 18.0, 13.0, 17.0, 12.0, 15.0, 11.0, 6.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.293898582458496, -5.094769477844238, -4.895640850067139, -4.696511745452881, -4.497383117675781, -4.298254013061523, -4.099124908447266, -3.899996042251587, -3.700867176055908, -3.5017383098602295, -3.302609443664551, -3.103480339050293, -2.9043514728546143, -2.7052226066589355, -2.5060935020446777, -2.306964635848999, -2.1078357696533203, -1.9087069034576416, -1.7095779180526733, -1.510448932647705, -1.3113200664520264, -1.1121912002563477, -0.9130622148513794, -0.7139332294464111, -0.5148043632507324, -0.31567543745040894, -0.11654651165008545, 0.08258241415023804, 0.2817113399505615, 0.480840265750885, 0.6799691915512085, 0.8790981769561768, 1.0782265663146973, 1.277355432510376, 1.4764844179153442, 1.6756134033203125, 1.8747422695159912, 2.07387113571167, 2.2730002403259277, 2.4721291065216064, 2.671257972717285, 2.870386838912964, 3.0695157051086426, 3.2686448097229004, 3.467773675918579, 3.666902542114258, 3.8660316467285156, 4.065160751342773, 4.264289379119873, 4.463418483734131, 4.6625471115112305, 4.861676216125488, 5.060805320739746, 5.259933948516846, 5.4590630531311035, 5.658191680908203, 5.857320785522461, 6.056449890136719, 6.255578517913818, 6.454707622528076, 6.653836250305176, 6.852965354919434, 7.052094459533691, 7.251223564147949, 7.450352191925049]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 10.0, 12.0, 19.0, 28.0, 32.0, 79.0, 88.0, 162.0, 281.0, 405.0, 725.0, 1286.0, 2679.0, 6745.0, 26227.0, 453149.0, 3517686.0, 158349.0, 15678.0, 4985.0, 2441.0, 1300.0, 710.0, 466.0, 261.0, 158.0, 98.0, 75.0, 43.0, 37.0, 16.0, 14.0, 8.0, 3.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0478515625, -1.017364501953125, -0.98687744140625, -0.956390380859375, -0.9259033203125, -0.895416259765625, -0.86492919921875, -0.834442138671875, -0.803955078125, -0.773468017578125, -0.74298095703125, -0.712493896484375, -0.6820068359375, -0.651519775390625, -0.62103271484375, -0.590545654296875, -0.56005859375, -0.529571533203125, -0.49908447265625, -0.468597412109375, -0.4381103515625, -0.407623291015625, -0.37713623046875, -0.346649169921875, -0.316162109375, -0.285675048828125, -0.25518798828125, -0.224700927734375, -0.1942138671875, -0.163726806640625, -0.13323974609375, -0.102752685546875, -0.072265625, -0.041778564453125, -0.01129150390625, 0.019195556640625, 0.0496826171875, 0.080169677734375, 0.11065673828125, 0.141143798828125, 0.171630859375, 0.202117919921875, 0.23260498046875, 0.263092041015625, 0.2935791015625, 0.324066162109375, 0.35455322265625, 0.385040283203125, 0.41552734375, 0.446014404296875, 0.47650146484375, 0.506988525390625, 0.5374755859375, 0.567962646484375, 0.59844970703125, 0.628936767578125, 0.659423828125, 0.689910888671875, 0.72039794921875, 0.750885009765625, 0.7813720703125, 0.811859130859375, 0.84234619140625, 0.872833251953125, 0.9033203125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 20.0, 25.0, 33.0, 54.0, 54.0, 60.0, 77.0, 71.0, 73.0, 80.0, 86.0, 62.0, 64.0, 56.0, 33.0, 42.0, 31.0, 20.0, 14.0, 13.0, 5.0, 10.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41796875, -0.400634765625, -0.38330078125, -0.365966796875, -0.3486328125, -0.331298828125, -0.31396484375, -0.296630859375, -0.279296875, -0.261962890625, -0.24462890625, -0.227294921875, -0.2099609375, -0.192626953125, -0.17529296875, -0.157958984375, -0.140625, -0.123291015625, -0.10595703125, -0.088623046875, -0.0712890625, -0.053955078125, -0.03662109375, -0.019287109375, -0.001953125, 0.015380859375, 0.03271484375, 0.050048828125, 0.0673828125, 0.084716796875, 0.10205078125, 0.119384765625, 0.13671875, 0.154052734375, 0.17138671875, 0.188720703125, 0.2060546875, 0.223388671875, 0.24072265625, 0.258056640625, 0.275390625, 0.292724609375, 0.31005859375, 0.327392578125, 0.3447265625, 0.362060546875, 0.37939453125, 0.396728515625, 0.4140625, 0.431396484375, 0.44873046875, 0.466064453125, 0.4833984375, 0.500732421875, 0.51806640625, 0.535400390625, 0.552734375, 0.570068359375, 0.58740234375, 0.604736328125, 0.6220703125, 0.639404296875, 0.65673828125, 0.674072265625, 0.69140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 8.0, 16.0, 31.0, 66.0, 175.0, 495.0, 2283.0, 67829.0, 4115500.0, 6553.0, 849.0, 276.0, 94.0, 49.0, 25.0, 11.0, 11.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.54595947265625, -4.3848876953125, -4.22381591796875, -4.062744140625, -3.90167236328125, -3.7406005859375, -3.57952880859375, -3.41845703125, -3.25738525390625, -3.0963134765625, -2.93524169921875, -2.774169921875, -2.61309814453125, -2.4520263671875, -2.29095458984375, -2.1298828125, -1.96881103515625, -1.8077392578125, -1.64666748046875, -1.485595703125, -1.32452392578125, -1.1634521484375, -1.00238037109375, -0.84130859375, -0.68023681640625, -0.5191650390625, -0.35809326171875, -0.197021484375, -0.03594970703125, 0.1251220703125, 0.28619384765625, 0.447265625, 0.60833740234375, 0.7694091796875, 0.93048095703125, 1.091552734375, 1.25262451171875, 1.4136962890625, 1.57476806640625, 1.73583984375, 1.89691162109375, 2.0579833984375, 2.21905517578125, 2.380126953125, 2.54119873046875, 2.7022705078125, 2.86334228515625, 3.0244140625, 3.18548583984375, 3.3465576171875, 3.50762939453125, 3.668701171875, 3.82977294921875, 3.9908447265625, 4.15191650390625, 4.31298828125, 4.47406005859375, 4.6351318359375, 4.79620361328125, 4.957275390625, 5.11834716796875, 5.2794189453125, 5.44049072265625, 5.6015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 20.0, 26.0, 70.0, 241.0, 803.0, 1726.0, 795.0, 219.0, 77.0, 37.0, 10.0, 11.0, 7.0, 2.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.0819091796875, -2.023193359375, -1.9644775390625, -1.90576171875, -1.8470458984375, -1.788330078125, -1.7296142578125, -1.6708984375, -1.6121826171875, -1.553466796875, -1.4947509765625, -1.43603515625, -1.3773193359375, -1.318603515625, -1.2598876953125, -1.201171875, -1.1424560546875, -1.083740234375, -1.0250244140625, -0.96630859375, -0.9075927734375, -0.848876953125, -0.7901611328125, -0.7314453125, -0.6727294921875, -0.614013671875, -0.5552978515625, -0.49658203125, -0.4378662109375, -0.379150390625, -0.3204345703125, -0.26171875, -0.2030029296875, -0.144287109375, -0.0855712890625, -0.02685546875, 0.0318603515625, 0.090576171875, 0.1492919921875, 0.2080078125, 0.2667236328125, 0.325439453125, 0.3841552734375, 0.44287109375, 0.5015869140625, 0.560302734375, 0.6190185546875, 0.677734375, 0.7364501953125, 0.795166015625, 0.8538818359375, 0.91259765625, 0.9713134765625, 1.030029296875, 1.0887451171875, 1.1474609375, 1.2061767578125, 1.264892578125, 1.3236083984375, 1.38232421875, 1.4410400390625, 1.499755859375, 1.5584716796875, 1.6171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 12.0, 18.0, 37.0, 93.0, 215.0, 278.0, 190.0, 82.0, 29.0, 19.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.659038543701172, -18.197010040283203, -17.7349796295166, -17.272951126098633, -16.810922622680664, -16.348892211914062, -15.886863708496094, -15.424835205078125, -14.96280574798584, -14.500776290893555, -14.038747787475586, -13.5767183303833, -13.114689826965332, -12.652660369873047, -12.190631866455078, -11.728602409362793, -11.266572952270508, -10.804543495178223, -10.342514991760254, -9.880485534667969, -9.41845703125, -8.956427574157715, -8.49439811706543, -8.032369613647461, -7.570341110229492, -7.108312129974365, -6.646283149719238, -6.184253692626953, -5.722224712371826, -5.260195732116699, -4.798166751861572, -4.336137771606445, -3.87410831451416, -3.412079334259033, -2.950050115585327, -2.4880211353302, -2.025991916656494, -1.5639629364013672, -1.1019339561462402, -0.6399047374725342, -0.17787575721740723, 0.2841533124446869, 0.746182382106781, 1.2082114219665527, 1.6702405214309692, 2.1322696208953857, 2.5942986011505127, 3.0563278198242188, 3.5183568000793457, 3.9803857803344727, 4.4424147605896, 4.904443740844727, 5.366473197937012, 5.828502178192139, 6.290531158447266, 6.752560615539551, 7.2145891189575195, 7.6766180992126465, 8.138647079467773, 8.600676536560059, 9.062705039978027, 9.524734497070312, 9.986763000488281, 10.448792457580566, 10.910821914672852]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 5.0, 9.0, 16.0, 6.0, 17.0, 21.0, 21.0, 15.0, 32.0, 23.0, 26.0, 39.0, 44.0, 51.0, 49.0, 53.0, 66.0, 43.0, 49.0, 38.0, 49.0, 47.0, 42.0, 26.0, 39.0, 26.0, 23.0, 28.0, 25.0, 13.0, 18.0, 17.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.572056293487549, -4.442127704620361, -4.312199115753174, -4.182270526885986, -4.052341938018799, -3.9224133491516113, -3.7924845218658447, -3.6625559329986572, -3.5326273441314697, -3.4026987552642822, -3.2727701663970947, -3.1428415775299072, -3.0129127502441406, -2.882984161376953, -2.7530555725097656, -2.623126983642578, -2.4931983947753906, -2.363269805908203, -2.2333412170410156, -2.103412628173828, -1.973483920097351, -1.8435553312301636, -1.7136266231536865, -1.583698034286499, -1.4537694454193115, -1.323840856552124, -1.1939122676849365, -1.0639835596084595, -0.934054970741272, -0.8041263818740845, -0.6741977334022522, -0.5442690849304199, -0.4143400192260742, -0.28441140055656433, -0.15448278188705444, -0.024554163217544556, 0.10537445545196533, 0.23530304431915283, 0.3652316927909851, 0.4951603412628174, 0.6250889301300049, 0.7550175189971924, 0.8849461674690247, 1.014874815940857, 1.1448034048080444, 1.274731993675232, 1.404660701751709, 1.5345892906188965, 1.664517879486084, 1.7944464683532715, 1.924375057220459, 2.0543036460876465, 2.184232234954834, 2.3141608238220215, 2.444089651107788, 2.5740182399749756, 2.703946828842163, 2.8338754177093506, 2.963804006576538, 3.0937325954437256, 3.223661422729492, 3.3535900115966797, 3.483518600463867, 3.6134471893310547, 3.743375778198242]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 3.0, 6.0, 10.0, 13.0, 20.0, 23.0, 21.0, 32.0, 34.0, 68.0, 99.0, 143.0, 230.0, 418.0, 661.0, 1262.0, 2411.0, 4909.0, 12036.0, 33732.0, 126362.0, 476204.0, 286678.0, 67230.0, 20369.0, 7940.0, 3494.0, 1749.0, 952.0, 486.0, 318.0, 225.0, 120.0, 86.0, 62.0, 37.0, 23.0, 13.0, 11.0, 20.0, 16.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.68505859375, -0.66204833984375, -0.6390380859375, -0.61602783203125, -0.593017578125, -0.57000732421875, -0.5469970703125, -0.52398681640625, -0.5009765625, -0.47796630859375, -0.4549560546875, -0.43194580078125, -0.408935546875, -0.38592529296875, -0.3629150390625, -0.33990478515625, -0.31689453125, -0.29388427734375, -0.2708740234375, -0.24786376953125, -0.224853515625, -0.20184326171875, -0.1788330078125, -0.15582275390625, -0.1328125, -0.10980224609375, -0.0867919921875, -0.06378173828125, -0.040771484375, -0.01776123046875, 0.0052490234375, 0.02825927734375, 0.05126953125, 0.07427978515625, 0.0972900390625, 0.12030029296875, 0.143310546875, 0.16632080078125, 0.1893310546875, 0.21234130859375, 0.2353515625, 0.25836181640625, 0.2813720703125, 0.30438232421875, 0.327392578125, 0.35040283203125, 0.3734130859375, 0.39642333984375, 0.41943359375, 0.44244384765625, 0.4654541015625, 0.48846435546875, 0.511474609375, 0.53448486328125, 0.5574951171875, 0.58050537109375, 0.603515625, 0.62652587890625, 0.6495361328125, 0.67254638671875, 0.695556640625, 0.71856689453125, 0.7415771484375, 0.76458740234375, 0.78759765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 5.0, 8.0, 11.0, 17.0, 18.0, 22.0, 36.0, 30.0, 45.0, 48.0, 45.0, 58.0, 52.0, 52.0, 57.0, 49.0, 61.0, 43.0, 44.0, 53.0, 38.0, 38.0, 27.0, 37.0, 20.0, 16.0, 14.0, 16.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46044921875, -0.44675445556640625, -0.4330596923828125, -0.41936492919921875, -0.405670166015625, -0.39197540283203125, -0.3782806396484375, -0.36458587646484375, -0.35089111328125, -0.33719635009765625, -0.3235015869140625, -0.30980682373046875, -0.296112060546875, -0.28241729736328125, -0.2687225341796875, -0.25502777099609375, -0.2413330078125, -0.22763824462890625, -0.2139434814453125, -0.20024871826171875, -0.186553955078125, -0.17285919189453125, -0.1591644287109375, -0.14546966552734375, -0.13177490234375, -0.11808013916015625, -0.1043853759765625, -0.09069061279296875, -0.076995849609375, -0.06330108642578125, -0.0496063232421875, -0.03591156005859375, -0.022216796875, -0.00852203369140625, 0.0051727294921875, 0.01886749267578125, 0.032562255859375, 0.04625701904296875, 0.0599517822265625, 0.07364654541015625, 0.08734130859375, 0.10103607177734375, 0.1147308349609375, 0.12842559814453125, 0.142120361328125, 0.15581512451171875, 0.1695098876953125, 0.18320465087890625, 0.1968994140625, 0.21059417724609375, 0.2242889404296875, 0.23798370361328125, 0.251678466796875, 0.26537322998046875, 0.2790679931640625, 0.29276275634765625, 0.30645751953125, 0.32015228271484375, 0.3338470458984375, 0.34754180908203125, 0.361236572265625, 0.37493133544921875, 0.3886260986328125, 0.40232086181640625, 0.416015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 9.0, 12.0, 13.0, 22.0, 24.0, 37.0, 52.0, 85.0, 115.0, 192.0, 300.0, 549.0, 1117.0, 2702.0, 7953.0, 32987.0, 224661.0, 683643.0, 72036.0, 14381.0, 4299.0, 1543.0, 761.0, 363.0, 243.0, 155.0, 76.0, 67.0, 45.0, 26.0, 16.0, 12.0, 15.0, 7.0, 9.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.86962890625, -0.8364639282226562, -0.8032989501953125, -0.7701339721679688, -0.736968994140625, -0.7038040161132812, -0.6706390380859375, -0.6374740600585938, -0.60430908203125, -0.5711441040039062, -0.5379791259765625, -0.5048141479492188, -0.471649169921875, -0.43848419189453125, -0.4053192138671875, -0.37215423583984375, -0.3389892578125, -0.30582427978515625, -0.2726593017578125, -0.23949432373046875, -0.206329345703125, -0.17316436767578125, -0.1399993896484375, -0.10683441162109375, -0.07366943359375, -0.04050445556640625, -0.0073394775390625, 0.02582550048828125, 0.058990478515625, 0.09215545654296875, 0.1253204345703125, 0.15848541259765625, 0.191650390625, 0.22481536865234375, 0.2579803466796875, 0.29114532470703125, 0.324310302734375, 0.35747528076171875, 0.3906402587890625, 0.42380523681640625, 0.45697021484375, 0.49013519287109375, 0.5233001708984375, 0.5564651489257812, 0.589630126953125, 0.6227951049804688, 0.6559600830078125, 0.6891250610351562, 0.7222900390625, 0.7554550170898438, 0.7886199951171875, 0.8217849731445312, 0.854949951171875, 0.8881149291992188, 0.9212799072265625, 0.9544448852539062, 0.98760986328125, 1.0207748413085938, 1.0539398193359375, 1.0871047973632812, 1.120269775390625, 1.1534347534179688, 1.1865997314453125, 1.2197647094726562, 1.2529296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 8.0, 14.0, 17.0, 14.0, 27.0, 25.0, 22.0, 37.0, 34.0, 38.0, 37.0, 51.0, 51.0, 62.0, 56.0, 55.0, 51.0, 45.0, 49.0, 43.0, 43.0, 34.0, 27.0, 29.0, 25.0, 18.0, 16.0, 21.0, 9.0, 9.0, 3.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1746978759765625, -1.127716064453125, -1.0807342529296875, -1.03375244140625, -0.9867706298828125, -0.939788818359375, -0.8928070068359375, -0.8458251953125, -0.7988433837890625, -0.751861572265625, -0.7048797607421875, -0.65789794921875, -0.6109161376953125, -0.563934326171875, -0.5169525146484375, -0.469970703125, -0.4229888916015625, -0.376007080078125, -0.3290252685546875, -0.28204345703125, -0.2350616455078125, -0.188079833984375, -0.1410980224609375, -0.0941162109375, -0.0471343994140625, -0.000152587890625, 0.0468292236328125, 0.09381103515625, 0.1407928466796875, 0.187774658203125, 0.2347564697265625, 0.28173828125, 0.3287200927734375, 0.375701904296875, 0.4226837158203125, 0.46966552734375, 0.5166473388671875, 0.563629150390625, 0.6106109619140625, 0.6575927734375, 0.7045745849609375, 0.751556396484375, 0.7985382080078125, 0.84552001953125, 0.8925018310546875, 0.939483642578125, 0.9864654541015625, 1.033447265625, 1.0804290771484375, 1.127410888671875, 1.1743927001953125, 1.22137451171875, 1.2683563232421875, 1.315338134765625, 1.3623199462890625, 1.4093017578125, 1.4562835693359375, 1.503265380859375, 1.5502471923828125, 1.59722900390625, 1.6442108154296875, 1.691192626953125, 1.7381744384765625, 1.78515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 18.0, 24.0, 52.0, 111.0, 291.0, 845.0, 4471.0, 59348.0, 954075.0, 25549.0, 2705.0, 670.0, 198.0, 92.0, 37.0, 10.0, 14.0, 8.0, 12.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93115234375, -0.8944473266601562, -0.8577423095703125, -0.8210372924804688, -0.784332275390625, -0.7476272583007812, -0.7109222412109375, -0.6742172241210938, -0.63751220703125, -0.6008071899414062, -0.5641021728515625, -0.5273971557617188, -0.490692138671875, -0.45398712158203125, -0.4172821044921875, -0.38057708740234375, -0.3438720703125, -0.30716705322265625, -0.2704620361328125, -0.23375701904296875, -0.197052001953125, -0.16034698486328125, -0.1236419677734375, -0.08693695068359375, -0.05023193359375, -0.01352691650390625, 0.0231781005859375, 0.05988311767578125, 0.096588134765625, 0.13329315185546875, 0.1699981689453125, 0.20670318603515625, 0.243408203125, 0.28011322021484375, 0.3168182373046875, 0.35352325439453125, 0.390228271484375, 0.42693328857421875, 0.4636383056640625, 0.5003433227539062, 0.53704833984375, 0.5737533569335938, 0.6104583740234375, 0.6471633911132812, 0.683868408203125, 0.7205734252929688, 0.7572784423828125, 0.7939834594726562, 0.8306884765625, 0.8673934936523438, 0.9040985107421875, 0.9408035278320312, 0.977508544921875, 1.0142135620117188, 1.0509185791015625, 1.0876235961914062, 1.12432861328125, 1.1610336303710938, 1.1977386474609375, 1.2344436645507812, 1.271148681640625, 1.3078536987304688, 1.3445587158203125, 1.3812637329101562, 1.41796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 10.0, 9.0, 11.0, 13.0, 23.0, 26.0, 44.0, 57.0, 102.0, 185.0, 177.0, 110.0, 68.0, 46.0, 25.0, 14.0, 7.0, 13.0, 3.0, 8.0, 5.0, 6.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001399517059326172, -0.00013595353811979294, -0.0001319553703069687, -0.00012795720249414444, -0.0001239590346813202, -0.00011996086686849594, -0.00011596269905567169, -0.00011196453124284744, -0.0001079663634300232, -0.00010396819561719894, -9.99700278043747e-05, -9.597185999155045e-05, -9.19736921787262e-05, -8.797552436590195e-05, -8.39773565530777e-05, -7.997918874025345e-05, -7.59810209274292e-05, -7.198285311460495e-05, -6.79846853017807e-05, -6.398651748895645e-05, -5.99883496761322e-05, -5.599018186330795e-05, -5.1992014050483704e-05, -4.7993846237659454e-05, -4.3995678424835205e-05, -3.9997510612010956e-05, -3.5999342799186707e-05, -3.200117498636246e-05, -2.8003007173538208e-05, -2.400483936071396e-05, -2.000667154788971e-05, -1.600850373506546e-05, -1.2010335922241211e-05, -8.012168109416962e-06, -4.014000296592712e-06, -1.5832483768463135e-08, 3.982335329055786e-06, 7.980503141880035e-06, 1.1978670954704285e-05, 1.5976838767528534e-05, 1.9975006580352783e-05, 2.3973174393177032e-05, 2.7971342206001282e-05, 3.196951001882553e-05, 3.596767783164978e-05, 3.996584564447403e-05, 4.396401345729828e-05, 4.796218127012253e-05, 5.196034908294678e-05, 5.5958516895771027e-05, 5.9956684708595276e-05, 6.395485252141953e-05, 6.795302033424377e-05, 7.195118814706802e-05, 7.594935595989227e-05, 7.994752377271652e-05, 8.394569158554077e-05, 8.794385939836502e-05, 9.194202721118927e-05, 9.594019502401352e-05, 9.993836283683777e-05, 0.00010393653064966202, 0.00010793469846248627, 0.00011193286627531052, 0.00011593103408813477]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 16.0, 16.0, 29.0, 43.0, 51.0, 60.0, 108.0, 149.0, 251.0, 434.0, 720.0, 1683.0, 4405.0, 19259.0, 225275.0, 754328.0, 31410.0, 6098.0, 1978.0, 874.0, 478.0, 273.0, 179.0, 113.0, 91.0, 61.0, 31.0, 29.0, 21.0, 17.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7661895751953125, -0.742340087890625, -0.7184906005859375, -0.69464111328125, -0.6707916259765625, -0.646942138671875, -0.6230926513671875, -0.5992431640625, -0.5753936767578125, -0.551544189453125, -0.5276947021484375, -0.50384521484375, -0.4799957275390625, -0.456146240234375, -0.4322967529296875, -0.408447265625, -0.3845977783203125, -0.360748291015625, -0.3368988037109375, -0.31304931640625, -0.2891998291015625, -0.265350341796875, -0.2415008544921875, -0.2176513671875, -0.1938018798828125, -0.169952392578125, -0.1461029052734375, -0.12225341796875, -0.0984039306640625, -0.074554443359375, -0.0507049560546875, -0.02685546875, -0.0030059814453125, 0.020843505859375, 0.0446929931640625, 0.06854248046875, 0.0923919677734375, 0.116241455078125, 0.1400909423828125, 0.1639404296875, 0.1877899169921875, 0.211639404296875, 0.2354888916015625, 0.25933837890625, 0.2831878662109375, 0.307037353515625, 0.3308868408203125, 0.354736328125, 0.3785858154296875, 0.402435302734375, 0.4262847900390625, 0.45013427734375, 0.4739837646484375, 0.497833251953125, 0.5216827392578125, 0.5455322265625, 0.5693817138671875, 0.593231201171875, 0.6170806884765625, 0.64093017578125, 0.6647796630859375, 0.688629150390625, 0.7124786376953125, 0.736328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 11.0, 6.0, 12.0, 12.0, 28.0, 33.0, 45.0, 119.0, 262.0, 220.0, 117.0, 54.0, 26.0, 21.0, 18.0, 4.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265625, -0.7014312744140625, -0.676300048828125, -0.6511688232421875, -0.62603759765625, -0.6009063720703125, -0.575775146484375, -0.5506439208984375, -0.5255126953125, -0.5003814697265625, -0.475250244140625, -0.4501190185546875, -0.42498779296875, -0.3998565673828125, -0.374725341796875, -0.3495941162109375, -0.324462890625, -0.2993316650390625, -0.274200439453125, -0.2490692138671875, -0.22393798828125, -0.1988067626953125, -0.173675537109375, -0.1485443115234375, -0.1234130859375, -0.0982818603515625, -0.073150634765625, -0.0480194091796875, -0.02288818359375, 0.0022430419921875, 0.027374267578125, 0.0525054931640625, 0.07763671875, 0.1027679443359375, 0.127899169921875, 0.1530303955078125, 0.17816162109375, 0.2032928466796875, 0.228424072265625, 0.2535552978515625, 0.2786865234375, 0.3038177490234375, 0.328948974609375, 0.3540802001953125, 0.37921142578125, 0.4043426513671875, 0.429473876953125, 0.4546051025390625, 0.479736328125, 0.5048675537109375, 0.529998779296875, 0.5551300048828125, 0.58026123046875, 0.6053924560546875, 0.630523681640625, 0.6556549072265625, 0.6807861328125, 0.7059173583984375, 0.731048583984375, 0.7561798095703125, 0.78131103515625, 0.8064422607421875, 0.831573486328125, 0.8567047119140625, 0.8818359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 34.0, 93.0, 433.0, 334.0, 73.0, 20.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.11299133300781, -33.38637924194336, -32.659767150878906, -31.933156967163086, -31.206546783447266, -30.479934692382812, -29.753324508666992, -29.02671241760254, -28.30010223388672, -27.573490142822266, -26.846879959106445, -26.120267868041992, -25.393657684326172, -24.66704559326172, -23.9404354095459, -23.213823318481445, -22.487213134765625, -21.760601043701172, -21.03399085998535, -20.3073787689209, -19.580768585205078, -18.854156494140625, -18.127546310424805, -17.40093421936035, -16.6743221282959, -15.947710990905762, -15.221099853515625, -14.494488716125488, -13.767877578735352, -13.041266441345215, -12.314655303955078, -11.588043212890625, -10.861433982849121, -10.134822845458984, -9.408211708068848, -8.681600570678711, -7.954989433288574, -7.2283782958984375, -6.501766681671143, -5.775155544281006, -5.048544406890869, -4.321933269500732, -3.5953221321105957, -2.86871075630188, -2.142099618911743, -1.4154884815216064, -0.6888771057128906, 0.037734031677246094, 0.7643451690673828, 1.4909563064575195, 2.2175674438476562, 2.944178819656372, 3.670789957046509, 4.397400856018066, 5.124012470245361, 5.850623607635498, 6.577234745025635, 7.3038458824157715, 8.030457496643066, 8.757068634033203, 9.48367977142334, 10.210290908813477, 10.936902046203613, 11.66351318359375, 12.390124320983887]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 10.0, 7.0, 14.0, 13.0, 20.0, 17.0, 16.0, 23.0, 27.0, 21.0, 22.0, 21.0, 32.0, 34.0, 68.0, 66.0, 76.0, 81.0, 61.0, 42.0, 35.0, 34.0, 31.0, 24.0, 31.0, 28.0, 20.0, 19.0, 15.0, 14.0, 11.0, 11.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.063471794128418, -4.909416198730469, -4.7553606033325195, -4.60130500793457, -4.447249412536621, -4.293193817138672, -4.139138221740723, -3.9850826263427734, -3.831027030944824, -3.676971435546875, -3.522915840148926, -3.3688602447509766, -3.2148046493530273, -3.060749053955078, -2.906693458557129, -2.7526378631591797, -2.5985822677612305, -2.4445266723632812, -2.290471076965332, -2.136415481567383, -1.9823598861694336, -1.8283042907714844, -1.6742486953735352, -1.520193099975586, -1.3661375045776367, -1.2120819091796875, -1.0580263137817383, -0.9039707183837891, -0.7499151229858398, -0.5958595275878906, -0.4418039321899414, -0.2877483367919922, -0.13369321823120117, 0.020362377166748047, 0.17441797256469727, 0.3284735679626465, 0.4825291633605957, 0.6365847587585449, 0.7906403541564941, 0.9446959495544434, 1.0987515449523926, 1.2528071403503418, 1.406862735748291, 1.5609183311462402, 1.7149739265441895, 1.8690295219421387, 2.023085117340088, 2.177140712738037, 2.3311963081359863, 2.4852519035339355, 2.6393074989318848, 2.793363094329834, 2.947418689727783, 3.1014742851257324, 3.2555298805236816, 3.409585475921631, 3.56364107131958, 3.7176966667175293, 3.8717522621154785, 4.025807857513428, 4.179863452911377, 4.333919048309326, 4.487974643707275, 4.642030239105225, 4.796085834503174]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 9.0, 14.0, 16.0, 25.0, 25.0, 33.0, 60.0, 74.0, 112.0, 147.0, 224.0, 338.0, 572.0, 933.0, 1560.0, 3098.0, 7701.0, 31392.0, 324810.0, 3212950.0, 548466.0, 44028.0, 9459.0, 3615.0, 1772.0, 989.0, 576.0, 371.0, 268.0, 183.0, 124.0, 99.0, 60.0, 42.0, 24.0, 26.0, 24.0, 14.0, 13.0, 5.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7880859375, -0.7623214721679688, -0.7365570068359375, -0.7107925415039062, -0.685028076171875, -0.6592636108398438, -0.6334991455078125, -0.6077346801757812, -0.58197021484375, -0.5562057495117188, -0.5304412841796875, -0.5046768188476562, -0.478912353515625, -0.45314788818359375, -0.4273834228515625, -0.40161895751953125, -0.3758544921875, -0.35009002685546875, -0.3243255615234375, -0.29856109619140625, -0.272796630859375, -0.24703216552734375, -0.2212677001953125, -0.19550323486328125, -0.16973876953125, -0.14397430419921875, -0.1182098388671875, -0.09244537353515625, -0.066680908203125, -0.04091644287109375, -0.0151519775390625, 0.01061248779296875, 0.036376953125, 0.06214141845703125, 0.0879058837890625, 0.11367034912109375, 0.139434814453125, 0.16519927978515625, 0.1909637451171875, 0.21672821044921875, 0.24249267578125, 0.26825714111328125, 0.2940216064453125, 0.31978607177734375, 0.345550537109375, 0.37131500244140625, 0.3970794677734375, 0.42284393310546875, 0.4486083984375, 0.47437286376953125, 0.5001373291015625, 0.5259017944335938, 0.551666259765625, 0.5774307250976562, 0.6031951904296875, 0.6289596557617188, 0.65472412109375, 0.6804885864257812, 0.7062530517578125, 0.7320175170898438, 0.757781982421875, 0.7835464477539062, 0.8093109130859375, 0.8350753784179688, 0.86083984375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 13.0, 16.0, 29.0, 27.0, 49.0, 47.0, 57.0, 61.0, 71.0, 93.0, 73.0, 64.0, 67.0, 57.0, 61.0, 56.0, 27.0, 35.0, 23.0, 13.0, 14.0, 7.0, 6.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.54437255859375, -0.5257568359375, -0.50714111328125, -0.488525390625, -0.46990966796875, -0.4512939453125, -0.43267822265625, -0.4140625, -0.39544677734375, -0.3768310546875, -0.35821533203125, -0.339599609375, -0.32098388671875, -0.3023681640625, -0.28375244140625, -0.26513671875, -0.24652099609375, -0.2279052734375, -0.20928955078125, -0.190673828125, -0.17205810546875, -0.1534423828125, -0.13482666015625, -0.1162109375, -0.09759521484375, -0.0789794921875, -0.06036376953125, -0.041748046875, -0.02313232421875, -0.0045166015625, 0.01409912109375, 0.03271484375, 0.05133056640625, 0.0699462890625, 0.08856201171875, 0.107177734375, 0.12579345703125, 0.1444091796875, 0.16302490234375, 0.181640625, 0.20025634765625, 0.2188720703125, 0.23748779296875, 0.256103515625, 0.27471923828125, 0.2933349609375, 0.31195068359375, 0.33056640625, 0.34918212890625, 0.3677978515625, 0.38641357421875, 0.405029296875, 0.42364501953125, 0.4422607421875, 0.46087646484375, 0.4794921875, 0.49810791015625, 0.5167236328125, 0.53533935546875, 0.553955078125, 0.57257080078125, 0.5911865234375, 0.60980224609375, 0.62841796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 16.0, 15.0, 18.0, 30.0, 65.0, 137.0, 351.0, 1027.0, 4199.0, 34730.0, 4049112.0, 95721.0, 6512.0, 1514.0, 450.0, 174.0, 75.0, 46.0, 21.0, 16.0, 9.0, 5.0, 4.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8203125, -2.73388671875, -2.6474609375, -2.56103515625, -2.474609375, -2.38818359375, -2.3017578125, -2.21533203125, -2.12890625, -2.04248046875, -1.9560546875, -1.86962890625, -1.783203125, -1.69677734375, -1.6103515625, -1.52392578125, -1.4375, -1.35107421875, -1.2646484375, -1.17822265625, -1.091796875, -1.00537109375, -0.9189453125, -0.83251953125, -0.74609375, -0.65966796875, -0.5732421875, -0.48681640625, -0.400390625, -0.31396484375, -0.2275390625, -0.14111328125, -0.0546875, 0.03173828125, 0.1181640625, 0.20458984375, 0.291015625, 0.37744140625, 0.4638671875, 0.55029296875, 0.63671875, 0.72314453125, 0.8095703125, 0.89599609375, 0.982421875, 1.06884765625, 1.1552734375, 1.24169921875, 1.328125, 1.41455078125, 1.5009765625, 1.58740234375, 1.673828125, 1.76025390625, 1.8466796875, 1.93310546875, 2.01953125, 2.10595703125, 2.1923828125, 2.27880859375, 2.365234375, 2.45166015625, 2.5380859375, 2.62451171875, 2.7109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 2.0, 9.0, 8.0, 15.0, 18.0, 32.0, 50.0, 120.0, 247.0, 626.0, 1130.0, 931.0, 461.0, 199.0, 90.0, 41.0, 23.0, 17.0, 16.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3623046875, -1.3179931640625, -1.273681640625, -1.2293701171875, -1.18505859375, -1.1407470703125, -1.096435546875, -1.0521240234375, -1.0078125, -0.9635009765625, -0.919189453125, -0.8748779296875, -0.83056640625, -0.7862548828125, -0.741943359375, -0.6976318359375, -0.6533203125, -0.6090087890625, -0.564697265625, -0.5203857421875, -0.47607421875, -0.4317626953125, -0.387451171875, -0.3431396484375, -0.298828125, -0.2545166015625, -0.210205078125, -0.1658935546875, -0.12158203125, -0.0772705078125, -0.032958984375, 0.0113525390625, 0.0556640625, 0.0999755859375, 0.144287109375, 0.1885986328125, 0.23291015625, 0.2772216796875, 0.321533203125, 0.3658447265625, 0.41015625, 0.4544677734375, 0.498779296875, 0.5430908203125, 0.58740234375, 0.6317138671875, 0.676025390625, 0.7203369140625, 0.7646484375, 0.8089599609375, 0.853271484375, 0.8975830078125, 0.94189453125, 0.9862060546875, 1.030517578125, 1.0748291015625, 1.119140625, 1.1634521484375, 1.207763671875, 1.2520751953125, 1.29638671875, 1.3406982421875, 1.385009765625, 1.4293212890625, 1.4736328125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 8.0, 15.0, 29.0, 45.0, 81.0, 139.0, 163.0, 163.0, 131.0, 82.0, 39.0, 39.0, 15.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.939985752105713, -7.672755241394043, -7.405524253845215, -7.138293743133545, -6.871063232421875, -6.603832721710205, -6.336602210998535, -6.069371223449707, -5.802140712738037, -5.534910202026367, -5.267679214477539, -5.000448703765869, -4.733218193054199, -4.465987682342529, -4.198757171630859, -3.9315261840820312, -3.6642956733703613, -3.3970651626586914, -3.1298344135284424, -2.8626036643981934, -2.5953731536865234, -2.3281426429748535, -2.0609118938446045, -1.793681263923645, -1.5264506340026855, -1.259220004081726, -0.9919893741607666, -0.7247587442398071, -0.45752811431884766, -0.19029748439788818, 0.07693314552307129, 0.34416377544403076, 0.6113948822021484, 0.8786255121231079, 1.1458561420440674, 1.4130867719650269, 1.6803174018859863, 1.9475480318069458, 2.2147786617279053, 2.4820094108581543, 2.749239921569824, 3.016470432281494, 3.283701181411743, 3.550931930541992, 3.818162441253662, 4.085392951965332, 4.35262393951416, 4.61985445022583, 4.8870849609375, 5.15431547164917, 5.42154598236084, 5.688776969909668, 5.956007480621338, 6.223237991333008, 6.490468978881836, 6.757699489593506, 7.024930000305176, 7.292160511016846, 7.559391021728516, 7.826622009277344, 8.093852996826172, 8.361083030700684, 8.628314018249512, 8.895544052124023, 9.162775039672852]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 12.0, 12.0, 7.0, 11.0, 21.0, 19.0, 23.0, 28.0, 36.0, 49.0, 52.0, 53.0, 72.0, 57.0, 61.0, 67.0, 71.0, 57.0, 54.0, 51.0, 44.0, 41.0, 28.0, 18.0, 24.0, 14.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.923671245574951, -6.731647968292236, -6.539624214172363, -6.347600936889648, -6.155577659606934, -5.963554382324219, -5.771531105041504, -5.579507350921631, -5.387484073638916, -5.195460796356201, -5.003437042236328, -4.811413764953613, -4.619390487670898, -4.427367210388184, -4.235343933105469, -4.043320178985596, -3.851296901702881, -3.659273624420166, -3.467250108718872, -3.275226593017578, -3.0832033157348633, -2.8911800384521484, -2.6991565227508545, -2.5071330070495605, -2.3151097297668457, -2.123086452484131, -1.931062936782837, -1.7390395402908325, -1.5470161437988281, -1.3549927473068237, -1.1629693508148193, -0.9709459543228149, -0.7789225578308105, -0.5868991613388062, -0.39487576484680176, -0.20285236835479736, -0.010828971862792969, 0.18119442462921143, 0.3732178211212158, 0.5652412176132202, 0.7572646141052246, 0.949288010597229, 1.1413114070892334, 1.3333348035812378, 1.5253582000732422, 1.7173815965652466, 1.909404993057251, 2.101428508758545, 2.2934517860412598, 2.4854750633239746, 2.6774985790252686, 2.8695220947265625, 3.0615453720092773, 3.253568649291992, 3.445592164993286, 3.63761568069458, 3.829638957977295, 4.02166223526001, 4.213685989379883, 4.405709266662598, 4.5977325439453125, 4.789755821228027, 4.981779098510742, 5.173802852630615, 5.36582612991333]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 15.0, 11.0, 11.0, 31.0, 31.0, 47.0, 84.0, 109.0, 169.0, 249.0, 425.0, 613.0, 1089.0, 1890.0, 3605.0, 7085.0, 15053.0, 36889.0, 99794.0, 305194.0, 368717.0, 126190.0, 44983.0, 18433.0, 8309.0, 4141.0, 2227.0, 1203.0, 700.0, 412.0, 281.0, 180.0, 130.0, 75.0, 65.0, 34.0, 16.0, 20.0, 10.0, 12.0, 7.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5787124633789062, -0.5612335205078125, -0.5437545776367188, -0.526275634765625, -0.5087966918945312, -0.4913177490234375, -0.47383880615234375, -0.45635986328125, -0.43888092041015625, -0.4214019775390625, -0.40392303466796875, -0.386444091796875, -0.36896514892578125, -0.3514862060546875, -0.33400726318359375, -0.3165283203125, -0.29904937744140625, -0.2815704345703125, -0.26409149169921875, -0.246612548828125, -0.22913360595703125, -0.2116546630859375, -0.19417572021484375, -0.17669677734375, -0.15921783447265625, -0.1417388916015625, -0.12425994873046875, -0.106781005859375, -0.08930206298828125, -0.0718231201171875, -0.05434417724609375, -0.036865234375, -0.01938629150390625, -0.0019073486328125, 0.01557159423828125, 0.033050537109375, 0.05052947998046875, 0.0680084228515625, 0.08548736572265625, 0.10296630859375, 0.12044525146484375, 0.1379241943359375, 0.15540313720703125, 0.172882080078125, 0.19036102294921875, 0.2078399658203125, 0.22531890869140625, 0.2427978515625, 0.26027679443359375, 0.2777557373046875, 0.29523468017578125, 0.312713623046875, 0.33019256591796875, 0.3476715087890625, 0.36515045166015625, 0.38262939453125, 0.40010833740234375, 0.4175872802734375, 0.43506622314453125, 0.452545166015625, 0.47002410888671875, 0.4875030517578125, 0.5049819946289062, 0.5224609375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 5.0, 6.0, 9.0, 10.0, 12.0, 19.0, 18.0, 16.0, 19.0, 22.0, 25.0, 28.0, 45.0, 36.0, 35.0, 48.0, 46.0, 53.0, 34.0, 62.0, 39.0, 49.0, 38.0, 30.0, 40.0, 40.0, 31.0, 26.0, 24.0, 20.0, 12.0, 13.0, 20.0, 15.0, 9.0, 8.0, 6.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3821601867675781, -0.36905670166015625, -0.3559532165527344, -0.3428497314453125, -0.3297462463378906, -0.31664276123046875, -0.3035392761230469, -0.290435791015625, -0.2773323059082031, -0.26422882080078125, -0.2511253356933594, -0.2380218505859375, -0.22491836547851562, -0.21181488037109375, -0.19871139526367188, -0.18560791015625, -0.17250442504882812, -0.15940093994140625, -0.14629745483398438, -0.1331939697265625, -0.12009048461914062, -0.10698699951171875, -0.09388351440429688, -0.080780029296875, -0.06767654418945312, -0.05457305908203125, -0.041469573974609375, -0.0283660888671875, -0.015262603759765625, -0.00215911865234375, 0.010944366455078125, 0.0240478515625, 0.037151336669921875, 0.05025482177734375, 0.06335830688476562, 0.0764617919921875, 0.08956527709960938, 0.10266876220703125, 0.11577224731445312, 0.128875732421875, 0.14197921752929688, 0.15508270263671875, 0.16818618774414062, 0.1812896728515625, 0.19439315795898438, 0.20749664306640625, 0.22060012817382812, 0.23370361328125, 0.24680709838867188, 0.25991058349609375, 0.2730140686035156, 0.2861175537109375, 0.2992210388183594, 0.31232452392578125, 0.3254280090332031, 0.338531494140625, 0.3516349792480469, 0.36473846435546875, 0.3778419494628906, 0.3909454345703125, 0.4040489196777344, 0.41715240478515625, 0.4302558898925781, 0.443359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 16.0, 27.0, 37.0, 53.0, 90.0, 144.0, 308.0, 630.0, 1993.0, 10287.0, 148225.0, 847107.0, 33327.0, 4272.0, 1111.0, 426.0, 191.0, 109.0, 60.0, 46.0, 22.0, 16.0, 13.0, 8.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.1059722900390625, -2.047882080078125, -1.9897918701171875, -1.93170166015625, -1.8736114501953125, -1.815521240234375, -1.7574310302734375, -1.6993408203125, -1.6412506103515625, -1.583160400390625, -1.5250701904296875, -1.46697998046875, -1.4088897705078125, -1.350799560546875, -1.2927093505859375, -1.234619140625, -1.1765289306640625, -1.118438720703125, -1.0603485107421875, -1.00225830078125, -0.9441680908203125, -0.886077880859375, -0.8279876708984375, -0.7698974609375, -0.7118072509765625, -0.653717041015625, -0.5956268310546875, -0.53753662109375, -0.4794464111328125, -0.421356201171875, -0.3632659912109375, -0.30517578125, -0.2470855712890625, -0.188995361328125, -0.1309051513671875, -0.07281494140625, -0.0147247314453125, 0.043365478515625, 0.1014556884765625, 0.1595458984375, 0.2176361083984375, 0.275726318359375, 0.3338165283203125, 0.39190673828125, 0.4499969482421875, 0.508087158203125, 0.5661773681640625, 0.624267578125, 0.6823577880859375, 0.740447998046875, 0.7985382080078125, 0.85662841796875, 0.9147186279296875, 0.972808837890625, 1.0308990478515625, 1.0889892578125, 1.1470794677734375, 1.205169677734375, 1.2632598876953125, 1.32135009765625, 1.3794403076171875, 1.437530517578125, 1.4956207275390625, 1.5537109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 8.0, 11.0, 9.0, 21.0, 10.0, 35.0, 24.0, 38.0, 37.0, 42.0, 53.0, 55.0, 79.0, 64.0, 59.0, 64.0, 61.0, 60.0, 46.0, 38.0, 37.0, 25.0, 24.0, 18.0, 16.0, 10.0, 12.0, 14.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.380859375, -2.3116455078125, -2.242431640625, -2.1732177734375, -2.10400390625, -2.0347900390625, -1.965576171875, -1.8963623046875, -1.8271484375, -1.7579345703125, -1.688720703125, -1.6195068359375, -1.55029296875, -1.4810791015625, -1.411865234375, -1.3426513671875, -1.2734375, -1.2042236328125, -1.135009765625, -1.0657958984375, -0.99658203125, -0.9273681640625, -0.858154296875, -0.7889404296875, -0.7197265625, -0.6505126953125, -0.581298828125, -0.5120849609375, -0.44287109375, -0.3736572265625, -0.304443359375, -0.2352294921875, -0.166015625, -0.0968017578125, -0.027587890625, 0.0416259765625, 0.11083984375, 0.1800537109375, 0.249267578125, 0.3184814453125, 0.3876953125, 0.4569091796875, 0.526123046875, 0.5953369140625, 0.66455078125, 0.7337646484375, 0.802978515625, 0.8721923828125, 0.94140625, 1.0106201171875, 1.079833984375, 1.1490478515625, 1.21826171875, 1.2874755859375, 1.356689453125, 1.4259033203125, 1.4951171875, 1.5643310546875, 1.633544921875, 1.7027587890625, 1.77197265625, 1.8411865234375, 1.910400390625, 1.9796142578125, 2.048828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 8.0, 2.0, 2.0, 3.0, 7.0, 10.0, 12.0, 13.0, 14.0, 20.0, 26.0, 17.0, 50.0, 76.0, 101.0, 166.0, 299.0, 576.0, 1263.0, 3587.0, 12797.0, 64219.0, 758393.0, 169690.0, 26814.0, 6548.0, 2005.0, 845.0, 373.0, 206.0, 125.0, 75.0, 46.0, 48.0, 29.0, 20.0, 18.0, 12.0, 12.0, 9.0, 2.0, 9.0, 2.0, 1.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.416259765625, -0.40392303466796875, -0.3915863037109375, -0.37924957275390625, -0.366912841796875, -0.35457611083984375, -0.3422393798828125, -0.32990264892578125, -0.31756591796875, -0.30522918701171875, -0.2928924560546875, -0.28055572509765625, -0.268218994140625, -0.25588226318359375, -0.2435455322265625, -0.23120880126953125, -0.2188720703125, -0.20653533935546875, -0.1941986083984375, -0.18186187744140625, -0.169525146484375, -0.15718841552734375, -0.1448516845703125, -0.13251495361328125, -0.12017822265625, -0.10784149169921875, -0.0955047607421875, -0.08316802978515625, -0.070831298828125, -0.05849456787109375, -0.0461578369140625, -0.03382110595703125, -0.021484375, -0.00914764404296875, 0.0031890869140625, 0.01552581787109375, 0.027862548828125, 0.04019927978515625, 0.0525360107421875, 0.06487274169921875, 0.07720947265625, 0.08954620361328125, 0.1018829345703125, 0.11421966552734375, 0.126556396484375, 0.13889312744140625, 0.1512298583984375, 0.16356658935546875, 0.1759033203125, 0.18824005126953125, 0.2005767822265625, 0.21291351318359375, 0.225250244140625, 0.23758697509765625, 0.2499237060546875, 0.26226043701171875, 0.27459716796875, 0.28693389892578125, 0.2992706298828125, 0.31160736083984375, 0.323944091796875, 0.33628082275390625, 0.3486175537109375, 0.36095428466796875, 0.373291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 4.0, 6.0, 12.0, 7.0, 24.0, 19.0, 34.0, 46.0, 68.0, 76.0, 130.0, 139.0, 108.0, 78.0, 60.0, 42.0, 31.0, 16.0, 21.0, 7.0, 19.0, 9.0, 7.0, 8.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010526180267333984, -0.00010227877646684647, -9.929575026035309e-05, -9.631272405385971e-05, -9.332969784736633e-05, -9.034667164087296e-05, -8.736364543437958e-05, -8.43806192278862e-05, -8.139759302139282e-05, -7.841456681489944e-05, -7.543154060840607e-05, -7.244851440191269e-05, -6.946548819541931e-05, -6.648246198892593e-05, -6.349943578243256e-05, -6.051640957593918e-05, -5.75333833694458e-05, -5.455035716295242e-05, -5.1567330956459045e-05, -4.858430474996567e-05, -4.560127854347229e-05, -4.261825233697891e-05, -3.9635226130485535e-05, -3.665219992399216e-05, -3.366917371749878e-05, -3.06861475110054e-05, -2.7703121304512024e-05, -2.4720095098018646e-05, -2.173706889152527e-05, -1.875404268503189e-05, -1.5771016478538513e-05, -1.2787990272045135e-05, -9.804964065551758e-06, -6.82193785905838e-06, -3.8389116525650024e-06, -8.558854460716248e-07, 2.127140760421753e-06, 5.110166966915131e-06, 8.093193173408508e-06, 1.1076219379901886e-05, 1.4059245586395264e-05, 1.704227179288864e-05, 2.002529799938202e-05, 2.3008324205875397e-05, 2.5991350412368774e-05, 2.8974376618862152e-05, 3.195740282535553e-05, 3.494042903184891e-05, 3.7923455238342285e-05, 4.090648144483566e-05, 4.388950765132904e-05, 4.687253385782242e-05, 4.9855560064315796e-05, 5.2838586270809174e-05, 5.582161247730255e-05, 5.880463868379593e-05, 6.17876648902893e-05, 6.477069109678268e-05, 6.775371730327606e-05, 7.073674350976944e-05, 7.371976971626282e-05, 7.67027959227562e-05, 7.968582212924957e-05, 8.266884833574295e-05, 8.565187454223633e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 12.0, 13.0, 20.0, 29.0, 52.0, 79.0, 109.0, 169.0, 316.0, 483.0, 890.0, 1689.0, 3683.0, 8115.0, 22446.0, 72448.0, 608135.0, 244210.0, 54602.0, 17701.0, 6950.0, 3078.0, 1456.0, 739.0, 405.0, 239.0, 159.0, 108.0, 64.0, 42.0, 23.0, 26.0, 17.0, 14.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2639732360839844, -0.25450897216796875, -0.24504470825195312, -0.2355804443359375, -0.22611618041992188, -0.21665191650390625, -0.20718765258789062, -0.197723388671875, -0.18825912475585938, -0.17879486083984375, -0.16933059692382812, -0.1598663330078125, -0.15040206909179688, -0.14093780517578125, -0.13147354125976562, -0.12200927734375, -0.11254501342773438, -0.10308074951171875, -0.09361648559570312, -0.0841522216796875, -0.07468795776367188, -0.06522369384765625, -0.055759429931640625, -0.046295166015625, -0.036830902099609375, -0.02736663818359375, -0.017902374267578125, -0.0084381103515625, 0.001026153564453125, 0.01049041748046875, 0.019954681396484375, 0.0294189453125, 0.038883209228515625, 0.04834747314453125, 0.057811737060546875, 0.0672760009765625, 0.07674026489257812, 0.08620452880859375, 0.09566879272460938, 0.105133056640625, 0.11459732055664062, 0.12406158447265625, 0.13352584838867188, 0.1429901123046875, 0.15245437622070312, 0.16191864013671875, 0.17138290405273438, 0.18084716796875, 0.19031143188476562, 0.19977569580078125, 0.20923995971679688, 0.2187042236328125, 0.22816848754882812, 0.23763275146484375, 0.24709701538085938, 0.256561279296875, 0.2660255432128906, 0.27548980712890625, 0.2849540710449219, 0.2944183349609375, 0.3038825988769531, 0.31334686279296875, 0.3228111267089844, 0.332275390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 7.0, 6.0, 5.0, 9.0, 22.0, 14.0, 18.0, 25.0, 27.0, 36.0, 41.0, 51.0, 65.0, 60.0, 92.0, 77.0, 72.0, 72.0, 51.0, 32.0, 34.0, 35.0, 23.0, 17.0, 25.0, 18.0, 10.0, 7.0, 6.0, 3.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2626953125, -0.2533988952636719, -0.24410247802734375, -0.23480606079101562, -0.2255096435546875, -0.21621322631835938, -0.20691680908203125, -0.19762039184570312, -0.188323974609375, -0.17902755737304688, -0.16973114013671875, -0.16043472290039062, -0.1511383056640625, -0.14184188842773438, -0.13254547119140625, -0.12324905395507812, -0.11395263671875, -0.10465621948242188, -0.09535980224609375, -0.08606338500976562, -0.0767669677734375, -0.06747055053710938, -0.05817413330078125, -0.048877716064453125, -0.039581298828125, -0.030284881591796875, -0.02098846435546875, -0.011692047119140625, -0.0023956298828125, 0.006900787353515625, 0.01619720458984375, 0.025493621826171875, 0.0347900390625, 0.044086456298828125, 0.05338287353515625, 0.06267929077148438, 0.0719757080078125, 0.08127212524414062, 0.09056854248046875, 0.09986495971679688, 0.109161376953125, 0.11845779418945312, 0.12775421142578125, 0.13705062866210938, 0.1463470458984375, 0.15564346313476562, 0.16493988037109375, 0.17423629760742188, 0.18353271484375, 0.19282913208007812, 0.20212554931640625, 0.21142196655273438, 0.2207183837890625, 0.23001480102539062, 0.23931121826171875, 0.24860763549804688, 0.257904052734375, 0.2672004699707031, 0.27649688720703125, 0.2857933044433594, 0.2950897216796875, 0.3043861389160156, 0.31368255615234375, 0.3229789733886719, 0.332275390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 11.0, 47.0, 70.0, 167.0, 375.0, 134.0, 83.0, 46.0, 13.0, 11.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.934327125549316, -7.579606056213379, -7.224884986877441, -6.870163440704346, -6.515442371368408, -6.160721302032471, -5.805999755859375, -5.4512786865234375, -5.0965576171875, -4.7418365478515625, -4.387115478515625, -4.032393932342529, -3.677672863006592, -3.3229517936706543, -2.9682304859161377, -2.613509178161621, -2.2587881088256836, -1.9040669202804565, -1.5493457317352295, -1.1946245431900024, -0.8399033546447754, -0.48518216609954834, -0.1304609775543213, 0.2242603302001953, 0.5789813995361328, 0.9337025880813599, 1.288423776626587, 1.643144965171814, 1.997866153717041, 2.3525872230529785, 2.707308530807495, 3.0620298385620117, 3.416749954223633, 3.7714710235595703, 4.126192092895508, 4.4809136390686035, 4.835634708404541, 5.1903557777404785, 5.545077323913574, 5.899798393249512, 6.254519462585449, 6.609240531921387, 6.963961601257324, 7.31868314743042, 7.673404216766357, 8.028125762939453, 8.38284683227539, 8.737567901611328, 9.092288970947266, 9.447010040283203, 9.80173110961914, 10.156452178955078, 10.511173248291016, 10.86589527130127, 11.220616340637207, 11.575337409973145, 11.930058479309082, 12.28477954864502, 12.639500617980957, 12.994221687316895, 13.348943710327148, 13.703664779663086, 14.058385848999023, 14.413106918334961, 14.767827987670898]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 4.0, 4.0, 8.0, 4.0, 6.0, 16.0, 25.0, 20.0, 18.0, 17.0, 19.0, 21.0, 21.0, 30.0, 38.0, 40.0, 49.0, 79.0, 131.0, 90.0, 76.0, 39.0, 30.0, 29.0, 25.0, 17.0, 26.0, 15.0, 12.0, 13.0, 13.0, 10.0, 6.0, 8.0, 9.0, 6.0, 7.0, 1.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.095690727233887, -5.882575511932373, -5.669460296630859, -5.456345081329346, -5.243229866027832, -5.030114650726318, -4.816999435424805, -4.603883743286133, -4.390769004821777, -4.177653789520264, -3.96453857421875, -3.7514233589172363, -3.5383081436157227, -3.325192928314209, -3.112077474594116, -2.8989622592926025, -2.6858468055725098, -2.472731590270996, -2.2596163749694824, -2.0465011596679688, -1.8333858251571655, -1.6202706098556519, -1.4071552753448486, -1.194040060043335, -0.9809248447418213, -0.7678096294403076, -0.5546943545341492, -0.3415790796279907, -0.12846386432647705, 0.08465135097503662, 0.29776668548583984, 0.5108819007873535, 0.723996639251709, 0.9371118545532227, 1.1502270698547363, 1.3633424043655396, 1.5764576196670532, 1.789572834968567, 2.00268816947937, 2.215803384780884, 2.4289186000823975, 2.642033815383911, 2.855149030685425, 3.0682644844055176, 3.2813796997070312, 3.494494915008545, 3.7076101303100586, 3.9207253456115723, 4.133840560913086, 4.3469557762146, 4.560070991516113, 4.773186206817627, 4.986301422119141, 5.199416637420654, 5.412531852722168, 5.62564754486084, 5.838762283325195, 6.051877498626709, 6.264992713928223, 6.478107929229736, 6.69122314453125, 6.904338359832764, 7.117453575134277, 7.330569267272949, 7.543684482574463]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 28.0, 40.0, 54.0, 95.0, 125.0, 184.0, 326.0, 538.0, 976.0, 1775.0, 3240.0, 7198.0, 18133.0, 70981.0, 520699.0, 2489971.0, 919586.0, 116865.0, 25374.0, 9040.0, 4113.0, 2095.0, 1126.0, 644.0, 340.0, 235.0, 141.0, 101.0, 59.0, 40.0, 28.0, 25.0, 17.0, 10.0, 14.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.89404296875, -0.8648605346679688, -0.8356781005859375, -0.8064956665039062, -0.777313232421875, -0.7481307983398438, -0.7189483642578125, -0.6897659301757812, -0.66058349609375, -0.6314010620117188, -0.6022186279296875, -0.5730361938476562, -0.543853759765625, -0.5146713256835938, -0.4854888916015625, -0.45630645751953125, -0.4271240234375, -0.39794158935546875, -0.3687591552734375, -0.33957672119140625, -0.310394287109375, -0.28121185302734375, -0.2520294189453125, -0.22284698486328125, -0.19366455078125, -0.16448211669921875, -0.1352996826171875, -0.10611724853515625, -0.076934814453125, -0.04775238037109375, -0.0185699462890625, 0.01061248779296875, 0.039794921875, 0.06897735595703125, 0.0981597900390625, 0.12734222412109375, 0.156524658203125, 0.18570709228515625, 0.2148895263671875, 0.24407196044921875, 0.27325439453125, 0.30243682861328125, 0.3316192626953125, 0.36080169677734375, 0.389984130859375, 0.41916656494140625, 0.4483489990234375, 0.47753143310546875, 0.5067138671875, 0.5358963012695312, 0.5650787353515625, 0.5942611694335938, 0.623443603515625, 0.6526260375976562, 0.6818084716796875, 0.7109909057617188, 0.74017333984375, 0.7693557739257812, 0.7985382080078125, 0.8277206420898438, 0.856903076171875, 0.8860855102539062, 0.9152679443359375, 0.9444503784179688, 0.9736328125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 10.0, 13.0, 17.0, 25.0, 21.0, 19.0, 31.0, 25.0, 34.0, 40.0, 39.0, 42.0, 39.0, 33.0, 52.0, 54.0, 55.0, 50.0, 51.0, 44.0, 49.0, 35.0, 29.0, 34.0, 30.0, 23.0, 18.0, 13.0, 11.0, 7.0, 9.0, 8.0, 1.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.403076171875, -0.3893318176269531, -0.37558746337890625, -0.3618431091308594, -0.3480987548828125, -0.3343544006347656, -0.32061004638671875, -0.3068656921386719, -0.293121337890625, -0.2793769836425781, -0.26563262939453125, -0.2518882751464844, -0.2381439208984375, -0.22439956665039062, -0.21065521240234375, -0.19691085815429688, -0.18316650390625, -0.16942214965820312, -0.15567779541015625, -0.14193344116210938, -0.1281890869140625, -0.11444473266601562, -0.10070037841796875, -0.08695602416992188, -0.073211669921875, -0.059467315673828125, -0.04572296142578125, -0.031978607177734375, -0.0182342529296875, -0.004489898681640625, 0.00925445556640625, 0.022998809814453125, 0.0367431640625, 0.050487518310546875, 0.06423187255859375, 0.07797622680664062, 0.0917205810546875, 0.10546493530273438, 0.11920928955078125, 0.13295364379882812, 0.146697998046875, 0.16044235229492188, 0.17418670654296875, 0.18793106079101562, 0.2016754150390625, 0.21541976928710938, 0.22916412353515625, 0.24290847778320312, 0.25665283203125, 0.2703971862792969, 0.28414154052734375, 0.2978858947753906, 0.3116302490234375, 0.3253746032714844, 0.33911895751953125, 0.3528633117675781, 0.366607666015625, 0.3803520202636719, 0.39409637451171875, 0.4078407287597656, 0.4215850830078125, 0.4353294372558594, 0.44907379150390625, 0.4628181457519531, 0.4765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 3.0, 3.0, 10.0, 16.0, 16.0, 27.0, 41.0, 45.0, 85.0, 152.0, 286.0, 467.0, 1071.0, 2975.0, 13445.0, 445771.0, 3694882.0, 27656.0, 4485.0, 1422.0, 610.0, 332.0, 154.0, 105.0, 73.0, 48.0, 28.0, 15.0, 9.0, 8.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.947265625, -3.834991455078125, -3.72271728515625, -3.610443115234375, -3.4981689453125, -3.385894775390625, -3.27362060546875, -3.161346435546875, -3.049072265625, -2.936798095703125, -2.82452392578125, -2.712249755859375, -2.5999755859375, -2.487701416015625, -2.37542724609375, -2.263153076171875, -2.15087890625, -2.038604736328125, -1.92633056640625, -1.814056396484375, -1.7017822265625, -1.589508056640625, -1.47723388671875, -1.364959716796875, -1.252685546875, -1.140411376953125, -1.02813720703125, -0.915863037109375, -0.8035888671875, -0.691314697265625, -0.57904052734375, -0.466766357421875, -0.3544921875, -0.242218017578125, -0.12994384765625, -0.017669677734375, 0.0946044921875, 0.206878662109375, 0.31915283203125, 0.431427001953125, 0.543701171875, 0.655975341796875, 0.76824951171875, 0.880523681640625, 0.9927978515625, 1.105072021484375, 1.21734619140625, 1.329620361328125, 1.44189453125, 1.554168701171875, 1.66644287109375, 1.778717041015625, 1.8909912109375, 2.003265380859375, 2.11553955078125, 2.227813720703125, 2.340087890625, 2.452362060546875, 2.56463623046875, 2.676910400390625, 2.7891845703125, 2.901458740234375, 3.01373291015625, 3.126007080078125, 3.23828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 10.0, 18.0, 14.0, 32.0, 44.0, 45.0, 74.0, 93.0, 175.0, 285.0, 448.0, 647.0, 677.0, 539.0, 337.0, 176.0, 125.0, 72.0, 63.0, 43.0, 29.0, 28.0, 22.0, 17.0, 7.0, 14.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.865234375, -1.813446044921875, -1.76165771484375, -1.709869384765625, -1.6580810546875, -1.606292724609375, -1.55450439453125, -1.502716064453125, -1.450927734375, -1.399139404296875, -1.34735107421875, -1.295562744140625, -1.2437744140625, -1.191986083984375, -1.14019775390625, -1.088409423828125, -1.03662109375, -0.984832763671875, -0.93304443359375, -0.881256103515625, -0.8294677734375, -0.777679443359375, -0.72589111328125, -0.674102783203125, -0.622314453125, -0.570526123046875, -0.51873779296875, -0.466949462890625, -0.4151611328125, -0.363372802734375, -0.31158447265625, -0.259796142578125, -0.2080078125, -0.156219482421875, -0.10443115234375, -0.052642822265625, -0.0008544921875, 0.050933837890625, 0.10272216796875, 0.154510498046875, 0.206298828125, 0.258087158203125, 0.30987548828125, 0.361663818359375, 0.4134521484375, 0.465240478515625, 0.51702880859375, 0.568817138671875, 0.62060546875, 0.672393798828125, 0.72418212890625, 0.775970458984375, 0.8277587890625, 0.879547119140625, 0.93133544921875, 0.983123779296875, 1.034912109375, 1.086700439453125, 1.13848876953125, 1.190277099609375, 1.2420654296875, 1.293853759765625, 1.34564208984375, 1.397430419921875, 1.44921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 17.0, 12.0, 16.0, 35.0, 39.0, 83.0, 127.0, 167.0, 149.0, 109.0, 78.0, 55.0, 32.0, 20.0, 15.0, 3.0, 9.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.559200286865234, -15.053767204284668, -14.548334121704102, -14.042901992797852, -13.537468910217285, -13.032035827636719, -12.526603698730469, -12.021170616149902, -11.515737533569336, -11.01030445098877, -10.504871368408203, -9.999439239501953, -9.494006156921387, -8.98857307434082, -8.48314094543457, -7.977707862854004, -7.4722747802734375, -6.966841697692871, -6.461409091949463, -5.955976486206055, -5.450543403625488, -4.945110321044922, -4.439677715301514, -3.9342448711395264, -3.428812026977539, -2.9233791828155518, -2.4179463386535645, -1.9125134944915771, -1.4070806503295898, -0.9016478061676025, -0.39621496200561523, 0.10921788215637207, 0.6146526336669922, 1.1200854778289795, 1.6255183219909668, 2.130951166152954, 2.6363840103149414, 3.1418168544769287, 3.647249698638916, 4.152682304382324, 4.658115386962891, 5.163548469543457, 5.668981075286865, 6.174413681030273, 6.67984676361084, 7.185279846191406, 7.6907124519348145, 8.196145057678223, 8.701578140258789, 9.207011222839355, 9.712444305419922, 10.217876434326172, 10.723309516906738, 11.228742599487305, 11.734174728393555, 12.239607810974121, 12.745040893554688, 13.250473976135254, 13.75590705871582, 14.26133918762207, 14.766772270202637, 15.272205352783203, 15.777637481689453, 16.283071517944336, 16.788503646850586]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 6.0, 12.0, 14.0, 11.0, 15.0, 19.0, 26.0, 26.0, 31.0, 31.0, 34.0, 38.0, 67.0, 60.0, 57.0, 59.0, 61.0, 50.0, 57.0, 42.0, 44.0, 38.0, 29.0, 26.0, 26.0, 18.0, 16.0, 13.0, 15.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.41578483581543, -8.112004280090332, -7.808223247528076, -7.50444221496582, -7.200661659240723, -6.896880626678467, -6.593099594116211, -6.289319038391113, -5.985538005828857, -5.681756973266602, -5.377976417541504, -5.074195384979248, -4.770414352416992, -4.4666337966918945, -4.162852764129639, -3.859071969985962, -3.555291175842285, -3.2515103816986084, -2.9477295875549316, -2.643948554992676, -2.340167760848999, -2.0363869667053223, -1.732606053352356, -1.4288251399993896, -1.125044345855713, -0.8212634921073914, -0.5174826383590698, -0.2137017846107483, 0.09007906913757324, 0.39385986328125, 0.6976407766342163, 1.0014216899871826, 1.3052024841308594, 1.6089832782745361, 1.9127641916275024, 2.2165451049804688, 2.5203258991241455, 2.8241066932678223, 3.127887725830078, 3.431668519973755, 3.7354493141174316, 4.0392303466796875, 4.343010902404785, 4.646791934967041, 4.950572967529297, 5.2543535232543945, 5.55813455581665, 5.861915588378906, 6.165696144104004, 6.46947717666626, 6.773257732391357, 7.077038764953613, 7.380819320678711, 7.684600353240967, 7.988381385803223, 8.29216194152832, 8.595943450927734, 8.899724006652832, 9.203505516052246, 9.507286071777344, 9.811066627502441, 10.114847183227539, 10.418628692626953, 10.72240924835205, 11.026189804077148]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 10.0, 6.0, 6.0, 17.0, 20.0, 25.0, 56.0, 70.0, 103.0, 167.0, 290.0, 439.0, 769.0, 1330.0, 2625.0, 6079.0, 17121.0, 69439.0, 599148.0, 285720.0, 43241.0, 12168.0, 4771.0, 2100.0, 1126.0, 632.0, 432.0, 211.0, 141.0, 98.0, 61.0, 50.0, 25.0, 19.0, 13.0, 8.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.138671875, -1.1017608642578125, -1.064849853515625, -1.0279388427734375, -0.99102783203125, -0.9541168212890625, -0.917205810546875, -0.8802947998046875, -0.8433837890625, -0.8064727783203125, -0.769561767578125, -0.7326507568359375, -0.69573974609375, -0.6588287353515625, -0.621917724609375, -0.5850067138671875, -0.548095703125, -0.5111846923828125, -0.474273681640625, -0.4373626708984375, -0.40045166015625, -0.3635406494140625, -0.326629638671875, -0.2897186279296875, -0.2528076171875, -0.2158966064453125, -0.178985595703125, -0.1420745849609375, -0.10516357421875, -0.0682525634765625, -0.031341552734375, 0.0055694580078125, 0.04248046875, 0.0793914794921875, 0.116302490234375, 0.1532135009765625, 0.19012451171875, 0.2270355224609375, 0.263946533203125, 0.3008575439453125, 0.3377685546875, 0.3746795654296875, 0.411590576171875, 0.4485015869140625, 0.48541259765625, 0.5223236083984375, 0.559234619140625, 0.5961456298828125, 0.633056640625, 0.6699676513671875, 0.706878662109375, 0.7437896728515625, 0.78070068359375, 0.8176116943359375, 0.854522705078125, 0.8914337158203125, 0.9283447265625, 0.9652557373046875, 1.002166748046875, 1.0390777587890625, 1.07598876953125, 1.1128997802734375, 1.149810791015625, 1.1867218017578125, 1.2236328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 14.0, 20.0, 24.0, 23.0, 29.0, 22.0, 46.0, 54.0, 48.0, 46.0, 71.0, 70.0, 60.0, 47.0, 56.0, 52.0, 49.0, 45.0, 29.0, 34.0, 32.0, 20.0, 19.0, 18.0, 7.0, 3.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6661376953125, -0.643798828125, -0.6214599609375, -0.59912109375, -0.5767822265625, -0.554443359375, -0.5321044921875, -0.509765625, -0.4874267578125, -0.465087890625, -0.4427490234375, -0.42041015625, -0.3980712890625, -0.375732421875, -0.3533935546875, -0.3310546875, -0.3087158203125, -0.286376953125, -0.2640380859375, -0.24169921875, -0.2193603515625, -0.197021484375, -0.1746826171875, -0.15234375, -0.1300048828125, -0.107666015625, -0.0853271484375, -0.06298828125, -0.0406494140625, -0.018310546875, 0.0040283203125, 0.0263671875, 0.0487060546875, 0.071044921875, 0.0933837890625, 0.11572265625, 0.1380615234375, 0.160400390625, 0.1827392578125, 0.205078125, 0.2274169921875, 0.249755859375, 0.2720947265625, 0.29443359375, 0.3167724609375, 0.339111328125, 0.3614501953125, 0.3837890625, 0.4061279296875, 0.428466796875, 0.4508056640625, 0.47314453125, 0.4954833984375, 0.517822265625, 0.5401611328125, 0.5625, 0.5848388671875, 0.607177734375, 0.6295166015625, 0.65185546875, 0.6741943359375, 0.696533203125, 0.7188720703125, 0.7412109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 11.0, 18.0, 26.0, 39.0, 60.0, 90.0, 162.0, 311.0, 789.0, 3066.0, 32560.0, 978828.0, 28063.0, 2999.0, 776.0, 299.0, 154.0, 94.0, 54.0, 39.0, 21.0, 14.0, 18.0, 4.0, 8.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.51702880859375, -2.4344482421875, -2.35186767578125, -2.269287109375, -2.18670654296875, -2.1041259765625, -2.02154541015625, -1.93896484375, -1.85638427734375, -1.7738037109375, -1.69122314453125, -1.608642578125, -1.52606201171875, -1.4434814453125, -1.36090087890625, -1.2783203125, -1.19573974609375, -1.1131591796875, -1.03057861328125, -0.947998046875, -0.86541748046875, -0.7828369140625, -0.70025634765625, -0.61767578125, -0.53509521484375, -0.4525146484375, -0.36993408203125, -0.287353515625, -0.20477294921875, -0.1221923828125, -0.03961181640625, 0.04296875, 0.12554931640625, 0.2081298828125, 0.29071044921875, 0.373291015625, 0.45587158203125, 0.5384521484375, 0.62103271484375, 0.70361328125, 0.78619384765625, 0.8687744140625, 0.95135498046875, 1.033935546875, 1.11651611328125, 1.1990966796875, 1.28167724609375, 1.3642578125, 1.44683837890625, 1.5294189453125, 1.61199951171875, 1.694580078125, 1.77716064453125, 1.8597412109375, 1.94232177734375, 2.02490234375, 2.10748291015625, 2.1900634765625, 2.27264404296875, 2.355224609375, 2.43780517578125, 2.5203857421875, 2.60296630859375, 2.685546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 9.0, 16.0, 13.0, 12.0, 28.0, 24.0, 31.0, 25.0, 39.0, 62.0, 75.0, 102.0, 98.0, 79.0, 64.0, 66.0, 32.0, 42.0, 26.0, 21.0, 24.0, 13.0, 13.0, 13.0, 9.0, 7.0, 10.0, 4.0, 6.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.927398681640625, -2.83135986328125, -2.735321044921875, -2.6392822265625, -2.543243408203125, -2.44720458984375, -2.351165771484375, -2.255126953125, -2.159088134765625, -2.06304931640625, -1.967010498046875, -1.8709716796875, -1.774932861328125, -1.67889404296875, -1.582855224609375, -1.48681640625, -1.390777587890625, -1.29473876953125, -1.198699951171875, -1.1026611328125, -1.006622314453125, -0.91058349609375, -0.814544677734375, -0.718505859375, -0.622467041015625, -0.52642822265625, -0.430389404296875, -0.3343505859375, -0.238311767578125, -0.14227294921875, -0.046234130859375, 0.0498046875, 0.145843505859375, 0.24188232421875, 0.337921142578125, 0.4339599609375, 0.529998779296875, 0.62603759765625, 0.722076416015625, 0.818115234375, 0.914154052734375, 1.01019287109375, 1.106231689453125, 1.2022705078125, 1.298309326171875, 1.39434814453125, 1.490386962890625, 1.58642578125, 1.682464599609375, 1.77850341796875, 1.874542236328125, 1.9705810546875, 2.066619873046875, 2.16265869140625, 2.258697509765625, 2.354736328125, 2.450775146484375, 2.54681396484375, 2.642852783203125, 2.7388916015625, 2.834930419921875, 2.93096923828125, 3.027008056640625, 3.123046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 9.0, 13.0, 21.0, 33.0, 54.0, 101.0, 208.0, 516.0, 1541.0, 8333.0, 263455.0, 762548.0, 9079.0, 1615.0, 513.0, 215.0, 115.0, 51.0, 36.0, 20.0, 22.0, 8.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.43994140625, -0.4236602783203125, -0.407379150390625, -0.3910980224609375, -0.37481689453125, -0.3585357666015625, -0.342254638671875, -0.3259735107421875, -0.3096923828125, -0.2934112548828125, -0.277130126953125, -0.2608489990234375, -0.24456787109375, -0.2282867431640625, -0.212005615234375, -0.1957244873046875, -0.179443359375, -0.1631622314453125, -0.146881103515625, -0.1305999755859375, -0.11431884765625, -0.0980377197265625, -0.081756591796875, -0.0654754638671875, -0.0491943359375, -0.0329132080078125, -0.016632080078125, -0.0003509521484375, 0.01593017578125, 0.0322113037109375, 0.048492431640625, 0.0647735595703125, 0.0810546875, 0.0973358154296875, 0.113616943359375, 0.1298980712890625, 0.14617919921875, 0.1624603271484375, 0.178741455078125, 0.1950225830078125, 0.2113037109375, 0.2275848388671875, 0.243865966796875, 0.2601470947265625, 0.27642822265625, 0.2927093505859375, 0.308990478515625, 0.3252716064453125, 0.341552734375, 0.3578338623046875, 0.374114990234375, 0.3903961181640625, 0.40667724609375, 0.4229583740234375, 0.439239501953125, 0.4555206298828125, 0.4718017578125, 0.4880828857421875, 0.504364013671875, 0.5206451416015625, 0.53692626953125, 0.5532073974609375, 0.569488525390625, 0.5857696533203125, 0.60205078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 15.0, 28.0, 42.0, 75.0, 179.0, 296.0, 161.0, 72.0, 48.0, 35.0, 9.0, 7.0, 5.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015843287110328674, -0.00015354901552200317, -0.0001486651599407196, -0.00014378130435943604, -0.00013889744877815247, -0.0001340135931968689, -0.00012912973761558533, -0.00012424588203430176, -0.00011936202645301819, -0.00011447817087173462, -0.00010959431529045105, -0.00010471045970916748, -9.982660412788391e-05, -9.494274854660034e-05, -9.005889296531677e-05, -8.51750373840332e-05, -8.029118180274963e-05, -7.540732622146606e-05, -7.05234706401825e-05, -6.563961505889893e-05, -6.0755759477615356e-05, -5.587190389633179e-05, -5.098804831504822e-05, -4.610419273376465e-05, -4.122033715248108e-05, -3.633648157119751e-05, -3.145262598991394e-05, -2.656877040863037e-05, -2.1684914827346802e-05, -1.6801059246063232e-05, -1.1917203664779663e-05, -7.033348083496094e-06, -2.1494925022125244e-06, 2.734363079071045e-06, 7.618218660354614e-06, 1.2502074241638184e-05, 1.7385929822921753e-05, 2.2269785404205322e-05, 2.715364098548889e-05, 3.203749656677246e-05, 3.692135214805603e-05, 4.18052077293396e-05, 4.668906331062317e-05, 5.157291889190674e-05, 5.645677447319031e-05, 6.134063005447388e-05, 6.622448563575745e-05, 7.110834121704102e-05, 7.599219679832458e-05, 8.087605237960815e-05, 8.575990796089172e-05, 9.064376354217529e-05, 9.552761912345886e-05, 0.00010041147470474243, 0.000105295330286026, 0.00011017918586730957, 0.00011506304144859314, 0.00011994689702987671, 0.00012483075261116028, 0.00012971460819244385, 0.00013459846377372742, 0.00013948231935501099, 0.00014436617493629456, 0.00014925003051757812]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 20.0, 33.0, 61.0, 170.0, 346.0, 883.0, 2722.0, 20495.0, 964119.0, 53181.0, 4581.0, 1185.0, 391.0, 190.0, 84.0, 40.0, 23.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6416397094726562, -0.6231231689453125, -0.6046066284179688, -0.586090087890625, -0.5675735473632812, -0.5490570068359375, -0.5305404663085938, -0.51202392578125, -0.49350738525390625, -0.4749908447265625, -0.45647430419921875, -0.437957763671875, -0.41944122314453125, -0.4009246826171875, -0.38240814208984375, -0.3638916015625, -0.34537506103515625, -0.3268585205078125, -0.30834197998046875, -0.289825439453125, -0.27130889892578125, -0.2527923583984375, -0.23427581787109375, -0.21575927734375, -0.19724273681640625, -0.1787261962890625, -0.16020965576171875, -0.141693115234375, -0.12317657470703125, -0.1046600341796875, -0.08614349365234375, -0.067626953125, -0.04911041259765625, -0.0305938720703125, -0.01207733154296875, 0.006439208984375, 0.02495574951171875, 0.0434722900390625, 0.06198883056640625, 0.08050537109375, 0.09902191162109375, 0.1175384521484375, 0.13605499267578125, 0.154571533203125, 0.17308807373046875, 0.1916046142578125, 0.21012115478515625, 0.2286376953125, 0.24715423583984375, 0.2656707763671875, 0.28418731689453125, 0.302703857421875, 0.32122039794921875, 0.3397369384765625, 0.35825347900390625, 0.37677001953125, 0.39528656005859375, 0.4138031005859375, 0.43231964111328125, 0.450836181640625, 0.46935272216796875, 0.4878692626953125, 0.5063858032226562, 0.52490234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 9.0, 15.0, 20.0, 25.0, 28.0, 72.0, 79.0, 142.0, 196.0, 131.0, 83.0, 64.0, 30.0, 24.0, 15.0, 11.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.457763671875, -0.4452247619628906, -0.43268585205078125, -0.4201469421386719, -0.4076080322265625, -0.3950691223144531, -0.38253021240234375, -0.3699913024902344, -0.357452392578125, -0.3449134826660156, -0.33237457275390625, -0.3198356628417969, -0.3072967529296875, -0.2947578430175781, -0.28221893310546875, -0.2696800231933594, -0.25714111328125, -0.24460220336914062, -0.23206329345703125, -0.21952438354492188, -0.2069854736328125, -0.19444656372070312, -0.18190765380859375, -0.16936874389648438, -0.156829833984375, -0.14429092407226562, -0.13175201416015625, -0.11921310424804688, -0.1066741943359375, -0.09413528442382812, -0.08159637451171875, -0.06905746459960938, -0.0565185546875, -0.043979644775390625, -0.03144073486328125, -0.018901824951171875, -0.0063629150390625, 0.006175994873046875, 0.01871490478515625, 0.031253814697265625, 0.043792724609375, 0.056331634521484375, 0.06887054443359375, 0.08140945434570312, 0.0939483642578125, 0.10648727416992188, 0.11902618408203125, 0.13156509399414062, 0.14410400390625, 0.15664291381835938, 0.16918182373046875, 0.18172073364257812, 0.1942596435546875, 0.20679855346679688, 0.21933746337890625, 0.23187637329101562, 0.244415283203125, 0.2569541931152344, 0.26949310302734375, 0.2820320129394531, 0.2945709228515625, 0.3071098327636719, 0.31964874267578125, 0.3321876525878906, 0.3447265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 12.0, 41.0, 129.0, 677.0, 89.0, 34.0, 13.0, 7.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.802444458007812, -17.877893447875977, -16.953344345092773, -16.028793334960938, -15.104244232177734, -14.179693222045898, -13.255143165588379, -12.33059310913086, -11.40604305267334, -10.48149299621582, -9.5569429397583, -8.632392883300781, -7.7078423500061035, -6.783292293548584, -5.858741760253906, -4.934191703796387, -4.009641647338867, -3.0850915908813477, -2.160541296005249, -1.2359910011291504, -0.31144094467163086, 0.6131091117858887, 1.5376596450805664, 2.462209701538086, 3.3867597579956055, 4.311309814453125, 5.2358598709106445, 6.160410404205322, 7.084960460662842, 8.009510040283203, 8.934061050415039, 9.858611106872559, 10.783161163330078, 11.707711219787598, 12.632261276245117, 13.556812286376953, 14.481361389160156, 15.405912399291992, 16.330463409423828, 17.25501251220703, 18.179561614990234, 19.10411262512207, 20.028661727905273, 20.95321273803711, 21.877761840820312, 22.80231285095215, 23.726863861083984, 24.651412963867188, 25.575963973999023, 26.50051498413086, 27.425064086914062, 28.3496150970459, 29.2741641998291, 30.198715209960938, 31.12326431274414, 32.047813415527344, 32.97236633300781, 33.896915435791016, 34.821468353271484, 35.74601745605469, 36.67056655883789, 37.595115661621094, 38.51966857910156, 39.444217681884766, 40.36876678466797]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 7.0, 5.0, 3.0, 12.0, 7.0, 5.0, 10.0, 11.0, 13.0, 18.0, 27.0, 19.0, 27.0, 27.0, 48.0, 174.0, 215.0, 91.0, 38.0, 31.0, 28.0, 20.0, 25.0, 10.0, 21.0, 22.0, 15.0, 13.0, 8.0, 10.0, 5.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.967225074768066, -7.694420337677002, -7.421615123748779, -7.148810386657715, -6.876005172729492, -6.603200435638428, -6.330395698547363, -6.057590484619141, -5.784785747528076, -5.511981010437012, -5.239175796508789, -4.966371059417725, -4.69356632232666, -4.4207611083984375, -4.147956371307373, -3.8751513957977295, -3.602346420288086, -3.3295414447784424, -3.056736469268799, -2.7839317321777344, -2.511126756668091, -2.2383217811584473, -1.9655169248580933, -1.6927120685577393, -1.4199070930480957, -1.1471021175384521, -0.8742972612380981, -0.6014923453330994, -0.3286874294281006, -0.05588245391845703, 0.21692240238189697, 0.489727258682251, 0.7625331878662109, 1.0353381633758545, 1.3081430196762085, 1.5809478759765625, 1.853752851486206, 2.1265578269958496, 2.399362564086914, 2.6721675395965576, 2.944972515106201, 3.2177774906158447, 3.4905824661254883, 3.7633872032165527, 4.036191940307617, 4.30899715423584, 4.581801891326904, 4.854606628417969, 5.127411842346191, 5.400216579437256, 5.6730217933654785, 5.945826530456543, 6.218631744384766, 6.49143648147583, 6.7642412185668945, 7.037046432495117, 7.309851169586182, 7.582655906677246, 7.855461120605469, 8.128266334533691, 8.401070594787598, 8.67387580871582, 8.946681022644043, 9.21948528289795, 9.492290496826172]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 3.0, 6.0, 7.0, 10.0, 10.0, 16.0, 19.0, 22.0, 21.0, 24.0, 28.0, 45.0, 42.0, 53.0, 100.0, 188.0, 88.0, 46.0, 35.0, 35.0, 29.0, 36.0, 19.0, 18.0, 20.0, 9.0, 9.0, 4.0, 12.0, 8.0, 3.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5895233154296875, -0.570159912109375, -0.5507965087890625, -0.53143310546875, -0.5120697021484375, -0.492706298828125, -0.4733428955078125, -0.4539794921875, -0.4346160888671875, -0.415252685546875, -0.3958892822265625, -0.37652587890625, -0.3571624755859375, -0.337799072265625, -0.3184356689453125, -0.299072265625, -0.2797088623046875, -0.260345458984375, -0.2409820556640625, -0.22161865234375, -0.2022552490234375, -0.182891845703125, -0.1635284423828125, -0.1441650390625, -0.1248016357421875, -0.105438232421875, -0.0860748291015625, -0.06671142578125, -0.0473480224609375, -0.027984619140625, -0.0086212158203125, 0.0107421875, 0.0301055908203125, 0.049468994140625, 0.0688323974609375, 0.08819580078125, 0.1075592041015625, 0.126922607421875, 0.1462860107421875, 0.1656494140625, 0.1850128173828125, 0.204376220703125, 0.2237396240234375, 0.24310302734375, 0.2624664306640625, 0.281829833984375, 0.3011932373046875, 0.320556640625, 0.3399200439453125, 0.359283447265625, 0.3786468505859375, 0.39801025390625, 0.4173736572265625, 0.436737060546875, 0.4561004638671875, 0.4754638671875, 0.4948272705078125, 0.514190673828125, 0.5335540771484375, 0.55291748046875, 0.5722808837890625, 0.591644287109375, 0.6110076904296875, 0.63037109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 7.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 16.0, 21.0, 41.0, 42.0, 114.0, 156.0, 302.0, 717.0, 2537.0, 17329.0, 8352736.0, 11225.0, 2012.0, 651.0, 253.0, 127.0, 70.0, 50.0, 38.0, 16.0, 28.0, 20.0, 9.0, 6.0, 8.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.435363292694092, -5.229613304138184, -5.023863315582275, -4.818113327026367, -4.612362861633301, -4.406613349914551, -4.200862884521484, -3.995112895965576, -3.789362907409668, -3.5836129188537598, -3.3778629302978516, -3.1721127033233643, -2.966362714767456, -2.760612726211548, -2.5548624992370605, -2.3491125106811523, -2.143362522125244, -1.937612533569336, -1.7318624258041382, -1.5261123180389404, -1.3203623294830322, -1.114612340927124, -0.9088622331619263, -0.7031121253967285, -0.4973621368408203, -0.29161208868026733, -0.08586204051971436, 0.11988800764083862, 0.3256380558013916, 0.5313880443572998, 0.7371381521224976, 0.9428882598876953, 1.1486382484436035, 1.3543882369995117, 1.5601383447647095, 1.7658884525299072, 1.9716384410858154, 2.1773884296417236, 2.383138656616211, 2.588888645172119, 2.7946386337280273, 3.0003886222839355, 3.2061386108398438, 3.411888837814331, 3.6176388263702393, 3.8233888149261475, 4.029139041900635, 4.234889030456543, 4.440639019012451, 4.646389007568359, 4.852138996124268, 5.057888984680176, 5.263639450073242, 5.469388961791992, 5.675139427185059, 5.880889415740967, 6.086639404296875, 6.292389392852783, 6.498139381408691, 6.7038893699646, 6.909639358520508, 7.115389823913574, 7.321139812469482, 7.526889801025391, 7.732639789581299]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4959611892700195, -6.249114990234375, -6.0022687911987305, -5.755422592163086, -5.508576393127441, -5.261730194091797, -5.014883995056152, -4.768038272857666, -4.5211920738220215, -4.274345874786377, -4.027499675750732, -3.780653476715088, -3.5338075160980225, -3.286961317062378, -3.0401151180267334, -2.793269157409668, -2.5464227199554443, -2.2995765209198, -2.0527303218841553, -1.8058842420578003, -1.5590381622314453, -1.3121919631958008, -1.0653457641601562, -0.8184996843338013, -0.5716534852981567, -0.324807345867157, -0.07796117663383484, 0.1688849925994873, 0.41573113203048706, 0.6625772714614868, 0.9094234704971313, 1.1562695503234863, 1.4031157493591309, 1.6499619483947754, 1.8968080282211304, 2.1436543464660645, 2.39050030708313, 2.6373465061187744, 2.884192705154419, 3.1310386657714844, 3.377884864807129, 3.6247310638427734, 3.871577262878418, 4.1184234619140625, 4.365269660949707, 4.612115859985352, 4.858962059020996, 5.105807781219482, 5.352654457092285, 5.59950065612793, 5.846346855163574, 6.093193054199219, 6.340039253234863, 6.586885452270508, 6.833731651306152, 7.080577373504639, 7.327423572540283, 7.574269771575928, 7.821115970611572, 8.067961692810059, 8.314807891845703, 8.561654090881348, 8.808500289916992, 9.055346488952637, 9.302192687988281]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 1.0, 5.0, 8.0, 12.0, 16.0, 20.0, 25.0, 33.0, 45.0, 66.0, 80.0, 84.0, 114.0, 99.0, 95.0, 75.0, 59.0, 48.0, 25.0, 26.0, 17.0, 17.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5147476196289062, -0.4992218017578125, -0.48369598388671875, -0.468170166015625, -0.45264434814453125, -0.4371185302734375, -0.42159271240234375, -0.40606689453125, -0.39054107666015625, -0.3750152587890625, -0.35948944091796875, -0.343963623046875, -0.32843780517578125, -0.3129119873046875, -0.29738616943359375, -0.2818603515625, -0.26633453369140625, -0.2508087158203125, -0.23528289794921875, -0.219757080078125, -0.20423126220703125, -0.1887054443359375, -0.17317962646484375, -0.15765380859375, -0.14212799072265625, -0.1266021728515625, -0.11107635498046875, -0.095550537109375, -0.08002471923828125, -0.0644989013671875, -0.04897308349609375, -0.033447265625, -0.01792144775390625, -0.0023956298828125, 0.01313018798828125, 0.028656005859375, 0.04418182373046875, 0.0597076416015625, 0.07523345947265625, 0.09075927734375, 0.10628509521484375, 0.1218109130859375, 0.13733673095703125, 0.152862548828125, 0.16838836669921875, 0.1839141845703125, 0.19944000244140625, 0.2149658203125, 0.23049163818359375, 0.2460174560546875, 0.26154327392578125, 0.277069091796875, 0.29259490966796875, 0.3081207275390625, 0.32364654541015625, 0.33917236328125, 0.35469818115234375, 0.3702239990234375, 0.38574981689453125, 0.401275634765625, 0.41680145263671875, 0.4323272705078125, 0.44785308837890625, 0.46337890625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 13.0, 12.0, 12.0, 31.0, 40.0, 77.0, 231.0, 732.0, 4082.0, 59021.0, 417124.0, 38734.0, 3251.0, 600.0, 156.0, 57.0, 25.0, 16.0, 8.0, 17.0, 7.0, 7.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.35986328125, -7.9697265625, -7.57958984375, -7.189453125, -6.79931640625, -6.4091796875, -6.01904296875, -5.62890625, -5.23876953125, -4.8486328125, -4.45849609375, -4.068359375, -3.67822265625, -3.2880859375, -2.89794921875, -2.5078125, -2.11767578125, -1.7275390625, -1.33740234375, -0.947265625, -0.55712890625, -0.1669921875, 0.22314453125, 0.61328125, 1.00341796875, 1.3935546875, 1.78369140625, 2.173828125, 2.56396484375, 2.9541015625, 3.34423828125, 3.734375, 4.12451171875, 4.5146484375, 4.90478515625, 5.294921875, 5.68505859375, 6.0751953125, 6.46533203125, 6.85546875, 7.24560546875, 7.6357421875, 8.02587890625, 8.416015625, 8.80615234375, 9.1962890625, 9.58642578125, 9.9765625, 10.36669921875, 10.7568359375, 11.14697265625, 11.537109375, 11.92724609375, 12.3173828125, 12.70751953125, 13.09765625, 13.48779296875, 13.8779296875, 14.26806640625, 14.658203125, 15.04833984375, 15.4384765625, 15.82861328125, 16.21875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 10.0, 5.0, 13.0, 20.0, 14.0, 17.0, 35.0, 32.0, 48.0, 47.0, 65.0, 52.0, 80.0, 95.0, 63.0, 65.0, 60.0, 43.0, 54.0, 34.0, 27.0, 22.0, 21.0, 13.0, 11.0, 13.0, 4.0, 9.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6615676879882812, -0.6366119384765625, -0.6116561889648438, -0.586700439453125, -0.5617446899414062, -0.5367889404296875, -0.5118331909179688, -0.48687744140625, -0.46192169189453125, -0.4369659423828125, -0.41201019287109375, -0.387054443359375, -0.36209869384765625, -0.3371429443359375, -0.31218719482421875, -0.2872314453125, -0.26227569580078125, -0.2373199462890625, -0.21236419677734375, -0.187408447265625, -0.16245269775390625, -0.1374969482421875, -0.11254119873046875, -0.08758544921875, -0.06262969970703125, -0.0376739501953125, -0.01271820068359375, 0.012237548828125, 0.03719329833984375, 0.0621490478515625, 0.08710479736328125, 0.112060546875, 0.13701629638671875, 0.1619720458984375, 0.18692779541015625, 0.211883544921875, 0.23683929443359375, 0.2617950439453125, 0.28675079345703125, 0.31170654296875, 0.33666229248046875, 0.3616180419921875, 0.38657379150390625, 0.411529541015625, 0.43648529052734375, 0.4614410400390625, 0.48639678955078125, 0.5113525390625, 0.5363082885742188, 0.5612640380859375, 0.5862197875976562, 0.611175537109375, 0.6361312866210938, 0.6610870361328125, 0.6860427856445312, 0.71099853515625, 0.7359542846679688, 0.7609100341796875, 0.7858657836914062, 0.810821533203125, 0.8357772827148438, 0.8607330322265625, 0.8856887817382812, 0.91064453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 6.0, 11.0, 14.0, 24.0, 33.0, 53.0, 61.0, 78.0, 72.0, 50.0, 24.0, 16.0, 13.0, 5.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.444786071777344, -5.267969608306885, -5.091153621673584, -4.914337158203125, -4.737520694732666, -4.560704231262207, -4.383888244628906, -4.207071781158447, -4.030255317687988, -3.8534390926361084, -3.6766226291656494, -3.4998064041137695, -3.3229899406433105, -3.1461737155914307, -2.969357490539551, -2.792541027069092, -2.615725040435791, -2.438908815383911, -2.262092351913452, -2.0852761268615723, -1.9084597826004028, -1.7316434383392334, -1.5548272132873535, -1.378010869026184, -1.2011945247650146, -1.0243781805038452, -0.8475618958473206, -0.6707456111907959, -0.49392926692962646, -0.31711292266845703, -0.14029669761657715, 0.036519646644592285, 0.21333599090576172, 0.39015230536460876, 0.5669686198234558, 0.7437849044799805, 0.9206012487411499, 1.0974175930023193, 1.2742338180541992, 1.4510501623153687, 1.627866506576538, 1.8046828508377075, 1.981499195098877, 2.158315420150757, 2.3351316452026367, 2.5119481086730957, 2.6887643337249756, 2.8655805587768555, 3.0423970222473145, 3.2192132472991943, 3.3960297107696533, 3.572845935821533, 3.749662399291992, 3.926478624343872, 4.103294849395752, 4.280111312866211, 4.456927299499512, 4.633743762969971, 4.8105597496032715, 4.9873762130737305, 5.1641926765441895, 5.341009140014648, 5.517825126647949, 5.694641590118408, 5.871458053588867]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 9.0, 9.0, 10.0, 7.0, 17.0, 33.0, 40.0, 69.0, 56.0, 51.0, 57.0, 31.0, 18.0, 13.0, 12.0, 9.0, 5.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.513657569885254, -4.382663726806641, -4.251669406890869, -4.120675086975098, -3.9896812438964844, -3.858687162399292, -3.7276930809020996, -3.5966989994049072, -3.465704917907715, -3.3347108364105225, -3.20371675491333, -3.0727226734161377, -2.9417285919189453, -2.810734510421753, -2.6797404289245605, -2.548746347427368, -2.417752265930176, -2.2867581844329834, -2.155764102935791, -2.0247700214385986, -1.8937759399414062, -1.7627818584442139, -1.6317877769470215, -1.500793695449829, -1.3697996139526367, -1.2388055324554443, -1.107811450958252, -0.9768173694610596, -0.8458232879638672, -0.7148292064666748, -0.5838351249694824, -0.45284104347229004, -0.32184696197509766, -0.19085288047790527, -0.05985879898071289, 0.07113528251647949, 0.20212936401367188, 0.33312344551086426, 0.46411752700805664, 0.595111608505249, 0.7261056900024414, 0.8570997714996338, 0.9880938529968262, 1.1190879344940186, 1.250082015991211, 1.3810760974884033, 1.5120701789855957, 1.643064260482788, 1.7740583419799805, 1.9050524234771729, 2.0360465049743652, 2.1670405864715576, 2.29803466796875, 2.4290287494659424, 2.5600228309631348, 2.691016912460327, 2.8220109939575195, 2.953005075454712, 3.0839991569519043, 3.2149932384490967, 3.345987319946289, 3.4769814014434814, 3.607975482940674, 3.738969564437866, 3.8699636459350586]}, "eval/loss": 4.492813587188721, "eval/wer": 1.8771717572391908, "eval/runtime": 899.5193, "eval/samples_per_second": 2.937, "eval/steps_per_second": 0.368} \ No newline at end of file +{"train/loss": 0.5145, "train/learning_rate": 7.6270783847981e-05, "train/epoch": 5.61, "train/global_step": 5000, "_runtime": 31656, "_timestamp": 1647625533, "_step": 5001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 12.0, 13.0, 34.0, 81.0, 154.0, 297.0, 204.0, 101.0, 50.0, 29.0, 9.0, 6.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.6256103515625, -130.96363830566406, -127.30166625976562, -123.63969421386719, -119.97772216796875, -116.31575012207031, -112.65377807617188, -108.99180603027344, -105.329833984375, -101.66786193847656, -98.00588989257812, -94.34391784667969, -90.68194580078125, -87.01997375488281, -83.35800170898438, -79.69602966308594, -76.0340576171875, -72.37208557128906, -68.71011352539062, -65.04814147949219, -61.38616943359375, -57.72419738769531, -54.062225341796875, -50.40025329589844, -46.73828887939453, -43.076316833496094, -39.414344787597656, -35.75237274169922, -32.09040069580078, -28.428430557250977, -24.76645851135254, -21.1044864654541, -17.44251251220703, -13.780540466308594, -10.118568420410156, -6.456597328186035, -2.7946252822875977, 0.8673458099365234, 4.529317855834961, 8.191289901733398, 11.853261947631836, 15.515233993530273, 19.17720603942871, 22.839176177978516, 26.501148223876953, 30.16312026977539, 33.82509231567383, 37.487064361572266, 41.1490364074707, 44.81100845336914, 48.47298049926758, 52.134952545166016, 55.79692459106445, 59.458892822265625, 63.12086486816406, 66.7828369140625, 70.44480895996094, 74.10678100585938, 77.76875305175781, 81.43072509765625, 85.09269714355469, 88.75466918945312, 92.41664123535156, 96.07861328125, 99.74058532714844]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 9.0, 5.0, 12.0, 17.0, 16.0, 13.0, 28.0, 32.0, 31.0, 46.0, 40.0, 37.0, 42.0, 61.0, 44.0, 63.0, 88.0, 54.0, 42.0, 38.0, 39.0, 34.0, 41.0, 29.0, 24.0, 23.0, 16.0, 17.0, 8.0, 8.0, 7.0, 9.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.67343139648438, -130.7504425048828, -126.82745361328125, -122.90446472167969, -118.98147583007812, -115.05848693847656, -111.135498046875, -107.21250915527344, -103.28952026367188, -99.36653137207031, -95.44354248046875, -91.52055358886719, -87.59756469726562, -83.67457580566406, -79.7515869140625, -75.82859802246094, -71.9056167602539, -67.98262786865234, -64.05963897705078, -60.13665008544922, -56.213661193847656, -52.290672302246094, -48.3676872253418, -44.444698333740234, -40.52170944213867, -36.59872055053711, -32.67573165893555, -28.752744674682617, -24.829755783081055, -20.906766891479492, -16.983779907226562, -13.060791015625, -9.137809753417969, -5.2148213386535645, -1.2918329238891602, 2.631155014038086, 6.554143905639648, 10.477132797241211, 14.40011978149414, 18.323108673095703, 22.246097564697266, 26.169086456298828, 30.09207534790039, 34.01506042480469, 37.93804931640625, 41.86103820800781, 45.784027099609375, 49.70701599121094, 53.6300048828125, 57.55299377441406, 61.475982666015625, 65.39897155761719, 69.32196044921875, 73.24494934082031, 77.16793823242188, 81.09092712402344, 85.013916015625, 88.93690490722656, 92.85989379882812, 96.78288269042969, 100.70587158203125, 104.62886047363281, 108.55184936523438, 112.47483825683594, 116.39781951904297]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 11.0, 5.0, 9.0, 11.0, 14.0, 7.0, 20.0, 18.0, 34.0, 33.0, 36.0, 42.0, 29.0, 52.0, 54.0, 70.0, 51.0, 68.0, 63.0, 47.0, 58.0, 42.0, 37.0, 25.0, 29.0, 26.0, 18.0, 22.0, 14.0, 13.0, 10.0, 2.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.529296875, -3.425628662109375, -3.32196044921875, -3.218292236328125, -3.1146240234375, -3.010955810546875, -2.90728759765625, -2.803619384765625, -2.699951171875, -2.596282958984375, -2.49261474609375, -2.388946533203125, -2.2852783203125, -2.181610107421875, -2.07794189453125, -1.974273681640625, -1.87060546875, -1.766937255859375, -1.66326904296875, -1.559600830078125, -1.4559326171875, -1.352264404296875, -1.24859619140625, -1.144927978515625, -1.041259765625, -0.937591552734375, -0.83392333984375, -0.730255126953125, -0.6265869140625, -0.522918701171875, -0.41925048828125, -0.315582275390625, -0.2119140625, -0.108245849609375, -0.00457763671875, 0.099090576171875, 0.2027587890625, 0.306427001953125, 0.41009521484375, 0.513763427734375, 0.617431640625, 0.721099853515625, 0.82476806640625, 0.928436279296875, 1.0321044921875, 1.135772705078125, 1.23944091796875, 1.343109130859375, 1.44677734375, 1.550445556640625, 1.65411376953125, 1.757781982421875, 1.8614501953125, 1.965118408203125, 2.06878662109375, 2.172454833984375, 2.276123046875, 2.379791259765625, 2.48345947265625, 2.587127685546875, 2.6907958984375, 2.794464111328125, 2.89813232421875, 3.001800537109375, 3.10546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 8.0, 4.0, 9.0, 8.0, 18.0, 18.0, 23.0, 23.0, 34.0, 49.0, 89.0, 110.0, 179.0, 246.0, 370.0, 528.0, 841.0, 1371.0, 2516.0, 4512.0, 9200.0, 21314.0, 62283.0, 1164393.0, 2802842.0, 75340.0, 24402.0, 10775.0, 5321.0, 2896.0, 1649.0, 974.0, 631.0, 401.0, 260.0, 205.0, 112.0, 88.0, 69.0, 46.0, 40.0, 18.0, 27.0, 12.0, 12.0, 5.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.40625, -24.68212890625, -23.9580078125, -23.23388671875, -22.509765625, -21.78564453125, -21.0615234375, -20.33740234375, -19.61328125, -18.88916015625, -18.1650390625, -17.44091796875, -16.716796875, -15.99267578125, -15.2685546875, -14.54443359375, -13.8203125, -13.09619140625, -12.3720703125, -11.64794921875, -10.923828125, -10.19970703125, -9.4755859375, -8.75146484375, -8.02734375, -7.30322265625, -6.5791015625, -5.85498046875, -5.130859375, -4.40673828125, -3.6826171875, -2.95849609375, -2.234375, -1.51025390625, -0.7861328125, -0.06201171875, 0.662109375, 1.38623046875, 2.1103515625, 2.83447265625, 3.55859375, 4.28271484375, 5.0068359375, 5.73095703125, 6.455078125, 7.17919921875, 7.9033203125, 8.62744140625, 9.3515625, 10.07568359375, 10.7998046875, 11.52392578125, 12.248046875, 12.97216796875, 13.6962890625, 14.42041015625, 15.14453125, 15.86865234375, 16.5927734375, 17.31689453125, 18.041015625, 18.76513671875, 19.4892578125, 20.21337890625, 20.9375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 12.0, 18.0, 18.0, 27.0, 17.0, 31.0, 35.0, 40.0, 57.0, 103.0, 149.0, 209.0, 400.0, 693.0, 834.0, 520.0, 279.0, 149.0, 115.0, 72.0, 61.0, 34.0, 38.0, 29.0, 20.0, 23.0, 16.0, 15.0, 8.0, 7.0, 11.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.25, -13.8336181640625, -13.417236328125, -13.0008544921875, -12.58447265625, -12.1680908203125, -11.751708984375, -11.3353271484375, -10.9189453125, -10.5025634765625, -10.086181640625, -9.6697998046875, -9.25341796875, -8.8370361328125, -8.420654296875, -8.0042724609375, -7.587890625, -7.1715087890625, -6.755126953125, -6.3387451171875, -5.92236328125, -5.5059814453125, -5.089599609375, -4.6732177734375, -4.2568359375, -3.8404541015625, -3.424072265625, -3.0076904296875, -2.59130859375, -2.1749267578125, -1.758544921875, -1.3421630859375, -0.92578125, -0.5093994140625, -0.093017578125, 0.3233642578125, 0.73974609375, 1.1561279296875, 1.572509765625, 1.9888916015625, 2.4052734375, 2.8216552734375, 3.238037109375, 3.6544189453125, 4.07080078125, 4.4871826171875, 4.903564453125, 5.3199462890625, 5.736328125, 6.1527099609375, 6.569091796875, 6.9854736328125, 7.40185546875, 7.8182373046875, 8.234619140625, 8.6510009765625, 9.0673828125, 9.4837646484375, 9.900146484375, 10.3165283203125, 10.73291015625, 11.1492919921875, 11.565673828125, 11.9820556640625, 12.3984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 9.0, 5.0, 6.0, 14.0, 13.0, 23.0, 29.0, 40.0, 60.0, 63.0, 98.0, 144.0, 207.0, 370.0, 764.0, 2016.0, 6092.0, 24410.0, 165253.0, 3648778.0, 299772.0, 33649.0, 7830.0, 2491.0, 926.0, 425.0, 244.0, 147.0, 114.0, 76.0, 51.0, 51.0, 26.0, 21.0, 15.0, 10.0, 10.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.65625, -44.29736328125, -42.9384765625, -41.57958984375, -40.220703125, -38.86181640625, -37.5029296875, -36.14404296875, -34.78515625, -33.42626953125, -32.0673828125, -30.70849609375, -29.349609375, -27.99072265625, -26.6318359375, -25.27294921875, -23.9140625, -22.55517578125, -21.1962890625, -19.83740234375, -18.478515625, -17.11962890625, -15.7607421875, -14.40185546875, -13.04296875, -11.68408203125, -10.3251953125, -8.96630859375, -7.607421875, -6.24853515625, -4.8896484375, -3.53076171875, -2.171875, -0.81298828125, 0.5458984375, 1.90478515625, 3.263671875, 4.62255859375, 5.9814453125, 7.34033203125, 8.69921875, 10.05810546875, 11.4169921875, 12.77587890625, 14.134765625, 15.49365234375, 16.8525390625, 18.21142578125, 19.5703125, 20.92919921875, 22.2880859375, 23.64697265625, 25.005859375, 26.36474609375, 27.7236328125, 29.08251953125, 30.44140625, 31.80029296875, 33.1591796875, 34.51806640625, 35.876953125, 37.23583984375, 38.5947265625, 39.95361328125, 41.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 11.0, 24.0, 41.0, 95.0, 226.0, 310.0, 174.0, 62.0, 37.0, 18.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.96576499938965, -25.505510330200195, -22.045255661010742, -18.584999084472656, -15.12474536895752, -11.66448974609375, -8.204235076904297, -4.743980407714844, -1.2837257385253906, 2.1765291690826416, 5.636784076690674, 9.097039222717285, 12.557293891906738, 16.017549514770508, 19.47780418395996, 22.938058853149414, 26.398313522338867, 29.85856819152832, 33.318824768066406, 36.77907943725586, 40.23933410644531, 43.699588775634766, 47.15984344482422, 50.62009811401367, 54.080352783203125, 57.54060745239258, 61.00086212158203, 64.46112060546875, 67.92137145996094, 71.38162994384766, 74.84188079833984, 78.30213928222656, 81.76239776611328, 85.22265625, 88.68290710449219, 92.1431655883789, 95.6034164428711, 99.06367492675781, 102.52392578125, 105.98418426513672, 109.4444351196289, 112.90469360351562, 116.36494445800781, 119.82520294189453, 123.28545379638672, 126.74571228027344, 130.20596313476562, 133.6662139892578, 137.12648010253906, 140.58673095703125, 144.0469970703125, 147.5072479248047, 150.96749877929688, 154.42774963378906, 157.8880157470703, 161.3482666015625, 164.8085174560547, 168.26876831054688, 171.72903442382812, 175.1892852783203, 178.6495361328125, 182.1097869873047, 185.57005310058594, 189.03030395507812, 192.4905548095703]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 10.0, 12.0, 17.0, 15.0, 16.0, 18.0, 23.0, 18.0, 26.0, 33.0, 29.0, 35.0, 38.0, 40.0, 35.0, 47.0, 34.0, 48.0, 36.0, 40.0, 48.0, 33.0, 42.0, 21.0, 28.0, 43.0, 28.0, 31.0, 27.0, 18.0, 13.0, 11.0, 15.0, 14.0, 7.0, 7.0, 7.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-43.81364059448242, -42.432498931884766, -41.051353454589844, -39.67021179199219, -38.28907012939453, -36.907928466796875, -35.52678298950195, -34.1456413269043, -32.764495849609375, -31.383352279663086, -30.00221061706543, -28.62106704711914, -27.239925384521484, -25.858781814575195, -24.477638244628906, -23.09649658203125, -21.715354919433594, -20.334211349487305, -18.95306968688965, -17.57192611694336, -16.190784454345703, -14.809640884399414, -13.428497314453125, -12.047354698181152, -10.66621208190918, -9.285069465637207, -7.903926372528076, -6.522783279418945, -5.141640663146973, -3.760498046875, -2.379354476928711, -0.9982118606567383, 0.3829307556152344, 1.7640736103057861, 3.145216464996338, 4.526359558105469, 5.907502174377441, 7.288644790649414, 8.669788360595703, 10.050930976867676, 11.432073593139648, 12.813216209411621, 14.194358825683594, 15.575502395629883, 16.956645965576172, 18.337787628173828, 19.718931198120117, 21.100074768066406, 22.481216430664062, 23.86236000061035, 25.243501663208008, 26.624645233154297, 28.005786895751953, 29.386930465698242, 30.76807403564453, 32.14921569824219, 33.530357360839844, 34.9114990234375, 36.29264450073242, 37.67378616333008, 39.054927825927734, 40.436073303222656, 41.81721496582031, 43.19835662841797, 44.57950210571289]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 7.0, 7.0, 9.0, 13.0, 7.0, 19.0, 24.0, 21.0, 31.0, 30.0, 45.0, 36.0, 33.0, 60.0, 69.0, 53.0, 60.0, 71.0, 55.0, 44.0, 54.0, 57.0, 28.0, 20.0, 21.0, 25.0, 19.0, 22.0, 9.0, 9.0, 10.0, 5.0, 6.0, 8.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.709442138671875, -3.59857177734375, -3.487701416015625, -3.3768310546875, -3.265960693359375, -3.15509033203125, -3.044219970703125, -2.933349609375, -2.822479248046875, -2.71160888671875, -2.600738525390625, -2.4898681640625, -2.378997802734375, -2.26812744140625, -2.157257080078125, -2.04638671875, -1.935516357421875, -1.82464599609375, -1.713775634765625, -1.6029052734375, -1.492034912109375, -1.38116455078125, -1.270294189453125, -1.159423828125, -1.048553466796875, -0.93768310546875, -0.826812744140625, -0.7159423828125, -0.605072021484375, -0.49420166015625, -0.383331298828125, -0.2724609375, -0.161590576171875, -0.05072021484375, 0.060150146484375, 0.1710205078125, 0.281890869140625, 0.39276123046875, 0.503631591796875, 0.614501953125, 0.725372314453125, 0.83624267578125, 0.947113037109375, 1.0579833984375, 1.168853759765625, 1.27972412109375, 1.390594482421875, 1.50146484375, 1.612335205078125, 1.72320556640625, 1.834075927734375, 1.9449462890625, 2.055816650390625, 2.16668701171875, 2.277557373046875, 2.388427734375, 2.499298095703125, 2.61016845703125, 2.721038818359375, 2.8319091796875, 2.942779541015625, 3.05364990234375, 3.164520263671875, 3.275390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 16.0, 19.0, 25.0, 53.0, 91.0, 131.0, 259.0, 357.0, 655.0, 965.0, 1704.0, 2910.0, 4806.0, 8137.0, 14190.0, 25990.0, 51845.0, 121291.0, 319349.0, 285994.0, 106975.0, 46857.0, 23892.0, 13246.0, 7554.0, 4501.0, 2704.0, 1512.0, 961.0, 641.0, 355.0, 221.0, 140.0, 94.0, 40.0, 22.0, 18.0, 12.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.880340576171875, -2.78411865234375, -2.687896728515625, -2.5916748046875, -2.495452880859375, -2.39923095703125, -2.303009033203125, -2.206787109375, -2.110565185546875, -2.01434326171875, -1.918121337890625, -1.8218994140625, -1.725677490234375, -1.62945556640625, -1.533233642578125, -1.43701171875, -1.340789794921875, -1.24456787109375, -1.148345947265625, -1.0521240234375, -0.955902099609375, -0.85968017578125, -0.763458251953125, -0.667236328125, -0.571014404296875, -0.47479248046875, -0.378570556640625, -0.2823486328125, -0.186126708984375, -0.08990478515625, 0.006317138671875, 0.1025390625, 0.198760986328125, 0.29498291015625, 0.391204833984375, 0.4874267578125, 0.583648681640625, 0.67987060546875, 0.776092529296875, 0.872314453125, 0.968536376953125, 1.06475830078125, 1.160980224609375, 1.2572021484375, 1.353424072265625, 1.44964599609375, 1.545867919921875, 1.64208984375, 1.738311767578125, 1.83453369140625, 1.930755615234375, 2.0269775390625, 2.123199462890625, 2.21942138671875, 2.315643310546875, 2.411865234375, 2.508087158203125, 2.60430908203125, 2.700531005859375, 2.7967529296875, 2.892974853515625, 2.98919677734375, 3.085418701171875, 3.181640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 10.0, 8.0, 10.0, 14.0, 11.0, 17.0, 21.0, 17.0, 24.0, 26.0, 25.0, 31.0, 39.0, 32.0, 26.0, 40.0, 37.0, 46.0, 1065.0, 42.0, 39.0, 40.0, 39.0, 33.0, 34.0, 40.0, 28.0, 22.0, 31.0, 28.0, 26.0, 17.0, 14.0, 12.0, 15.0, 12.0, 13.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.55078125, -3.448822021484375, -3.34686279296875, -3.244903564453125, -3.1429443359375, -3.040985107421875, -2.93902587890625, -2.837066650390625, -2.735107421875, -2.633148193359375, -2.53118896484375, -2.429229736328125, -2.3272705078125, -2.225311279296875, -2.12335205078125, -2.021392822265625, -1.91943359375, -1.817474365234375, -1.71551513671875, -1.613555908203125, -1.5115966796875, -1.409637451171875, -1.30767822265625, -1.205718994140625, -1.103759765625, -1.001800537109375, -0.89984130859375, -0.797882080078125, -0.6959228515625, -0.593963623046875, -0.49200439453125, -0.390045166015625, -0.2880859375, -0.186126708984375, -0.08416748046875, 0.017791748046875, 0.1197509765625, 0.221710205078125, 0.32366943359375, 0.425628662109375, 0.527587890625, 0.629547119140625, 0.73150634765625, 0.833465576171875, 0.9354248046875, 1.037384033203125, 1.13934326171875, 1.241302490234375, 1.34326171875, 1.445220947265625, 1.54718017578125, 1.649139404296875, 1.7510986328125, 1.853057861328125, 1.95501708984375, 2.056976318359375, 2.158935546875, 2.260894775390625, 2.36285400390625, 2.464813232421875, 2.5667724609375, 2.668731689453125, 2.77069091796875, 2.872650146484375, 2.974609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 8.0, 5.0, 11.0, 15.0, 16.0, 23.0, 38.0, 54.0, 66.0, 110.0, 148.0, 215.0, 289.0, 384.0, 690.0, 1031.0, 1695.0, 3008.0, 5950.0, 13588.0, 37723.0, 152734.0, 1286331.0, 465231.0, 82841.0, 24399.0, 9757.0, 4465.0, 2402.0, 1344.0, 792.0, 558.0, 357.0, 265.0, 179.0, 103.0, 84.0, 55.0, 57.0, 28.0, 30.0, 17.0, 16.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.771484375, -2.689483642578125, -2.60748291015625, -2.525482177734375, -2.4434814453125, -2.361480712890625, -2.27947998046875, -2.197479248046875, -2.115478515625, -2.033477783203125, -1.95147705078125, -1.869476318359375, -1.7874755859375, -1.705474853515625, -1.62347412109375, -1.541473388671875, -1.45947265625, -1.377471923828125, -1.29547119140625, -1.213470458984375, -1.1314697265625, -1.049468994140625, -0.96746826171875, -0.885467529296875, -0.803466796875, -0.721466064453125, -0.63946533203125, -0.557464599609375, -0.4754638671875, -0.393463134765625, -0.31146240234375, -0.229461669921875, -0.1474609375, -0.065460205078125, 0.01654052734375, 0.098541259765625, 0.1805419921875, 0.262542724609375, 0.34454345703125, 0.426544189453125, 0.508544921875, 0.590545654296875, 0.67254638671875, 0.754547119140625, 0.8365478515625, 0.918548583984375, 1.00054931640625, 1.082550048828125, 1.16455078125, 1.246551513671875, 1.32855224609375, 1.410552978515625, 1.4925537109375, 1.574554443359375, 1.65655517578125, 1.738555908203125, 1.820556640625, 1.902557373046875, 1.98455810546875, 2.066558837890625, 2.1485595703125, 2.230560302734375, 2.31256103515625, 2.394561767578125, 2.4765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 14.0, 11.0, 5.0, 25.0, 54.0, 73.0, 314.0, 300.0, 75.0, 44.0, 23.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.24542236328125, -2.1705322265625, -2.09564208984375, -2.020751953125, -1.94586181640625, -1.8709716796875, -1.79608154296875, -1.72119140625, -1.64630126953125, -1.5714111328125, -1.49652099609375, -1.421630859375, -1.34674072265625, -1.2718505859375, -1.19696044921875, -1.1220703125, -1.04718017578125, -0.9722900390625, -0.89739990234375, -0.822509765625, -0.74761962890625, -0.6727294921875, -0.59783935546875, -0.52294921875, -0.44805908203125, -0.3731689453125, -0.29827880859375, -0.223388671875, -0.14849853515625, -0.0736083984375, 0.00128173828125, 0.076171875, 0.15106201171875, 0.2259521484375, 0.30084228515625, 0.375732421875, 0.45062255859375, 0.5255126953125, 0.60040283203125, 0.67529296875, 0.75018310546875, 0.8250732421875, 0.89996337890625, 0.974853515625, 1.04974365234375, 1.1246337890625, 1.19952392578125, 1.2744140625, 1.34930419921875, 1.4241943359375, 1.49908447265625, 1.573974609375, 1.64886474609375, 1.7237548828125, 1.79864501953125, 1.87353515625, 1.94842529296875, 2.0233154296875, 2.09820556640625, 2.173095703125, 2.24798583984375, 2.3228759765625, 2.39776611328125, 2.47265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 6.0, 9.0, 10.0, 17.0, 18.0, 39.0, 44.0, 62.0, 198.0, 2453.0, 1019026.0, 25621.0, 675.0, 116.0, 49.0, 38.0, 31.0, 15.0, 16.0, 11.0, 9.0, 7.0, 7.0, 6.0, 6.0, 5.0, 0.0, 7.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.1875, -41.78515625, -40.3828125, -38.98046875, -37.578125, -36.17578125, -34.7734375, -33.37109375, -31.96875, -30.56640625, -29.1640625, -27.76171875, -26.359375, -24.95703125, -23.5546875, -22.15234375, -20.75, -19.34765625, -17.9453125, -16.54296875, -15.140625, -13.73828125, -12.3359375, -10.93359375, -9.53125, -8.12890625, -6.7265625, -5.32421875, -3.921875, -2.51953125, -1.1171875, 0.28515625, 1.6875, 3.08984375, 4.4921875, 5.89453125, 7.296875, 8.69921875, 10.1015625, 11.50390625, 12.90625, 14.30859375, 15.7109375, 17.11328125, 18.515625, 19.91796875, 21.3203125, 22.72265625, 24.125, 25.52734375, 26.9296875, 28.33203125, 29.734375, 31.13671875, 32.5390625, 33.94140625, 35.34375, 36.74609375, 38.1484375, 39.55078125, 40.953125, 42.35546875, 43.7578125, 45.16015625, 46.5625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 29.0, 79.0, 305.0, 434.0, 114.0, 23.0, 11.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.780243873596191, -11.50096607208252, -11.221687316894531, -10.94240951538086, -10.663131713867188, -10.3838529586792, -10.104575157165527, -9.825297355651855, -9.546018600463867, -9.266740798950195, -8.987462043762207, -8.708184242248535, -8.428906440734863, -8.149627685546875, -7.870349884033203, -7.591071605682373, -7.311793804168701, -7.032515525817871, -6.753237724304199, -6.473959445953369, -6.194681167602539, -5.915403366088867, -5.636125087738037, -5.356846809387207, -5.077569007873535, -4.798290729522705, -4.519012928009033, -4.239734649658203, -3.960456371307373, -3.681178331375122, -3.401900291442871, -3.122622013092041, -2.8433432579040527, -2.5640652179718018, -2.2847869396209717, -2.0055088996887207, -1.7262307405471802, -1.4469525814056396, -1.1676745414733887, -0.8883963823318481, -0.6091182231903076, -0.3298400938510895, -0.05056196451187134, 0.22871613502502441, 0.5079942941665649, 0.7872724533081055, 1.0665504932403564, 1.345828652381897, 1.6251068115234375, 1.904384970664978, 2.1836631298065186, 2.4629411697387695, 2.7422194480895996, 3.0214974880218506, 3.3007755279541016, 3.5800538063049316, 3.8593318462371826, 4.138609886169434, 4.417888164520264, 4.697166442871094, 4.976444244384766, 5.255722522735596, 5.535000801086426, 5.814278602600098, 6.093556880950928]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 7.0, 13.0, 13.0, 14.0, 23.0, 22.0, 24.0, 22.0, 24.0, 32.0, 32.0, 31.0, 35.0, 48.0, 36.0, 38.0, 39.0, 40.0, 44.0, 45.0, 45.0, 30.0, 34.0, 28.0, 29.0, 29.0, 16.0, 29.0, 20.0, 17.0, 24.0, 23.0, 16.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7098567485809326, -1.6552585363388062, -1.6006604433059692, -1.5460622310638428, -1.4914641380310059, -1.4368659257888794, -1.382267713546753, -1.327669620513916, -1.2730714082717896, -1.218473196029663, -1.1638751029968262, -1.1092768907546997, -1.0546786785125732, -1.0000805854797363, -0.9454823732376099, -0.8908842206001282, -0.8362860679626465, -0.7816879153251648, -0.7270897626876831, -0.6724915504455566, -0.617893397808075, -0.5632952451705933, -0.5086970329284668, -0.4540988802909851, -0.3995007276535034, -0.34490257501602173, -0.29030439257621765, -0.23570622503757477, -0.18110805749893188, -0.1265099048614502, -0.07191172242164612, -0.01731353998184204, 0.03728461265563965, 0.09188278019428253, 0.14648094773292542, 0.2010791152715683, 0.2556772828102112, 0.31027543544769287, 0.36487361788749695, 0.419471800327301, 0.4740699529647827, 0.5286681056022644, 0.5832662582397461, 0.6378644704818726, 0.6924626231193542, 0.7470607757568359, 0.8016589879989624, 0.8562571406364441, 0.9108552932739258, 0.9654534459114075, 1.0200515985488892, 1.0746498107910156, 1.1292479038238525, 1.183846116065979, 1.2384443283081055, 1.2930424213409424, 1.3476406335830688, 1.4022388458251953, 1.4568369388580322, 1.5114351511001587, 1.5660333633422852, 1.620631456375122, 1.6752296686172485, 1.729827880859375, 1.784425973892212]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 2.0, 6.0, 5.0, 8.0, 12.0, 13.0, 14.0, 27.0, 33.0, 35.0, 26.0, 45.0, 35.0, 42.0, 52.0, 60.0, 70.0, 68.0, 57.0, 56.0, 54.0, 50.0, 45.0, 34.0, 33.0, 16.0, 21.0, 13.0, 14.0, 9.0, 9.0, 9.0, 6.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.928314208984375, -3.81365966796875, -3.699005126953125, -3.5843505859375, -3.469696044921875, -3.35504150390625, -3.240386962890625, -3.125732421875, -3.011077880859375, -2.89642333984375, -2.781768798828125, -2.6671142578125, -2.552459716796875, -2.43780517578125, -2.323150634765625, -2.20849609375, -2.093841552734375, -1.97918701171875, -1.864532470703125, -1.7498779296875, -1.635223388671875, -1.52056884765625, -1.405914306640625, -1.291259765625, -1.176605224609375, -1.06195068359375, -0.947296142578125, -0.8326416015625, -0.717987060546875, -0.60333251953125, -0.488677978515625, -0.3740234375, -0.259368896484375, -0.14471435546875, -0.030059814453125, 0.0845947265625, 0.199249267578125, 0.31390380859375, 0.428558349609375, 0.543212890625, 0.657867431640625, 0.77252197265625, 0.887176513671875, 1.0018310546875, 1.116485595703125, 1.23114013671875, 1.345794677734375, 1.46044921875, 1.575103759765625, 1.68975830078125, 1.804412841796875, 1.9190673828125, 2.033721923828125, 2.14837646484375, 2.263031005859375, 2.377685546875, 2.492340087890625, 2.60699462890625, 2.721649169921875, 2.8363037109375, 2.950958251953125, 3.06561279296875, 3.180267333984375, 3.294921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 12.0, 21.0, 28.0, 59.0, 83.0, 107.0, 197.0, 303.0, 456.0, 855.0, 1447.0, 2656.0, 5005.0, 10472.0, 24490.0, 70895.0, 308092.0, 459744.0, 104409.0, 32387.0, 13369.0, 6201.0, 3145.0, 1691.0, 974.0, 585.0, 296.0, 186.0, 122.0, 91.0, 56.0, 25.0, 34.0, 13.0, 13.0, 6.0, 9.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7890625, -13.38525390625, -12.9814453125, -12.57763671875, -12.173828125, -11.77001953125, -11.3662109375, -10.96240234375, -10.55859375, -10.15478515625, -9.7509765625, -9.34716796875, -8.943359375, -8.53955078125, -8.1357421875, -7.73193359375, -7.328125, -6.92431640625, -6.5205078125, -6.11669921875, -5.712890625, -5.30908203125, -4.9052734375, -4.50146484375, -4.09765625, -3.69384765625, -3.2900390625, -2.88623046875, -2.482421875, -2.07861328125, -1.6748046875, -1.27099609375, -0.8671875, -0.46337890625, -0.0595703125, 0.34423828125, 0.748046875, 1.15185546875, 1.5556640625, 1.95947265625, 2.36328125, 2.76708984375, 3.1708984375, 3.57470703125, 3.978515625, 4.38232421875, 4.7861328125, 5.18994140625, 5.59375, 5.99755859375, 6.4013671875, 6.80517578125, 7.208984375, 7.61279296875, 8.0166015625, 8.42041015625, 8.82421875, 9.22802734375, 9.6318359375, 10.03564453125, 10.439453125, 10.84326171875, 11.2470703125, 11.65087890625, 12.0546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 10.0, 10.0, 15.0, 12.0, 15.0, 17.0, 16.0, 24.0, 23.0, 26.0, 58.0, 44.0, 55.0, 70.0, 111.0, 142.0, 240.0, 1320.0, 201.0, 135.0, 79.0, 81.0, 63.0, 40.0, 46.0, 38.0, 35.0, 23.0, 26.0, 17.0, 13.0, 13.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0, -11.640380859375, -11.28076171875, -10.921142578125, -10.5615234375, -10.201904296875, -9.84228515625, -9.482666015625, -9.123046875, -8.763427734375, -8.40380859375, -8.044189453125, -7.6845703125, -7.324951171875, -6.96533203125, -6.605712890625, -6.24609375, -5.886474609375, -5.52685546875, -5.167236328125, -4.8076171875, -4.447998046875, -4.08837890625, -3.728759765625, -3.369140625, -3.009521484375, -2.64990234375, -2.290283203125, -1.9306640625, -1.571044921875, -1.21142578125, -0.851806640625, -0.4921875, -0.132568359375, 0.22705078125, 0.586669921875, 0.9462890625, 1.305908203125, 1.66552734375, 2.025146484375, 2.384765625, 2.744384765625, 3.10400390625, 3.463623046875, 3.8232421875, 4.182861328125, 4.54248046875, 4.902099609375, 5.26171875, 5.621337890625, 5.98095703125, 6.340576171875, 6.7001953125, 7.059814453125, 7.41943359375, 7.779052734375, 8.138671875, 8.498291015625, 8.85791015625, 9.217529296875, 9.5771484375, 9.936767578125, 10.29638671875, 10.656005859375, 11.015625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 6.0, 23.0, 23.0, 26.0, 46.0, 66.0, 98.0, 277.0, 1201.0, 13948.0, 1166593.0, 1943431.0, 17890.0, 1432.0, 307.0, 118.0, 44.0, 37.0, 24.0, 19.0, 14.0, 16.0, 10.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.1953125, -48.578125, -46.9609375, -45.34375, -43.7265625, -42.109375, -40.4921875, -38.875, -37.2578125, -35.640625, -34.0234375, -32.40625, -30.7890625, -29.171875, -27.5546875, -25.9375, -24.3203125, -22.703125, -21.0859375, -19.46875, -17.8515625, -16.234375, -14.6171875, -13.0, -11.3828125, -9.765625, -8.1484375, -6.53125, -4.9140625, -3.296875, -1.6796875, -0.0625, 1.5546875, 3.171875, 4.7890625, 6.40625, 8.0234375, 9.640625, 11.2578125, 12.875, 14.4921875, 16.109375, 17.7265625, 19.34375, 20.9609375, 22.578125, 24.1953125, 25.8125, 27.4296875, 29.046875, 30.6640625, 32.28125, 33.8984375, 35.515625, 37.1328125, 38.75, 40.3671875, 41.984375, 43.6015625, 45.21875, 46.8359375, 48.453125, 50.0703125, 51.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [3.0, 11.0, 47.0, 234.0, 419.0, 234.0, 50.0, 17.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.466659545898438, -12.729753494262695, -8.992847442626953, -5.2559404373168945, -1.5190343856811523, 2.2178726196289062, 5.954778671264648, 9.69168472290039, 13.428590774536133, 17.165496826171875, 20.902402877807617, 24.63930892944336, 28.376216888427734, 32.113121032714844, 35.85002899169922, 39.586936950683594, 43.3238410949707, 47.06074905395508, 50.79765319824219, 54.53456115722656, 58.27146530151367, 62.00837326049805, 65.74527740478516, 69.48218536376953, 73.2190933227539, 76.95600128173828, 80.69290924072266, 84.4298095703125, 88.16671752929688, 91.90362548828125, 95.64053344726562, 99.37744140625, 103.11434173583984, 106.85124969482422, 110.5881576538086, 114.32505798339844, 118.06196594238281, 121.79887390136719, 125.53578186035156, 129.27268981933594, 133.0095977783203, 136.7465057373047, 140.48341369628906, 144.22032165527344, 147.9572296142578, 151.69412231445312, 155.4310302734375, 159.16793823242188, 162.90484619140625, 166.64175415039062, 170.378662109375, 174.11557006835938, 177.85247802734375, 181.58938598632812, 185.32627868652344, 189.0631866455078, 192.8000946044922, 196.53700256347656, 200.27391052246094, 204.0108184814453, 207.7477264404297, 211.484619140625, 215.22152709960938, 218.95843505859375, 222.69534301757812]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 6.0, 7.0, 6.0, 6.0, 9.0, 18.0, 13.0, 16.0, 23.0, 21.0, 16.0, 19.0, 27.0, 26.0, 31.0, 35.0, 44.0, 38.0, 35.0, 42.0, 56.0, 41.0, 40.0, 41.0, 39.0, 38.0, 29.0, 29.0, 38.0, 28.0, 31.0, 15.0, 25.0, 19.0, 13.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.441776275634766, -30.3626708984375, -29.283565521240234, -28.20446014404297, -27.125354766845703, -26.046249389648438, -24.96714210510254, -23.888036727905273, -22.808931350708008, -21.729825973510742, -20.650720596313477, -19.57161521911621, -18.492507934570312, -17.413402557373047, -16.33429718017578, -15.255191802978516, -14.17608642578125, -13.096981048583984, -12.017875671386719, -10.938769340515137, -9.859663963317871, -8.780558586120605, -7.701452732086182, -6.622346878051758, -5.543241500854492, -4.464136123657227, -3.3850302696228027, -2.305924654006958, -1.2268190383911133, -0.14771366119384766, 0.9313921928405762, 2.010498046875, 3.0896034240722656, 4.168708801269531, 5.247814655303955, 6.326920509338379, 7.4060258865356445, 8.48513126373291, 9.564237594604492, 10.643342971801758, 11.722448348999023, 12.801553726196289, 13.880659103393555, 14.959765434265137, 16.03887176513672, 17.117977142333984, 18.19708251953125, 19.276187896728516, 20.35529327392578, 21.434398651123047, 22.513504028320312, 23.592609405517578, 24.671714782714844, 25.75082015991211, 26.829927444458008, 27.909032821655273, 28.98813819885254, 30.067243576049805, 31.14634895324707, 32.22545623779297, 33.304561614990234, 34.3836669921875, 35.462772369384766, 36.54187774658203, 37.6209831237793]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 9.0, 9.0, 15.0, 19.0, 18.0, 24.0, 27.0, 27.0, 41.0, 41.0, 40.0, 54.0, 46.0, 52.0, 49.0, 63.0, 72.0, 51.0, 47.0, 41.0, 41.0, 30.0, 31.0, 21.0, 30.0, 9.0, 18.0, 13.0, 12.0, 6.0, 8.0, 6.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.87481689453125, -3.7613525390625, -3.64788818359375, -3.534423828125, -3.42095947265625, -3.3074951171875, -3.19403076171875, -3.08056640625, -2.96710205078125, -2.8536376953125, -2.74017333984375, -2.626708984375, -2.51324462890625, -2.3997802734375, -2.28631591796875, -2.1728515625, -2.05938720703125, -1.9459228515625, -1.83245849609375, -1.718994140625, -1.60552978515625, -1.4920654296875, -1.37860107421875, -1.26513671875, -1.15167236328125, -1.0382080078125, -0.92474365234375, -0.811279296875, -0.69781494140625, -0.5843505859375, -0.47088623046875, -0.357421875, -0.24395751953125, -0.1304931640625, -0.01702880859375, 0.096435546875, 0.20989990234375, 0.3233642578125, 0.43682861328125, 0.55029296875, 0.66375732421875, 0.7772216796875, 0.89068603515625, 1.004150390625, 1.11761474609375, 1.2310791015625, 1.34454345703125, 1.4580078125, 1.57147216796875, 1.6849365234375, 1.79840087890625, 1.911865234375, 2.02532958984375, 2.1387939453125, 2.25225830078125, 2.36572265625, 2.47918701171875, 2.5926513671875, 2.70611572265625, 2.819580078125, 2.93304443359375, 3.0465087890625, 3.15997314453125, 3.2734375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 14.0, 11.0, 23.0, 29.0, 39.0, 39.0, 50.0, 71.0, 142.0, 204.0, 366.0, 698.0, 1675.0, 3989.0, 11958.0, 46327.0, 2741077.0, 1330302.0, 38408.0, 10987.0, 4145.0, 1767.0, 847.0, 432.0, 213.0, 146.0, 90.0, 67.0, 40.0, 25.0, 16.0, 20.0, 11.0, 16.0, 9.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 5.0], "bins": [-30.71875, -29.88720703125, -29.0556640625, -28.22412109375, -27.392578125, -26.56103515625, -25.7294921875, -24.89794921875, -24.06640625, -23.23486328125, -22.4033203125, -21.57177734375, -20.740234375, -19.90869140625, -19.0771484375, -18.24560546875, -17.4140625, -16.58251953125, -15.7509765625, -14.91943359375, -14.087890625, -13.25634765625, -12.4248046875, -11.59326171875, -10.76171875, -9.93017578125, -9.0986328125, -8.26708984375, -7.435546875, -6.60400390625, -5.7724609375, -4.94091796875, -4.109375, -3.27783203125, -2.4462890625, -1.61474609375, -0.783203125, 0.04833984375, 0.8798828125, 1.71142578125, 2.54296875, 3.37451171875, 4.2060546875, 5.03759765625, 5.869140625, 6.70068359375, 7.5322265625, 8.36376953125, 9.1953125, 10.02685546875, 10.8583984375, 11.68994140625, 12.521484375, 13.35302734375, 14.1845703125, 15.01611328125, 15.84765625, 16.67919921875, 17.5107421875, 18.34228515625, 19.173828125, 20.00537109375, 20.8369140625, 21.66845703125, 22.5]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 14.0, 9.0, 7.0, 15.0, 28.0, 44.0, 56.0, 99.0, 201.0, 420.0, 926.0, 1161.0, 538.0, 223.0, 109.0, 66.0, 45.0, 32.0, 22.0, 17.0, 15.0, 8.0, 6.0, 7.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.3443603515625, -9.774658203125, -9.2049560546875, -8.63525390625, -8.0655517578125, -7.495849609375, -6.9261474609375, -6.3564453125, -5.7867431640625, -5.217041015625, -4.6473388671875, -4.07763671875, -3.5079345703125, -2.938232421875, -2.3685302734375, -1.798828125, -1.2291259765625, -0.659423828125, -0.0897216796875, 0.47998046875, 1.0496826171875, 1.619384765625, 2.1890869140625, 2.7587890625, 3.3284912109375, 3.898193359375, 4.4678955078125, 5.03759765625, 5.6072998046875, 6.177001953125, 6.7467041015625, 7.31640625, 7.8861083984375, 8.455810546875, 9.0255126953125, 9.59521484375, 10.1649169921875, 10.734619140625, 11.3043212890625, 11.8740234375, 12.4437255859375, 13.013427734375, 13.5831298828125, 14.15283203125, 14.7225341796875, 15.292236328125, 15.8619384765625, 16.431640625, 17.0013427734375, 17.571044921875, 18.1407470703125, 18.71044921875, 19.2801513671875, 19.849853515625, 20.4195556640625, 20.9892578125, 21.5589599609375, 22.128662109375, 22.6983642578125, 23.26806640625, 23.8377685546875, 24.407470703125, 24.9771728515625, 25.546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 6.0, 6.0, 5.0, 15.0, 24.0, 27.0, 26.0, 46.0, 66.0, 112.0, 261.0, 664.0, 1763.0, 5334.0, 21139.0, 162026.0, 3789135.0, 182749.0, 22175.0, 5604.0, 1788.0, 671.0, 284.0, 140.0, 74.0, 39.0, 31.0, 19.0, 13.0, 15.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.109375, -25.720458984375, -24.33154296875, -22.942626953125, -21.5537109375, -20.164794921875, -18.77587890625, -17.386962890625, -15.998046875, -14.609130859375, -13.22021484375, -11.831298828125, -10.4423828125, -9.053466796875, -7.66455078125, -6.275634765625, -4.88671875, -3.497802734375, -2.10888671875, -0.719970703125, 0.6689453125, 2.057861328125, 3.44677734375, 4.835693359375, 6.224609375, 7.613525390625, 9.00244140625, 10.391357421875, 11.7802734375, 13.169189453125, 14.55810546875, 15.947021484375, 17.3359375, 18.724853515625, 20.11376953125, 21.502685546875, 22.8916015625, 24.280517578125, 25.66943359375, 27.058349609375, 28.447265625, 29.836181640625, 31.22509765625, 32.614013671875, 34.0029296875, 35.391845703125, 36.78076171875, 38.169677734375, 39.55859375, 40.947509765625, 42.33642578125, 43.725341796875, 45.1142578125, 46.503173828125, 47.89208984375, 49.281005859375, 50.669921875, 52.058837890625, 53.44775390625, 54.836669921875, 56.2255859375, 57.614501953125, 59.00341796875, 60.392333984375, 61.78125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 7.0, 4.0, 15.0, 18.0, 28.0, 44.0, 56.0, 82.0, 111.0, 142.0, 145.0, 116.0, 77.0, 39.0, 37.0, 33.0, 12.0, 9.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.72919273376465, -21.91128921508789, -20.0933837890625, -18.275480270385742, -16.457576751708984, -14.639671325683594, -12.821767807006836, -11.003863334655762, -9.185958862304688, -7.368054389953613, -5.550150394439697, -3.7322463989257812, -1.914341926574707, -0.09643745422363281, 1.721466064453125, 3.539370536804199, 5.357275009155273, 7.175179481506348, 8.993083953857422, 10.81098747253418, 12.628891944885254, 14.446796417236328, 16.264699935913086, 18.082603454589844, 19.900508880615234, 21.718412399291992, 23.536317825317383, 25.35422134399414, 27.17212677001953, 28.99003028869629, 30.807933807373047, 32.62583923339844, 34.44374084472656, 36.26164627075195, 38.07954788208008, 39.89745330810547, 41.71535873413086, 43.53326416015625, 45.351165771484375, 47.169071197509766, 48.986976623535156, 50.80488204956055, 52.62278366088867, 54.44068908691406, 56.25859451293945, 58.076499938964844, 59.89440155029297, 61.71230697631836, 63.530208587646484, 65.34811401367188, 67.166015625, 68.98391723632812, 70.80182647705078, 72.6197280883789, 74.43763732910156, 76.25553894042969, 78.07344055175781, 79.89134216308594, 81.7092514038086, 83.52715301513672, 85.34505462646484, 87.1629638671875, 88.98086547851562, 90.79876708984375, 92.6166763305664]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 12.0, 17.0, 16.0, 26.0, 17.0, 16.0, 27.0, 27.0, 33.0, 24.0, 35.0, 28.0, 39.0, 27.0, 38.0, 37.0, 48.0, 41.0, 33.0, 40.0, 34.0, 33.0, 39.0, 30.0, 33.0, 27.0, 30.0, 24.0, 25.0, 20.0, 18.0, 17.0, 13.0, 10.0, 13.0, 9.0, 4.0, 10.0, 6.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.889301300048828, -30.84830093383789, -29.807300567626953, -28.766300201416016, -27.725299835205078, -26.68429946899414, -25.643299102783203, -24.602298736572266, -23.561298370361328, -22.52029800415039, -21.479297637939453, -20.438297271728516, -19.397296905517578, -18.35629653930664, -17.315296173095703, -16.274295806884766, -15.233297348022461, -14.192296981811523, -13.151296615600586, -12.110296249389648, -11.069295883178711, -10.028295516967773, -8.987296104431152, -7.946295738220215, -6.905295372009277, -5.86429500579834, -4.823294639587402, -3.782294750213623, -2.7412943840026855, -1.700294017791748, -0.6592941284179688, 0.38170623779296875, 1.4227066040039062, 2.4637069702148438, 3.504707098007202, 4.5457072257995605, 5.586707592010498, 6.6277079582214355, 7.668707847595215, 8.709708213806152, 9.75070858001709, 10.791708946228027, 11.832709312438965, 12.873708724975586, 13.914709091186523, 14.955709457397461, 15.996709823608398, 17.037710189819336, 18.078710556030273, 19.11971092224121, 20.16071128845215, 21.201711654663086, 22.242712020874023, 23.28371238708496, 24.324710845947266, 25.365711212158203, 26.40671157836914, 27.447711944580078, 28.488712310791016, 29.529712677001953, 30.57071304321289, 31.611713409423828, 32.652713775634766, 33.6937141418457, 34.73471450805664]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 3.0, 8.0, 6.0, 14.0, 15.0, 6.0, 23.0, 17.0, 25.0, 31.0, 42.0, 43.0, 64.0, 53.0, 39.0, 52.0, 52.0, 58.0, 63.0, 45.0, 49.0, 49.0, 43.0, 33.0, 29.0, 28.0, 18.0, 14.0, 20.0, 13.0, 10.0, 7.0, 11.0, 7.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.795318603515625, -3.67266845703125, -3.550018310546875, -3.4273681640625, -3.304718017578125, -3.18206787109375, -3.059417724609375, -2.936767578125, -2.814117431640625, -2.69146728515625, -2.568817138671875, -2.4461669921875, -2.323516845703125, -2.20086669921875, -2.078216552734375, -1.95556640625, -1.832916259765625, -1.71026611328125, -1.587615966796875, -1.4649658203125, -1.342315673828125, -1.21966552734375, -1.097015380859375, -0.974365234375, -0.851715087890625, -0.72906494140625, -0.606414794921875, -0.4837646484375, -0.361114501953125, -0.23846435546875, -0.115814208984375, 0.0068359375, 0.129486083984375, 0.25213623046875, 0.374786376953125, 0.4974365234375, 0.620086669921875, 0.74273681640625, 0.865386962890625, 0.988037109375, 1.110687255859375, 1.23333740234375, 1.355987548828125, 1.4786376953125, 1.601287841796875, 1.72393798828125, 1.846588134765625, 1.96923828125, 2.091888427734375, 2.21453857421875, 2.337188720703125, 2.4598388671875, 2.582489013671875, 2.70513916015625, 2.827789306640625, 2.950439453125, 3.073089599609375, 3.19573974609375, 3.318389892578125, 3.4410400390625, 3.563690185546875, 3.68634033203125, 3.808990478515625, 3.931640625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 4.0, 12.0, 20.0, 34.0, 34.0, 47.0, 83.0, 113.0, 201.0, 340.0, 561.0, 1081.0, 1869.0, 3181.0, 5770.0, 10664.0, 21957.0, 67579.0, 336934.0, 450111.0, 93811.0, 26708.0, 12154.0, 6609.0, 3652.0, 2006.0, 1242.0, 725.0, 381.0, 227.0, 144.0, 94.0, 55.0, 40.0, 31.0, 14.0, 15.0, 13.0, 6.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5078125, -5.318603515625, -5.12939453125, -4.940185546875, -4.7509765625, -4.561767578125, -4.37255859375, -4.183349609375, -3.994140625, -3.804931640625, -3.61572265625, -3.426513671875, -3.2373046875, -3.048095703125, -2.85888671875, -2.669677734375, -2.48046875, -2.291259765625, -2.10205078125, -1.912841796875, -1.7236328125, -1.534423828125, -1.34521484375, -1.156005859375, -0.966796875, -0.777587890625, -0.58837890625, -0.399169921875, -0.2099609375, -0.020751953125, 0.16845703125, 0.357666015625, 0.546875, 0.736083984375, 0.92529296875, 1.114501953125, 1.3037109375, 1.492919921875, 1.68212890625, 1.871337890625, 2.060546875, 2.249755859375, 2.43896484375, 2.628173828125, 2.8173828125, 3.006591796875, 3.19580078125, 3.385009765625, 3.57421875, 3.763427734375, 3.95263671875, 4.141845703125, 4.3310546875, 4.520263671875, 4.70947265625, 4.898681640625, 5.087890625, 5.277099609375, 5.46630859375, 5.655517578125, 5.8447265625, 6.033935546875, 6.22314453125, 6.412353515625, 6.6015625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 5.0, 4.0, 15.0, 6.0, 8.0, 13.0, 19.0, 22.0, 22.0, 26.0, 27.0, 36.0, 33.0, 36.0, 35.0, 46.0, 41.0, 46.0, 38.0, 1072.0, 49.0, 35.0, 40.0, 30.0, 31.0, 34.0, 41.0, 29.0, 24.0, 23.0, 27.0, 26.0, 10.0, 11.0, 11.0, 10.0, 6.0, 10.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.115234375, -3.017333984375, -2.91943359375, -2.821533203125, -2.7236328125, -2.625732421875, -2.52783203125, -2.429931640625, -2.33203125, -2.234130859375, -2.13623046875, -2.038330078125, -1.9404296875, -1.842529296875, -1.74462890625, -1.646728515625, -1.548828125, -1.450927734375, -1.35302734375, -1.255126953125, -1.1572265625, -1.059326171875, -0.96142578125, -0.863525390625, -0.765625, -0.667724609375, -0.56982421875, -0.471923828125, -0.3740234375, -0.276123046875, -0.17822265625, -0.080322265625, 0.017578125, 0.115478515625, 0.21337890625, 0.311279296875, 0.4091796875, 0.507080078125, 0.60498046875, 0.702880859375, 0.80078125, 0.898681640625, 0.99658203125, 1.094482421875, 1.1923828125, 1.290283203125, 1.38818359375, 1.486083984375, 1.583984375, 1.681884765625, 1.77978515625, 1.877685546875, 1.9755859375, 2.073486328125, 2.17138671875, 2.269287109375, 2.3671875, 2.465087890625, 2.56298828125, 2.660888671875, 2.7587890625, 2.856689453125, 2.95458984375, 3.052490234375, 3.150390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 3.0, 2.0, 4.0, 8.0, 13.0, 21.0, 31.0, 35.0, 63.0, 78.0, 127.0, 134.0, 238.0, 347.0, 586.0, 882.0, 1660.0, 3143.0, 6798.0, 16062.0, 49902.0, 271076.0, 1519405.0, 164792.0, 36889.0, 12763.0, 5633.0, 2607.0, 1507.0, 807.0, 499.0, 305.0, 226.0, 140.0, 88.0, 74.0, 43.0, 34.0, 29.0, 19.0, 22.0, 10.0, 5.0, 8.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.734375, -3.602783203125, -3.47119140625, -3.339599609375, -3.2080078125, -3.076416015625, -2.94482421875, -2.813232421875, -2.681640625, -2.550048828125, -2.41845703125, -2.286865234375, -2.1552734375, -2.023681640625, -1.89208984375, -1.760498046875, -1.62890625, -1.497314453125, -1.36572265625, -1.234130859375, -1.1025390625, -0.970947265625, -0.83935546875, -0.707763671875, -0.576171875, -0.444580078125, -0.31298828125, -0.181396484375, -0.0498046875, 0.081787109375, 0.21337890625, 0.344970703125, 0.4765625, 0.608154296875, 0.73974609375, 0.871337890625, 1.0029296875, 1.134521484375, 1.26611328125, 1.397705078125, 1.529296875, 1.660888671875, 1.79248046875, 1.924072265625, 2.0556640625, 2.187255859375, 2.31884765625, 2.450439453125, 2.58203125, 2.713623046875, 2.84521484375, 2.976806640625, 3.1083984375, 3.239990234375, 3.37158203125, 3.503173828125, 3.634765625, 3.766357421875, 3.89794921875, 4.029541015625, 4.1611328125, 4.292724609375, 4.42431640625, 4.555908203125, 4.6875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 6.0, 8.0, 27.0, 50.0, 74.0, 313.0, 247.0, 84.0, 51.0, 16.0, 12.0, 10.0, 11.0, 2.0, 9.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255859375, -1.203399658203125, -1.15093994140625, -1.098480224609375, -1.0460205078125, -0.993560791015625, -0.94110107421875, -0.888641357421875, -0.836181640625, -0.783721923828125, -0.73126220703125, -0.678802490234375, -0.6263427734375, -0.573883056640625, -0.52142333984375, -0.468963623046875, -0.41650390625, -0.364044189453125, -0.31158447265625, -0.259124755859375, -0.2066650390625, -0.154205322265625, -0.10174560546875, -0.049285888671875, 0.003173828125, 0.055633544921875, 0.10809326171875, 0.160552978515625, 0.2130126953125, 0.265472412109375, 0.31793212890625, 0.370391845703125, 0.4228515625, 0.475311279296875, 0.52777099609375, 0.580230712890625, 0.6326904296875, 0.685150146484375, 0.73760986328125, 0.790069580078125, 0.842529296875, 0.894989013671875, 0.94744873046875, 0.999908447265625, 1.0523681640625, 1.104827880859375, 1.15728759765625, 1.209747314453125, 1.26220703125, 1.314666748046875, 1.36712646484375, 1.419586181640625, 1.4720458984375, 1.524505615234375, 1.57696533203125, 1.629425048828125, 1.681884765625, 1.734344482421875, 1.78680419921875, 1.839263916015625, 1.8917236328125, 1.944183349609375, 1.99664306640625, 2.049102783203125, 2.1015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 8.0, 14.0, 22.0, 20.0, 29.0, 28.0, 49.0, 61.0, 140.0, 878.0, 7412.0, 904813.0, 129106.0, 4956.0, 572.0, 118.0, 66.0, 44.0, 27.0, 37.0, 19.0, 18.0, 17.0, 8.0, 19.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.671875, -23.81884765625, -22.9658203125, -22.11279296875, -21.259765625, -20.40673828125, -19.5537109375, -18.70068359375, -17.84765625, -16.99462890625, -16.1416015625, -15.28857421875, -14.435546875, -13.58251953125, -12.7294921875, -11.87646484375, -11.0234375, -10.17041015625, -9.3173828125, -8.46435546875, -7.611328125, -6.75830078125, -5.9052734375, -5.05224609375, -4.19921875, -3.34619140625, -2.4931640625, -1.64013671875, -0.787109375, 0.06591796875, 0.9189453125, 1.77197265625, 2.625, 3.47802734375, 4.3310546875, 5.18408203125, 6.037109375, 6.89013671875, 7.7431640625, 8.59619140625, 9.44921875, 10.30224609375, 11.1552734375, 12.00830078125, 12.861328125, 13.71435546875, 14.5673828125, 15.42041015625, 16.2734375, 17.12646484375, 17.9794921875, 18.83251953125, 19.685546875, 20.53857421875, 21.3916015625, 22.24462890625, 23.09765625, 23.95068359375, 24.8037109375, 25.65673828125, 26.509765625, 27.36279296875, 28.2158203125, 29.06884765625, 29.921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 23.0, 32.0, 58.0, 118.0, 203.0, 270.0, 164.0, 51.0, 39.0, 15.0, 5.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910794973373413, -3.7719953060150146, -3.6331958770751953, -3.494396209716797, -3.3555965423583984, -3.216796875, -3.0779972076416016, -2.9391977787017822, -2.800398111343384, -2.6615984439849854, -2.522799015045166, -2.3839993476867676, -2.245199680328369, -2.1064000129699707, -1.9676004648208618, -1.828800916671753, -1.6900012493133545, -1.551201581954956, -1.4124020338058472, -1.2736024856567383, -1.1348028182983398, -0.9960032105445862, -0.8572036027908325, -0.7184039950370789, -0.5796043872833252, -0.44080477952957153, -0.30200517177581787, -0.1632055640220642, -0.024405956268310547, 0.11439365148544312, 0.2531932592391968, 0.39199286699295044, 0.530792236328125, 0.6695918440818787, 0.8083914518356323, 0.947191059589386, 1.0859906673431396, 1.224790334701538, 1.363589882850647, 1.5023894309997559, 1.6411890983581543, 1.7799887657165527, 1.9187883138656616, 2.0575878620147705, 2.196387529373169, 2.3351871967315674, 2.4739866256713867, 2.612786293029785, 2.7515859603881836, 2.890385627746582, 3.0291852951049805, 3.1679847240448, 3.3067843914031982, 3.4455840587615967, 3.584383487701416, 3.7231831550598145, 3.861982822418213, 4.000782489776611, 4.13958215713501, 4.278381824493408, 4.417181015014648, 4.555980682373047, 4.694780349731445, 4.833580017089844, 4.972379684448242]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 11.0, 11.0, 8.0, 11.0, 15.0, 21.0, 16.0, 22.0, 30.0, 21.0, 27.0, 34.0, 49.0, 30.0, 44.0, 34.0, 37.0, 60.0, 38.0, 48.0, 43.0, 38.0, 45.0, 36.0, 29.0, 31.0, 32.0, 28.0, 18.0, 21.0, 16.0, 17.0, 16.0, 11.0, 7.0, 10.0, 9.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9071562886238098, -0.876125156879425, -0.8450940251350403, -0.8140628337860107, -0.783031702041626, -0.7520005702972412, -0.7209694385528564, -0.6899383068084717, -0.6589071750640869, -0.6278760433197021, -0.5968449115753174, -0.5658137798309326, -0.5347825884819031, -0.5037514567375183, -0.47272032499313354, -0.4416891932487488, -0.41065800189971924, -0.3796268701553345, -0.3485957086086273, -0.31756457686424255, -0.2865334153175354, -0.25550228357315063, -0.22447115182876587, -0.1934400051832199, -0.16240885853767395, -0.131377711892128, -0.10034657269716263, -0.06931543350219727, -0.038284286856651306, -0.007253140211105347, 0.02377799153327942, 0.05480913817882538, 0.08584022521972656, 0.11687137186527252, 0.14790251851081848, 0.17893365025520325, 0.2099647969007492, 0.24099594354629517, 0.27202707529067993, 0.3030582070350647, 0.33408936858177185, 0.3651205003261566, 0.39615166187286377, 0.42718279361724854, 0.4582139253616333, 0.48924508690834045, 0.5202761888504028, 0.5513073801994324, 0.5823385119438171, 0.6133696436882019, 0.6444007754325867, 0.6754319667816162, 0.706463098526001, 0.7374942302703857, 0.7685253620147705, 0.7995564937591553, 0.83058762550354, 0.8616187572479248, 0.8926498889923096, 0.9236810207366943, 0.9547122120857239, 0.9857433438301086, 1.0167744159698486, 1.047805666923523, 1.0788367986679077]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 13.0, 13.0, 19.0, 14.0, 15.0, 19.0, 21.0, 26.0, 41.0, 45.0, 48.0, 51.0, 50.0, 48.0, 58.0, 74.0, 49.0, 62.0, 54.0, 35.0, 42.0, 29.0, 32.0, 20.0, 23.0, 14.0, 20.0, 16.0, 9.0, 7.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84765625, -3.7235107421875, -3.599365234375, -3.4752197265625, -3.35107421875, -3.2269287109375, -3.102783203125, -2.9786376953125, -2.8544921875, -2.7303466796875, -2.606201171875, -2.4820556640625, -2.35791015625, -2.2337646484375, -2.109619140625, -1.9854736328125, -1.861328125, -1.7371826171875, -1.613037109375, -1.4888916015625, -1.36474609375, -1.2406005859375, -1.116455078125, -0.9923095703125, -0.8681640625, -0.7440185546875, -0.619873046875, -0.4957275390625, -0.37158203125, -0.2474365234375, -0.123291015625, 0.0008544921875, 0.125, 0.2491455078125, 0.373291015625, 0.4974365234375, 0.62158203125, 0.7457275390625, 0.869873046875, 0.9940185546875, 1.1181640625, 1.2423095703125, 1.366455078125, 1.4906005859375, 1.61474609375, 1.7388916015625, 1.863037109375, 1.9871826171875, 2.111328125, 2.2354736328125, 2.359619140625, 2.4837646484375, 2.60791015625, 2.7320556640625, 2.856201171875, 2.9803466796875, 3.1044921875, 3.2286376953125, 3.352783203125, 3.4769287109375, 3.60107421875, 3.7252197265625, 3.849365234375, 3.9735107421875, 4.09765625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 10.0, 11.0, 26.0, 22.0, 38.0, 65.0, 67.0, 131.0, 162.0, 272.0, 413.0, 655.0, 1099.0, 1991.0, 3572.0, 7302.0, 15765.0, 40561.0, 125012.0, 405368.0, 303152.0, 87319.0, 30073.0, 12469.0, 5782.0, 2972.0, 1608.0, 1004.0, 541.0, 371.0, 247.0, 135.0, 105.0, 69.0, 53.0, 25.0, 24.0, 23.0, 11.0, 8.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.25390625, -5.1031494140625, -4.952392578125, -4.8016357421875, -4.65087890625, -4.5001220703125, -4.349365234375, -4.1986083984375, -4.0478515625, -3.8970947265625, -3.746337890625, -3.5955810546875, -3.44482421875, -3.2940673828125, -3.143310546875, -2.9925537109375, -2.841796875, -2.6910400390625, -2.540283203125, -2.3895263671875, -2.23876953125, -2.0880126953125, -1.937255859375, -1.7864990234375, -1.6357421875, -1.4849853515625, -1.334228515625, -1.1834716796875, -1.03271484375, -0.8819580078125, -0.731201171875, -0.5804443359375, -0.4296875, -0.2789306640625, -0.128173828125, 0.0225830078125, 0.17333984375, 0.3240966796875, 0.474853515625, 0.6256103515625, 0.7763671875, 0.9271240234375, 1.077880859375, 1.2286376953125, 1.37939453125, 1.5301513671875, 1.680908203125, 1.8316650390625, 1.982421875, 2.1331787109375, 2.283935546875, 2.4346923828125, 2.58544921875, 2.7362060546875, 2.886962890625, 3.0377197265625, 3.1884765625, 3.3392333984375, 3.489990234375, 3.6407470703125, 3.79150390625, 3.9422607421875, 4.093017578125, 4.2437744140625, 4.39453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 4.0, 9.0, 9.0, 10.0, 8.0, 11.0, 14.0, 17.0, 19.0, 23.0, 21.0, 34.0, 26.0, 28.0, 55.0, 51.0, 57.0, 61.0, 54.0, 113.0, 288.0, 1438.0, 158.0, 78.0, 52.0, 72.0, 54.0, 36.0, 41.0, 36.0, 21.0, 28.0, 16.0, 15.0, 20.0, 10.0, 11.0, 15.0, 6.0, 10.0, 3.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.1171875, -11.715087890625, -11.31298828125, -10.910888671875, -10.5087890625, -10.106689453125, -9.70458984375, -9.302490234375, -8.900390625, -8.498291015625, -8.09619140625, -7.694091796875, -7.2919921875, -6.889892578125, -6.48779296875, -6.085693359375, -5.68359375, -5.281494140625, -4.87939453125, -4.477294921875, -4.0751953125, -3.673095703125, -3.27099609375, -2.868896484375, -2.466796875, -2.064697265625, -1.66259765625, -1.260498046875, -0.8583984375, -0.456298828125, -0.05419921875, 0.347900390625, 0.75, 1.152099609375, 1.55419921875, 1.956298828125, 2.3583984375, 2.760498046875, 3.16259765625, 3.564697265625, 3.966796875, 4.368896484375, 4.77099609375, 5.173095703125, 5.5751953125, 5.977294921875, 6.37939453125, 6.781494140625, 7.18359375, 7.585693359375, 7.98779296875, 8.389892578125, 8.7919921875, 9.194091796875, 9.59619140625, 9.998291015625, 10.400390625, 10.802490234375, 11.20458984375, 11.606689453125, 12.0087890625, 12.410888671875, 12.81298828125, 13.215087890625, 13.6171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 3.0, 1.0, 4.0, 6.0, 2.0, 14.0, 12.0, 14.0, 21.0, 32.0, 33.0, 46.0, 79.0, 118.0, 186.0, 276.0, 470.0, 876.0, 2060.0, 5296.0, 17477.0, 106688.0, 2728712.0, 244618.0, 26280.0, 7111.0, 2563.0, 1157.0, 604.0, 310.0, 200.0, 113.0, 83.0, 67.0, 34.0, 39.0, 31.0, 15.0, 8.0, 9.0, 10.0, 9.0, 12.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.453857421875, -23.70458984375, -22.955322265625, -22.2060546875, -21.456787109375, -20.70751953125, -19.958251953125, -19.208984375, -18.459716796875, -17.71044921875, -16.961181640625, -16.2119140625, -15.462646484375, -14.71337890625, -13.964111328125, -13.21484375, -12.465576171875, -11.71630859375, -10.967041015625, -10.2177734375, -9.468505859375, -8.71923828125, -7.969970703125, -7.220703125, -6.471435546875, -5.72216796875, -4.972900390625, -4.2236328125, -3.474365234375, -2.72509765625, -1.975830078125, -1.2265625, -0.477294921875, 0.27197265625, 1.021240234375, 1.7705078125, 2.519775390625, 3.26904296875, 4.018310546875, 4.767578125, 5.516845703125, 6.26611328125, 7.015380859375, 7.7646484375, 8.513916015625, 9.26318359375, 10.012451171875, 10.76171875, 11.510986328125, 12.26025390625, 13.009521484375, 13.7587890625, 14.508056640625, 15.25732421875, 16.006591796875, 16.755859375, 17.505126953125, 18.25439453125, 19.003662109375, 19.7529296875, 20.502197265625, 21.25146484375, 22.000732421875, 22.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 22.0, 181.0, 554.0, 214.0, 34.0, 5.0], "bins": [-302.636474609375, -297.6337890625, -292.6310729980469, -287.6283874511719, -282.6257019042969, -277.6230163574219, -272.62030029296875, -267.61761474609375, -262.61492919921875, -257.61224365234375, -252.6095428466797, -247.60684204101562, -242.60415649414062, -237.60145568847656, -232.59877014160156, -227.5960693359375, -222.59336853027344, -217.59066772460938, -212.58798217773438, -207.5852813720703, -202.5825958251953, -197.57989501953125, -192.57720947265625, -187.5745086669922, -182.57180786132812, -177.56910705566406, -172.56642150878906, -167.563720703125, -162.56103515625, -157.55833435058594, -152.55564880371094, -147.55294799804688, -142.5502471923828, -137.54754638671875, -132.54486083984375, -127.54216766357422, -122.53947448730469, -117.53677368164062, -112.5340805053711, -107.53138732910156, -102.52870178222656, -97.52600860595703, -92.5233154296875, -87.52062225341797, -82.51792907714844, -77.51522827148438, -72.51253509521484, -67.50984191894531, -62.507144927978516, -57.504451751708984, -52.50175476074219, -47.499061584472656, -42.496368408203125, -37.493675231933594, -32.49098205566406, -27.488285064697266, -22.485591888427734, -17.482898712158203, -12.480203628540039, -7.477509498596191, -2.4748153686523438, 2.5278778076171875, 7.530572891235352, 12.533267974853516, 17.535961151123047]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 8.0, 8.0, 11.0, 15.0, 14.0, 12.0, 16.0, 18.0, 20.0, 18.0, 17.0, 28.0, 30.0, 41.0, 37.0, 46.0, 39.0, 45.0, 35.0, 34.0, 48.0, 46.0, 39.0, 43.0, 39.0, 33.0, 43.0, 27.0, 29.0, 21.0, 22.0, 20.0, 16.0, 13.0, 9.0, 6.0, 9.0, 9.0, 10.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-45.60725021362305, -44.210269927978516, -42.813289642333984, -41.41630935668945, -40.01932907104492, -38.62234878540039, -37.22536849975586, -35.82838821411133, -34.4314079284668, -33.034427642822266, -31.637447357177734, -30.240467071533203, -28.843486785888672, -27.44650650024414, -26.04952621459961, -24.652545928955078, -23.255565643310547, -21.858585357666016, -20.461605072021484, -19.064624786376953, -17.667644500732422, -16.27066421508789, -14.87368392944336, -13.476703643798828, -12.079723358154297, -10.682743072509766, -9.285762786865234, -7.888782501220703, -6.491802215576172, -5.094821929931641, -3.6978416442871094, -2.300861358642578, -0.9038772583007812, 0.49310302734375, 1.8900833129882812, 3.2870635986328125, 4.684043884277344, 6.081024169921875, 7.478004455566406, 8.874984741210938, 10.271965026855469, 11.6689453125, 13.065925598144531, 14.462905883789062, 15.859886169433594, 17.256866455078125, 18.653846740722656, 20.050827026367188, 21.44780731201172, 22.84478759765625, 24.24176788330078, 25.638748168945312, 27.035728454589844, 28.432708740234375, 29.829689025878906, 31.226669311523438, 32.62364959716797, 34.0206298828125, 35.41761016845703, 36.81459045410156, 38.211570739746094, 39.608551025390625, 41.005531311035156, 42.40251159667969, 43.79949188232422]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 4.0, 4.0, 6.0, 9.0, 13.0, 11.0, 17.0, 9.0, 28.0, 29.0, 29.0, 37.0, 51.0, 44.0, 57.0, 41.0, 61.0, 45.0, 58.0, 51.0, 51.0, 55.0, 36.0, 41.0, 27.0, 38.0, 25.0, 19.0, 20.0, 12.0, 16.0, 14.0, 6.0, 9.0, 6.0, 3.0, 9.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.894317626953125, -3.77301025390625, -3.651702880859375, -3.5303955078125, -3.409088134765625, -3.28778076171875, -3.166473388671875, -3.045166015625, -2.923858642578125, -2.80255126953125, -2.681243896484375, -2.5599365234375, -2.438629150390625, -2.31732177734375, -2.196014404296875, -2.07470703125, -1.953399658203125, -1.83209228515625, -1.710784912109375, -1.5894775390625, -1.468170166015625, -1.34686279296875, -1.225555419921875, -1.104248046875, -0.982940673828125, -0.86163330078125, -0.740325927734375, -0.6190185546875, -0.497711181640625, -0.37640380859375, -0.255096435546875, -0.1337890625, -0.012481689453125, 0.10882568359375, 0.230133056640625, 0.3514404296875, 0.472747802734375, 0.59405517578125, 0.715362548828125, 0.836669921875, 0.957977294921875, 1.07928466796875, 1.200592041015625, 1.3218994140625, 1.443206787109375, 1.56451416015625, 1.685821533203125, 1.80712890625, 1.928436279296875, 2.04974365234375, 2.171051025390625, 2.2923583984375, 2.413665771484375, 2.53497314453125, 2.656280517578125, 2.777587890625, 2.898895263671875, 3.02020263671875, 3.141510009765625, 3.2628173828125, 3.384124755859375, 3.50543212890625, 3.626739501953125, 3.748046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 11.0, 10.0, 24.0, 29.0, 32.0, 75.0, 96.0, 124.0, 196.0, 287.0, 429.0, 606.0, 869.0, 1360.0, 2145.0, 3649.0, 6060.0, 10913.0, 21117.0, 51826.0, 393173.0, 3309380.0, 298958.0, 46440.0, 19530.0, 10389.0, 6065.0, 3657.0, 2237.0, 1460.0, 999.0, 641.0, 430.0, 314.0, 227.0, 154.0, 109.0, 72.0, 56.0, 28.0, 32.0, 20.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.450927734375, -14.01904296875, -13.587158203125, -13.1552734375, -12.723388671875, -12.29150390625, -11.859619140625, -11.427734375, -10.995849609375, -10.56396484375, -10.132080078125, -9.7001953125, -9.268310546875, -8.83642578125, -8.404541015625, -7.97265625, -7.540771484375, -7.10888671875, -6.677001953125, -6.2451171875, -5.813232421875, -5.38134765625, -4.949462890625, -4.517578125, -4.085693359375, -3.65380859375, -3.221923828125, -2.7900390625, -2.358154296875, -1.92626953125, -1.494384765625, -1.0625, -0.630615234375, -0.19873046875, 0.233154296875, 0.6650390625, 1.096923828125, 1.52880859375, 1.960693359375, 2.392578125, 2.824462890625, 3.25634765625, 3.688232421875, 4.1201171875, 4.552001953125, 4.98388671875, 5.415771484375, 5.84765625, 6.279541015625, 6.71142578125, 7.143310546875, 7.5751953125, 8.007080078125, 8.43896484375, 8.870849609375, 9.302734375, 9.734619140625, 10.16650390625, 10.598388671875, 11.0302734375, 11.462158203125, 11.89404296875, 12.325927734375, 12.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 15.0, 14.0, 19.0, 34.0, 39.0, 45.0, 75.0, 139.0, 241.0, 511.0, 951.0, 850.0, 454.0, 246.0, 123.0, 65.0, 49.0, 42.0, 31.0, 17.0, 15.0, 14.0, 11.0, 8.0, 6.0, 8.0, 2.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.46875, -14.984130859375, -14.49951171875, -14.014892578125, -13.5302734375, -13.045654296875, -12.56103515625, -12.076416015625, -11.591796875, -11.107177734375, -10.62255859375, -10.137939453125, -9.6533203125, -9.168701171875, -8.68408203125, -8.199462890625, -7.71484375, -7.230224609375, -6.74560546875, -6.260986328125, -5.7763671875, -5.291748046875, -4.80712890625, -4.322509765625, -3.837890625, -3.353271484375, -2.86865234375, -2.384033203125, -1.8994140625, -1.414794921875, -0.93017578125, -0.445556640625, 0.0390625, 0.523681640625, 1.00830078125, 1.492919921875, 1.9775390625, 2.462158203125, 2.94677734375, 3.431396484375, 3.916015625, 4.400634765625, 4.88525390625, 5.369873046875, 5.8544921875, 6.339111328125, 6.82373046875, 7.308349609375, 7.79296875, 8.277587890625, 8.76220703125, 9.246826171875, 9.7314453125, 10.216064453125, 10.70068359375, 11.185302734375, 11.669921875, 12.154541015625, 12.63916015625, 13.123779296875, 13.6083984375, 14.093017578125, 14.57763671875, 15.062255859375, 15.546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 6.0, 15.0, 18.0, 23.0, 37.0, 46.0, 96.0, 190.0, 341.0, 665.0, 1384.0, 2914.0, 6367.0, 15699.0, 47008.0, 285682.0, 3455714.0, 301860.0, 47859.0, 15994.0, 6545.0, 2943.0, 1413.0, 653.0, 354.0, 190.0, 79.0, 70.0, 44.0, 16.0, 17.0, 11.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.875, -27.896484375, -26.91796875, -25.939453125, -24.9609375, -23.982421875, -23.00390625, -22.025390625, -21.046875, -20.068359375, -19.08984375, -18.111328125, -17.1328125, -16.154296875, -15.17578125, -14.197265625, -13.21875, -12.240234375, -11.26171875, -10.283203125, -9.3046875, -8.326171875, -7.34765625, -6.369140625, -5.390625, -4.412109375, -3.43359375, -2.455078125, -1.4765625, -0.498046875, 0.48046875, 1.458984375, 2.4375, 3.416015625, 4.39453125, 5.373046875, 6.3515625, 7.330078125, 8.30859375, 9.287109375, 10.265625, 11.244140625, 12.22265625, 13.201171875, 14.1796875, 15.158203125, 16.13671875, 17.115234375, 18.09375, 19.072265625, 20.05078125, 21.029296875, 22.0078125, 22.986328125, 23.96484375, 24.943359375, 25.921875, 26.900390625, 27.87890625, 28.857421875, 29.8359375, 30.814453125, 31.79296875, 32.771484375, 33.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 6.0, 21.0, 22.0, 28.0, 40.0, 66.0, 72.0, 100.0, 150.0, 109.0, 99.0, 76.0, 46.0, 44.0, 15.0, 28.0, 12.0, 9.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.2528190612793, -55.40382766723633, -53.55483627319336, -51.70584487915039, -49.85685348510742, -48.00786209106445, -46.158870697021484, -44.309879302978516, -42.46088790893555, -40.61189651489258, -38.76290512084961, -36.91391372680664, -35.06492233276367, -33.2159309387207, -31.366939544677734, -29.517948150634766, -27.668956756591797, -25.819965362548828, -23.97097396850586, -22.12198257446289, -20.272991180419922, -18.423999786376953, -16.575008392333984, -14.726016998291016, -12.877025604248047, -11.028034210205078, -9.17904281616211, -7.330051422119141, -5.481060028076172, -3.632068634033203, -1.7830772399902344, 0.06591415405273438, 1.9149093627929688, 3.7639007568359375, 5.612892150878906, 7.461883544921875, 9.310874938964844, 11.159866333007812, 13.008857727050781, 14.85784912109375, 16.70684051513672, 18.555831909179688, 20.404823303222656, 22.253814697265625, 24.102806091308594, 25.951797485351562, 27.80078887939453, 29.6497802734375, 31.49877166748047, 33.34776306152344, 35.196754455566406, 37.045745849609375, 38.894737243652344, 40.74372863769531, 42.59272003173828, 44.44171142578125, 46.29070281982422, 48.13969421386719, 49.988685607910156, 51.837677001953125, 53.686668395996094, 55.53565979003906, 57.38465118408203, 59.233642578125, 61.08263397216797]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 7.0, 3.0, 5.0, 6.0, 5.0, 7.0, 11.0, 17.0, 16.0, 12.0, 20.0, 33.0, 21.0, 26.0, 28.0, 38.0, 33.0, 31.0, 38.0, 33.0, 53.0, 35.0, 44.0, 28.0, 33.0, 22.0, 39.0, 41.0, 36.0, 29.0, 24.0, 22.0, 35.0, 26.0, 14.0, 17.0, 21.0, 10.0, 11.0, 11.0, 12.0, 8.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-36.570594787597656, -35.454071044921875, -34.337547302246094, -33.22102737426758, -32.1045036315918, -30.987979888916016, -29.871456146240234, -28.754932403564453, -27.638410568237305, -26.521886825561523, -25.405364990234375, -24.288841247558594, -23.172317504882812, -22.055795669555664, -20.939271926879883, -19.822750091552734, -18.706226348876953, -17.589702606201172, -16.473180770874023, -15.356657028198242, -14.240134239196777, -13.123611450195312, -12.007087707519531, -10.890564918518066, -9.774042129516602, -8.657519340515137, -7.540996074676514, -6.424472808837891, -5.307950019836426, -4.191427230834961, -3.074903964996338, -1.9583806991577148, -0.8418540954589844, 0.27466893196105957, 1.3911919593811035, 2.5077149868011475, 3.6242380142211914, 4.740760803222656, 5.857284069061279, 6.973807334899902, 8.090330123901367, 9.206852912902832, 10.323375701904297, 11.439899444580078, 12.556422233581543, 13.672945022583008, 14.789468765258789, 15.905991554260254, 17.02251434326172, 18.1390380859375, 19.25555992126465, 20.37208366394043, 21.488605499267578, 22.60512924194336, 23.72165298461914, 24.838176727294922, 25.95469856262207, 27.07122230529785, 28.187744140625, 29.30426788330078, 30.420791625976562, 31.53731346130371, 32.65383529663086, 33.77035903930664, 34.88688278198242]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 13.0, 7.0, 8.0, 14.0, 18.0, 13.0, 22.0, 23.0, 23.0, 36.0, 38.0, 53.0, 39.0, 44.0, 52.0, 57.0, 56.0, 63.0, 60.0, 40.0, 43.0, 36.0, 32.0, 39.0, 29.0, 25.0, 21.0, 15.0, 16.0, 6.0, 14.0, 7.0, 9.0, 6.0, 3.0, 2.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.16796875, -4.044158935546875, -3.92034912109375, -3.796539306640625, -3.6727294921875, -3.548919677734375, -3.42510986328125, -3.301300048828125, -3.177490234375, -3.053680419921875, -2.92987060546875, -2.806060791015625, -2.6822509765625, -2.558441162109375, -2.43463134765625, -2.310821533203125, -2.18701171875, -2.063201904296875, -1.93939208984375, -1.815582275390625, -1.6917724609375, -1.567962646484375, -1.44415283203125, -1.320343017578125, -1.196533203125, -1.072723388671875, -0.94891357421875, -0.825103759765625, -0.7012939453125, -0.577484130859375, -0.45367431640625, -0.329864501953125, -0.2060546875, -0.082244873046875, 0.04156494140625, 0.165374755859375, 0.2891845703125, 0.412994384765625, 0.53680419921875, 0.660614013671875, 0.784423828125, 0.908233642578125, 1.03204345703125, 1.155853271484375, 1.2796630859375, 1.403472900390625, 1.52728271484375, 1.651092529296875, 1.77490234375, 1.898712158203125, 2.02252197265625, 2.146331787109375, 2.2701416015625, 2.393951416015625, 2.51776123046875, 2.641571044921875, 2.765380859375, 2.889190673828125, 3.01300048828125, 3.136810302734375, 3.2606201171875, 3.384429931640625, 3.50823974609375, 3.632049560546875, 3.755859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 7.0, 11.0, 14.0, 38.0, 38.0, 65.0, 93.0, 142.0, 260.0, 384.0, 553.0, 859.0, 1299.0, 2060.0, 3277.0, 5236.0, 8837.0, 15386.0, 28333.0, 57788.0, 138166.0, 355433.0, 243688.0, 92745.0, 41878.0, 21450.0, 12002.0, 6928.0, 4166.0, 2633.0, 1661.0, 1073.0, 726.0, 446.0, 299.0, 193.0, 113.0, 88.0, 58.0, 38.0, 24.0, 24.0, 7.0, 9.0, 8.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.1636962890625, -11.725830078125, -11.2879638671875, -10.85009765625, -10.4122314453125, -9.974365234375, -9.5364990234375, -9.0986328125, -8.6607666015625, -8.222900390625, -7.7850341796875, -7.34716796875, -6.9093017578125, -6.471435546875, -6.0335693359375, -5.595703125, -5.1578369140625, -4.719970703125, -4.2821044921875, -3.84423828125, -3.4063720703125, -2.968505859375, -2.5306396484375, -2.0927734375, -1.6549072265625, -1.217041015625, -0.7791748046875, -0.34130859375, 0.0965576171875, 0.534423828125, 0.9722900390625, 1.41015625, 1.8480224609375, 2.285888671875, 2.7237548828125, 3.16162109375, 3.5994873046875, 4.037353515625, 4.4752197265625, 4.9130859375, 5.3509521484375, 5.788818359375, 6.2266845703125, 6.66455078125, 7.1024169921875, 7.540283203125, 7.9781494140625, 8.416015625, 8.8538818359375, 9.291748046875, 9.7296142578125, 10.16748046875, 10.6053466796875, 11.043212890625, 11.4810791015625, 11.9189453125, 12.3568115234375, 12.794677734375, 13.2325439453125, 13.67041015625, 14.1082763671875, 14.546142578125, 14.9840087890625, 15.421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 5.0, 2.0, 6.0, 10.0, 9.0, 12.0, 14.0, 13.0, 10.0, 16.0, 18.0, 28.0, 20.0, 23.0, 28.0, 30.0, 31.0, 29.0, 34.0, 37.0, 33.0, 23.0, 35.0, 37.0, 1054.0, 33.0, 28.0, 40.0, 33.0, 30.0, 33.0, 12.0, 39.0, 32.0, 30.0, 16.0, 19.0, 20.0, 13.0, 13.0, 17.0, 10.0, 15.0, 5.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-3.072265625, -2.981964111328125, -2.89166259765625, -2.801361083984375, -2.7110595703125, -2.620758056640625, -2.53045654296875, -2.440155029296875, -2.349853515625, -2.259552001953125, -2.16925048828125, -2.078948974609375, -1.9886474609375, -1.898345947265625, -1.80804443359375, -1.717742919921875, -1.62744140625, -1.537139892578125, -1.44683837890625, -1.356536865234375, -1.2662353515625, -1.175933837890625, -1.08563232421875, -0.995330810546875, -0.905029296875, -0.814727783203125, -0.72442626953125, -0.634124755859375, -0.5438232421875, -0.453521728515625, -0.36322021484375, -0.272918701171875, -0.1826171875, -0.092315673828125, -0.00201416015625, 0.088287353515625, 0.1785888671875, 0.268890380859375, 0.35919189453125, 0.449493408203125, 0.539794921875, 0.630096435546875, 0.72039794921875, 0.810699462890625, 0.9010009765625, 0.991302490234375, 1.08160400390625, 1.171905517578125, 1.26220703125, 1.352508544921875, 1.44281005859375, 1.533111572265625, 1.6234130859375, 1.713714599609375, 1.80401611328125, 1.894317626953125, 1.984619140625, 2.074920654296875, 2.16522216796875, 2.255523681640625, 2.3458251953125, 2.436126708984375, 2.52642822265625, 2.616729736328125, 2.70703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 11.0, 21.0, 14.0, 23.0, 22.0, 42.0, 58.0, 79.0, 134.0, 176.0, 266.0, 405.0, 558.0, 868.0, 1407.0, 2270.0, 4019.0, 6997.0, 13990.0, 32049.0, 104993.0, 844906.0, 910462.0, 108842.0, 32706.0, 13998.0, 7210.0, 4129.0, 2390.0, 1386.0, 857.0, 575.0, 392.0, 240.0, 177.0, 142.0, 87.0, 85.0, 42.0, 32.0, 16.0, 14.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-12.7421875, -12.356201171875, -11.97021484375, -11.584228515625, -11.1982421875, -10.812255859375, -10.42626953125, -10.040283203125, -9.654296875, -9.268310546875, -8.88232421875, -8.496337890625, -8.1103515625, -7.724365234375, -7.33837890625, -6.952392578125, -6.56640625, -6.180419921875, -5.79443359375, -5.408447265625, -5.0224609375, -4.636474609375, -4.25048828125, -3.864501953125, -3.478515625, -3.092529296875, -2.70654296875, -2.320556640625, -1.9345703125, -1.548583984375, -1.16259765625, -0.776611328125, -0.390625, -0.004638671875, 0.38134765625, 0.767333984375, 1.1533203125, 1.539306640625, 1.92529296875, 2.311279296875, 2.697265625, 3.083251953125, 3.46923828125, 3.855224609375, 4.2412109375, 4.627197265625, 5.01318359375, 5.399169921875, 5.78515625, 6.171142578125, 6.55712890625, 6.943115234375, 7.3291015625, 7.715087890625, 8.10107421875, 8.487060546875, 8.873046875, 9.259033203125, 9.64501953125, 10.031005859375, 10.4169921875, 10.802978515625, 11.18896484375, 11.574951171875, 11.9609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 8.0, 10.0, 20.0, 14.0, 10.0, 19.0, 17.0, 21.0, 31.0, 37.0, 47.0, 47.0, 70.0, 141.0, 111.0, 69.0, 49.0, 30.0, 38.0, 28.0, 29.0, 18.0, 17.0, 18.0, 11.0, 11.0, 8.0, 4.0, 6.0, 7.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.564453125, -2.490875244140625, -2.41729736328125, -2.343719482421875, -2.2701416015625, -2.196563720703125, -2.12298583984375, -2.049407958984375, -1.975830078125, -1.902252197265625, -1.82867431640625, -1.755096435546875, -1.6815185546875, -1.607940673828125, -1.53436279296875, -1.460784912109375, -1.38720703125, -1.313629150390625, -1.24005126953125, -1.166473388671875, -1.0928955078125, -1.019317626953125, -0.94573974609375, -0.872161865234375, -0.798583984375, -0.725006103515625, -0.65142822265625, -0.577850341796875, -0.5042724609375, -0.430694580078125, -0.35711669921875, -0.283538818359375, -0.2099609375, -0.136383056640625, -0.06280517578125, 0.010772705078125, 0.0843505859375, 0.157928466796875, 0.23150634765625, 0.305084228515625, 0.378662109375, 0.452239990234375, 0.52581787109375, 0.599395751953125, 0.6729736328125, 0.746551513671875, 0.82012939453125, 0.893707275390625, 0.96728515625, 1.040863037109375, 1.11444091796875, 1.188018798828125, 1.2615966796875, 1.335174560546875, 1.40875244140625, 1.482330322265625, 1.555908203125, 1.629486083984375, 1.70306396484375, 1.776641845703125, 1.8502197265625, 1.923797607421875, 1.99737548828125, 2.070953369140625, 2.14453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 3.0, 11.0, 13.0, 11.0, 16.0, 14.0, 24.0, 24.0, 30.0, 31.0, 45.0, 53.0, 78.0, 75.0, 86.0, 110.0, 185.0, 363.0, 940.0, 4026.0, 31182.0, 739858.0, 252058.0, 15186.0, 2455.0, 651.0, 292.0, 171.0, 101.0, 92.0, 69.0, 56.0, 50.0, 41.0, 26.0, 22.0, 17.0, 15.0, 18.0, 11.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.078125, -27.167724609375, -26.25732421875, -25.346923828125, -24.4365234375, -23.526123046875, -22.61572265625, -21.705322265625, -20.794921875, -19.884521484375, -18.97412109375, -18.063720703125, -17.1533203125, -16.242919921875, -15.33251953125, -14.422119140625, -13.51171875, -12.601318359375, -11.69091796875, -10.780517578125, -9.8701171875, -8.959716796875, -8.04931640625, -7.138916015625, -6.228515625, -5.318115234375, -4.40771484375, -3.497314453125, -2.5869140625, -1.676513671875, -0.76611328125, 0.144287109375, 1.0546875, 1.965087890625, 2.87548828125, 3.785888671875, 4.6962890625, 5.606689453125, 6.51708984375, 7.427490234375, 8.337890625, 9.248291015625, 10.15869140625, 11.069091796875, 11.9794921875, 12.889892578125, 13.80029296875, 14.710693359375, 15.62109375, 16.531494140625, 17.44189453125, 18.352294921875, 19.2626953125, 20.173095703125, 21.08349609375, 21.993896484375, 22.904296875, 23.814697265625, 24.72509765625, 25.635498046875, 26.5458984375, 27.456298828125, 28.36669921875, 29.277099609375, 30.1875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 22.0, 64.0, 218.0, 361.0, 217.0, 92.0, 24.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78233528137207, -17.28201675415039, -16.78169822692871, -16.281381607055664, -15.781063079833984, -15.280744552612305, -14.780426025390625, -14.280108451843262, -13.779790878295898, -13.279472351074219, -12.779154777526855, -12.278836250305176, -11.778518676757812, -11.278200149536133, -10.777881622314453, -10.27756404876709, -9.77724552154541, -9.27692699432373, -8.776609420776367, -8.276290893554688, -7.775973320007324, -7.2756547927856445, -6.775336742401123, -6.275018692016602, -5.77470064163208, -5.274382591247559, -4.774064540863037, -4.273746490478516, -3.773428201675415, -3.2731101512908936, -2.772791862487793, -2.2724738121032715, -1.77215576171875, -1.2718377113342285, -0.7715195417404175, -0.27120137214660645, 0.22911667823791504, 0.7294347286224365, 1.229753017425537, 1.7300710678100586, 2.23038911819458, 2.7307071685791016, 3.231025218963623, 3.7313435077667236, 4.231661796569824, 4.7319793701171875, 5.232297897338867, 5.732615947723389, 6.23293399810791, 6.733252048492432, 7.233570098876953, 7.733888626098633, 8.234206199645996, 8.734524726867676, 9.234842300415039, 9.735160827636719, 10.235479354858398, 10.735797882080078, 11.236115455627441, 11.736433982849121, 12.236751556396484, 12.737070083618164, 13.237388610839844, 13.737706184387207, 14.23802375793457]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 6.0, 5.0, 13.0, 13.0, 15.0, 15.0, 17.0, 18.0, 27.0, 27.0, 26.0, 28.0, 37.0, 36.0, 29.0, 36.0, 41.0, 37.0, 48.0, 34.0, 39.0, 39.0, 34.0, 31.0, 33.0, 32.0, 31.0, 34.0, 29.0, 20.0, 15.0, 17.0, 14.0, 15.0, 16.0, 15.0, 16.0, 7.0, 8.0, 7.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.8897461891174316, -2.7988765239715576, -2.7080070972442627, -2.6171374320983887, -2.5262680053710938, -2.4353983402252197, -2.3445286750793457, -2.253659248352051, -2.162789821624756, -2.071920156478882, -1.981050729751587, -1.890181064605713, -1.799311637878418, -1.708441972732544, -1.6175724267959595, -1.526702880859375, -1.435833215713501, -1.3449636697769165, -1.254094123840332, -1.163224458694458, -1.072355031967163, -0.9814854264259338, -0.8906158208847046, -0.7997462749481201, -0.7088767290115356, -0.6180071830749512, -0.5271376371383667, -0.43626803159713745, -0.345398485660553, -0.2545289397239685, -0.16365933418273926, -0.07278978824615479, 0.018079757690429688, 0.10894931852817535, 0.19981887936592102, 0.2906884551048279, 0.38155800104141235, 0.4724275469779968, 0.5632971525192261, 0.6541666984558105, 0.745036244392395, 0.8359057903289795, 0.926775336265564, 1.0176448822021484, 1.1085145473480225, 1.1993839740753174, 1.2902536392211914, 1.3811231851577759, 1.4719927310943604, 1.5628622770309448, 1.6537318229675293, 1.7446014881134033, 1.8354709148406982, 1.9263405799865723, 2.017210006713867, 2.108079671859741, 2.1989493370056152, 2.2898190021514893, 2.380688428878784, 2.471558094024658, 2.562427520751953, 2.653297185897827, 2.744166851043701, 2.835036277770996, 2.925905704498291]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 14.0, 9.0, 11.0, 15.0, 18.0, 21.0, 25.0, 34.0, 38.0, 36.0, 39.0, 48.0, 56.0, 53.0, 62.0, 64.0, 55.0, 55.0, 46.0, 33.0, 35.0, 38.0, 35.0, 30.0, 21.0, 15.0, 8.0, 9.0, 16.0, 10.0, 10.0, 9.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.318511962890625, -4.18780517578125, -4.057098388671875, -3.9263916015625, -3.795684814453125, -3.66497802734375, -3.534271240234375, -3.403564453125, -3.272857666015625, -3.14215087890625, -3.011444091796875, -2.8807373046875, -2.750030517578125, -2.61932373046875, -2.488616943359375, -2.35791015625, -2.227203369140625, -2.09649658203125, -1.965789794921875, -1.8350830078125, -1.704376220703125, -1.57366943359375, -1.442962646484375, -1.312255859375, -1.181549072265625, -1.05084228515625, -0.920135498046875, -0.7894287109375, -0.658721923828125, -0.52801513671875, -0.397308349609375, -0.2666015625, -0.135894775390625, -0.00518798828125, 0.125518798828125, 0.2562255859375, 0.386932373046875, 0.51763916015625, 0.648345947265625, 0.779052734375, 0.909759521484375, 1.04046630859375, 1.171173095703125, 1.3018798828125, 1.432586669921875, 1.56329345703125, 1.694000244140625, 1.82470703125, 1.955413818359375, 2.08612060546875, 2.216827392578125, 2.3475341796875, 2.478240966796875, 2.60894775390625, 2.739654541015625, 2.870361328125, 3.001068115234375, 3.13177490234375, 3.262481689453125, 3.3931884765625, 3.523895263671875, 3.65460205078125, 3.785308837890625, 3.916015625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 19.0, 27.0, 27.0, 47.0, 63.0, 113.0, 141.0, 225.0, 335.0, 497.0, 839.0, 1290.0, 2118.0, 3741.0, 6894.0, 15830.0, 73771.0, 752218.0, 149904.0, 21187.0, 8345.0, 4310.0, 2432.0, 1473.0, 915.0, 564.0, 381.0, 288.0, 180.0, 101.0, 77.0, 60.0, 39.0, 31.0, 15.0, 16.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.9720458984375, -9.623779296875, -9.2755126953125, -8.92724609375, -8.5789794921875, -8.230712890625, -7.8824462890625, -7.5341796875, -7.1859130859375, -6.837646484375, -6.4893798828125, -6.14111328125, -5.7928466796875, -5.444580078125, -5.0963134765625, -4.748046875, -4.3997802734375, -4.051513671875, -3.7032470703125, -3.35498046875, -3.0067138671875, -2.658447265625, -2.3101806640625, -1.9619140625, -1.6136474609375, -1.265380859375, -0.9171142578125, -0.56884765625, -0.2205810546875, 0.127685546875, 0.4759521484375, 0.82421875, 1.1724853515625, 1.520751953125, 1.8690185546875, 2.21728515625, 2.5655517578125, 2.913818359375, 3.2620849609375, 3.6103515625, 3.9586181640625, 4.306884765625, 4.6551513671875, 5.00341796875, 5.3516845703125, 5.699951171875, 6.0482177734375, 6.396484375, 6.7447509765625, 7.093017578125, 7.4412841796875, 7.78955078125, 8.1378173828125, 8.486083984375, 8.8343505859375, 9.1826171875, 9.5308837890625, 9.879150390625, 10.2274169921875, 10.57568359375, 10.9239501953125, 11.272216796875, 11.6204833984375, 11.96875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 15.0, 16.0, 13.0, 21.0, 37.0, 35.0, 34.0, 44.0, 43.0, 63.0, 68.0, 90.0, 133.0, 1605.0, 265.0, 118.0, 70.0, 54.0, 48.0, 41.0, 38.0, 32.0, 30.0, 30.0, 30.0, 11.0, 13.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.142578125, -15.58203125, -15.021484375, -14.4609375, -13.900390625, -13.33984375, -12.779296875, -12.21875, -11.658203125, -11.09765625, -10.537109375, -9.9765625, -9.416015625, -8.85546875, -8.294921875, -7.734375, -7.173828125, -6.61328125, -6.052734375, -5.4921875, -4.931640625, -4.37109375, -3.810546875, -3.25, -2.689453125, -2.12890625, -1.568359375, -1.0078125, -0.447265625, 0.11328125, 0.673828125, 1.234375, 1.794921875, 2.35546875, 2.916015625, 3.4765625, 4.037109375, 4.59765625, 5.158203125, 5.71875, 6.279296875, 6.83984375, 7.400390625, 7.9609375, 8.521484375, 9.08203125, 9.642578125, 10.203125, 10.763671875, 11.32421875, 11.884765625, 12.4453125, 13.005859375, 13.56640625, 14.126953125, 14.6875, 15.248046875, 15.80859375, 16.369140625, 16.9296875, 17.490234375, 18.05078125, 18.611328125, 19.171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 12.0, 31.0, 41.0, 55.0, 90.0, 139.0, 222.0, 381.0, 611.0, 1257.0, 2916.0, 9205.0, 73875.0, 2996055.0, 47936.0, 7654.0, 2595.0, 1150.0, 579.0, 315.0, 226.0, 136.0, 76.0, 52.0, 33.0, 21.0, 14.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.625, -48.0458984375, -46.466796875, -44.8876953125, -43.30859375, -41.7294921875, -40.150390625, -38.5712890625, -36.9921875, -35.4130859375, -33.833984375, -32.2548828125, -30.67578125, -29.0966796875, -27.517578125, -25.9384765625, -24.359375, -22.7802734375, -21.201171875, -19.6220703125, -18.04296875, -16.4638671875, -14.884765625, -13.3056640625, -11.7265625, -10.1474609375, -8.568359375, -6.9892578125, -5.41015625, -3.8310546875, -2.251953125, -0.6728515625, 0.90625, 2.4853515625, 4.064453125, 5.6435546875, 7.22265625, 8.8017578125, 10.380859375, 11.9599609375, 13.5390625, 15.1181640625, 16.697265625, 18.2763671875, 19.85546875, 21.4345703125, 23.013671875, 24.5927734375, 26.171875, 27.7509765625, 29.330078125, 30.9091796875, 32.48828125, 34.0673828125, 35.646484375, 37.2255859375, 38.8046875, 40.3837890625, 41.962890625, 43.5419921875, 45.12109375, 46.7001953125, 48.279296875, 49.8583984375, 51.4375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 786.0, 217.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1423.282958984375, -1399.080810546875, -1374.8787841796875, -1350.6766357421875, -1326.4744873046875, -1302.2723388671875, -1278.0703125, -1253.8681640625, -1229.666015625, -1205.4638671875, -1181.2618408203125, -1157.0596923828125, -1132.8575439453125, -1108.6553955078125, -1084.453369140625, -1060.251220703125, -1036.049072265625, -1011.8469848632812, -987.6448364257812, -963.4427490234375, -939.2406005859375, -915.0385131835938, -890.8363647460938, -866.63427734375, -842.4321899414062, -818.2301025390625, -794.0279541015625, -769.8258666992188, -745.6237182617188, -721.421630859375, -697.219482421875, -673.0173950195312, -648.815185546875, -624.6130981445312, -600.4109497070312, -576.2088623046875, -552.0067138671875, -527.8046264648438, -503.60247802734375, -479.400390625, -455.1982727050781, -430.99615478515625, -406.7940368652344, -382.5919189453125, -358.3898010253906, -334.18768310546875, -309.985595703125, -285.783447265625, -261.58135986328125, -237.37924194335938, -213.1771240234375, -188.97500610351562, -164.77288818359375, -140.57077026367188, -116.36866760253906, -92.16654968261719, -67.96442413330078, -43.762306213378906, -19.560192108154297, 4.6419219970703125, 28.844039916992188, 53.04615783691406, 77.2482681274414, 101.45038604736328, 125.65250396728516]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 7.0, 6.0, 9.0, 13.0, 21.0, 23.0, 14.0, 25.0, 22.0, 21.0, 30.0, 26.0, 30.0, 26.0, 48.0, 47.0, 27.0, 45.0, 40.0, 38.0, 44.0, 50.0, 47.0, 36.0, 37.0, 31.0, 23.0, 30.0, 17.0, 20.0, 27.0, 16.0, 9.0, 22.0, 11.0, 11.0, 11.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-49.65642166137695, -48.06755447387695, -46.47868347167969, -44.88981628417969, -43.30094909667969, -41.71207809448242, -40.12321090698242, -38.534339904785156, -36.945472717285156, -35.356605529785156, -33.76773452758789, -32.17886734008789, -30.589998245239258, -29.001129150390625, -27.412261962890625, -25.823392868041992, -24.23452377319336, -22.645654678344727, -21.056785583496094, -19.467918395996094, -17.87904930114746, -16.290180206298828, -14.701312065124512, -13.112443923950195, -11.523574829101562, -9.93470573425293, -8.345837593078613, -6.756968975067139, -5.168100357055664, -3.5792317390441895, -1.9903631210327148, -0.40149497985839844, 1.1873779296875, 2.7762465476989746, 4.365115165710449, 5.953983783721924, 7.542852401733398, 9.131721496582031, 10.720589637756348, 12.309457778930664, 13.898326873779297, 15.48719596862793, 17.076065063476562, 18.664932250976562, 20.253801345825195, 21.842670440673828, 23.431537628173828, 25.02040672302246, 26.609275817871094, 28.198144912719727, 29.78701400756836, 31.37588119506836, 32.964752197265625, 34.553619384765625, 36.142486572265625, 37.731353759765625, 39.32022476196289, 40.90909194946289, 42.497962951660156, 44.086830139160156, 45.675697326660156, 47.26456832885742, 48.85343551635742, 50.44230651855469, 52.03117370605469]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 13.0, 19.0, 15.0, 27.0, 18.0, 20.0, 33.0, 33.0, 37.0, 40.0, 45.0, 48.0, 46.0, 49.0, 70.0, 48.0, 53.0, 42.0, 40.0, 43.0, 31.0, 29.0, 20.0, 29.0, 20.0, 17.0, 17.0, 13.0, 9.0, 9.0, 8.0, 5.0, 9.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.0614013671875, -3.931396484375, -3.8013916015625, -3.67138671875, -3.5413818359375, -3.411376953125, -3.2813720703125, -3.1513671875, -3.0213623046875, -2.891357421875, -2.7613525390625, -2.63134765625, -2.5013427734375, -2.371337890625, -2.2413330078125, -2.111328125, -1.9813232421875, -1.851318359375, -1.7213134765625, -1.59130859375, -1.4613037109375, -1.331298828125, -1.2012939453125, -1.0712890625, -0.9412841796875, -0.811279296875, -0.6812744140625, -0.55126953125, -0.4212646484375, -0.291259765625, -0.1612548828125, -0.03125, 0.0987548828125, 0.228759765625, 0.3587646484375, 0.48876953125, 0.6187744140625, 0.748779296875, 0.8787841796875, 1.0087890625, 1.1387939453125, 1.268798828125, 1.3988037109375, 1.52880859375, 1.6588134765625, 1.788818359375, 1.9188232421875, 2.048828125, 2.1788330078125, 2.308837890625, 2.4388427734375, 2.56884765625, 2.6988525390625, 2.828857421875, 2.9588623046875, 3.0888671875, 3.2188720703125, 3.348876953125, 3.4788818359375, 3.60888671875, 3.7388916015625, 3.868896484375, 3.9989013671875, 4.12890625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 16.0, 14.0, 15.0, 32.0, 46.0, 68.0, 95.0, 146.0, 223.0, 284.0, 466.0, 649.0, 907.0, 1309.0, 2137.0, 2922.0, 4858.0, 8137.0, 14812.0, 31503.0, 123312.0, 2522962.0, 1336536.0, 81986.0, 26569.0, 13157.0, 7592.0, 4594.0, 2884.0, 1876.0, 1223.0, 904.0, 566.0, 441.0, 318.0, 215.0, 159.0, 103.0, 75.0, 45.0, 37.0, 22.0, 28.0, 8.0, 5.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-14.65625, -14.223876953125, -13.79150390625, -13.359130859375, -12.9267578125, -12.494384765625, -12.06201171875, -11.629638671875, -11.197265625, -10.764892578125, -10.33251953125, -9.900146484375, -9.4677734375, -9.035400390625, -8.60302734375, -8.170654296875, -7.73828125, -7.305908203125, -6.87353515625, -6.441162109375, -6.0087890625, -5.576416015625, -5.14404296875, -4.711669921875, -4.279296875, -3.846923828125, -3.41455078125, -2.982177734375, -2.5498046875, -2.117431640625, -1.68505859375, -1.252685546875, -0.8203125, -0.387939453125, 0.04443359375, 0.476806640625, 0.9091796875, 1.341552734375, 1.77392578125, 2.206298828125, 2.638671875, 3.071044921875, 3.50341796875, 3.935791015625, 4.3681640625, 4.800537109375, 5.23291015625, 5.665283203125, 6.09765625, 6.530029296875, 6.96240234375, 7.394775390625, 7.8271484375, 8.259521484375, 8.69189453125, 9.124267578125, 9.556640625, 9.989013671875, 10.42138671875, 10.853759765625, 11.2861328125, 11.718505859375, 12.15087890625, 12.583251953125, 13.015625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 4.0, 13.0, 14.0, 17.0, 29.0, 28.0, 43.0, 52.0, 69.0, 132.0, 201.0, 407.0, 634.0, 887.0, 637.0, 353.0, 162.0, 92.0, 61.0, 44.0, 38.0, 33.0, 22.0, 17.0, 10.0, 5.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.5194091796875, -15.093505859375, -14.6676025390625, -14.24169921875, -13.8157958984375, -13.389892578125, -12.9639892578125, -12.5380859375, -12.1121826171875, -11.686279296875, -11.2603759765625, -10.83447265625, -10.4085693359375, -9.982666015625, -9.5567626953125, -9.130859375, -8.7049560546875, -8.279052734375, -7.8531494140625, -7.42724609375, -7.0013427734375, -6.575439453125, -6.1495361328125, -5.7236328125, -5.2977294921875, -4.871826171875, -4.4459228515625, -4.02001953125, -3.5941162109375, -3.168212890625, -2.7423095703125, -2.31640625, -1.8905029296875, -1.464599609375, -1.0386962890625, -0.61279296875, -0.1868896484375, 0.239013671875, 0.6649169921875, 1.0908203125, 1.5167236328125, 1.942626953125, 2.3685302734375, 2.79443359375, 3.2203369140625, 3.646240234375, 4.0721435546875, 4.498046875, 4.9239501953125, 5.349853515625, 5.7757568359375, 6.20166015625, 6.6275634765625, 7.053466796875, 7.4793701171875, 7.9052734375, 8.3311767578125, 8.757080078125, 9.1829833984375, 9.60888671875, 10.0347900390625, 10.460693359375, 10.8865966796875, 11.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 9.0, 12.0, 6.0, 13.0, 17.0, 30.0, 39.0, 75.0, 110.0, 156.0, 300.0, 557.0, 981.0, 1757.0, 3420.0, 7092.0, 16184.0, 43541.0, 184805.0, 3035665.0, 771189.0, 81430.0, 26007.0, 10509.0, 4898.0, 2483.0, 1228.0, 716.0, 402.0, 239.0, 146.0, 81.0, 51.0, 47.0, 27.0, 24.0, 12.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.9375, -28.150146484375, -27.36279296875, -26.575439453125, -25.7880859375, -25.000732421875, -24.21337890625, -23.426025390625, -22.638671875, -21.851318359375, -21.06396484375, -20.276611328125, -19.4892578125, -18.701904296875, -17.91455078125, -17.127197265625, -16.33984375, -15.552490234375, -14.76513671875, -13.977783203125, -13.1904296875, -12.403076171875, -11.61572265625, -10.828369140625, -10.041015625, -9.253662109375, -8.46630859375, -7.678955078125, -6.8916015625, -6.104248046875, -5.31689453125, -4.529541015625, -3.7421875, -2.954833984375, -2.16748046875, -1.380126953125, -0.5927734375, 0.194580078125, 0.98193359375, 1.769287109375, 2.556640625, 3.343994140625, 4.13134765625, 4.918701171875, 5.7060546875, 6.493408203125, 7.28076171875, 8.068115234375, 8.85546875, 9.642822265625, 10.43017578125, 11.217529296875, 12.0048828125, 12.792236328125, 13.57958984375, 14.366943359375, 15.154296875, 15.941650390625, 16.72900390625, 17.516357421875, 18.3037109375, 19.091064453125, 19.87841796875, 20.665771484375, 21.453125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 22.0, 83.0, 288.0, 431.0, 123.0, 34.0, 16.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.83172607421875, -236.282958984375, -228.7342071533203, -221.18544006347656, -213.63668823242188, -206.08792114257812, -198.53915405273438, -190.9904022216797, -183.44163513183594, -175.8928680419922, -168.3441162109375, -160.79534912109375, -153.24659729003906, -145.6978302001953, -138.14907836914062, -130.60031127929688, -123.05155181884766, -115.50279235839844, -107.95403289794922, -100.4052734375, -92.85650634765625, -85.30774688720703, -77.75898742675781, -70.21022033691406, -62.66146469116211, -55.11270523071289, -47.563941955566406, -40.01518249511719, -32.46642303466797, -24.917659759521484, -17.368900299072266, -9.820137023925781, -2.2713775634765625, 5.277383327484131, 12.826144218444824, 20.37490463256836, 27.92366600036621, 35.47242736816406, 43.02118682861328, 50.569950103759766, 58.118709564208984, 65.66747283935547, 73.21623229980469, 80.7649917602539, 88.31375122070312, 95.86251831054688, 103.41127014160156, 110.96003723144531, 118.50879669189453, 126.05755615234375, 133.6063232421875, 141.1550750732422, 148.70384216308594, 156.25259399414062, 163.80136108398438, 171.35012817382812, 178.8988800048828, 186.44764709472656, 193.99639892578125, 201.545166015625, 209.0939178466797, 216.64268493652344, 224.19143676757812, 231.74020385742188, 239.28897094726562]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 7.0, 1.0, 10.0, 12.0, 8.0, 10.0, 13.0, 13.0, 20.0, 20.0, 19.0, 23.0, 29.0, 24.0, 37.0, 32.0, 42.0, 39.0, 37.0, 42.0, 47.0, 47.0, 45.0, 39.0, 48.0, 29.0, 46.0, 27.0, 31.0, 29.0, 25.0, 24.0, 28.0, 16.0, 14.0, 14.0, 12.0, 10.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5467529296875, -34.332035064697266, -33.117313385009766, -31.90259552001953, -30.687875747680664, -29.473155975341797, -28.25843620300293, -27.043716430664062, -25.828998565673828, -24.61427879333496, -23.399559020996094, -22.18484115600586, -20.970121383666992, -19.755401611328125, -18.540681838989258, -17.32596206665039, -16.111242294311523, -14.896522521972656, -13.681803703308105, -12.467083930969238, -11.252365112304688, -10.03764533996582, -8.822925567626953, -7.608206748962402, -6.393486976623535, -5.178767681121826, -3.964048147201538, -2.74932861328125, -1.534609317779541, -0.31989002227783203, 0.8948297500610352, 2.109548568725586, 3.324268341064453, 4.538987636566162, 5.753706932067871, 6.968426704406738, 8.183145523071289, 9.397865295410156, 10.612585067749023, 11.827303886413574, 13.042023658752441, 14.256743431091309, 15.47146224975586, 16.686182022094727, 17.900901794433594, 19.115619659423828, 20.330341339111328, 21.545059204101562, 22.75977897644043, 23.974498748779297, 25.189218521118164, 26.40393829345703, 27.618656158447266, 28.833375930786133, 30.048095703125, 31.262813568115234, 32.477535247802734, 33.69225311279297, 34.90697479248047, 36.1216926574707, 37.3364143371582, 38.55113220214844, 39.76585388183594, 40.98057174682617, 42.195289611816406]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 11.0, 10.0, 8.0, 8.0, 12.0, 6.0, 10.0, 11.0, 25.0, 23.0, 23.0, 32.0, 31.0, 30.0, 39.0, 39.0, 40.0, 38.0, 46.0, 42.0, 45.0, 36.0, 49.0, 32.0, 37.0, 42.0, 34.0, 36.0, 32.0, 21.0, 19.0, 18.0, 19.0, 10.0, 16.0, 13.0, 7.0, 7.0, 5.0, 8.0, 6.0, 8.0, 7.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-4.1015625, -3.9818115234375, -3.862060546875, -3.7423095703125, -3.62255859375, -3.5028076171875, -3.383056640625, -3.2633056640625, -3.1435546875, -3.0238037109375, -2.904052734375, -2.7843017578125, -2.66455078125, -2.5447998046875, -2.425048828125, -2.3052978515625, -2.185546875, -2.0657958984375, -1.946044921875, -1.8262939453125, -1.70654296875, -1.5867919921875, -1.467041015625, -1.3472900390625, -1.2275390625, -1.1077880859375, -0.988037109375, -0.8682861328125, -0.74853515625, -0.6287841796875, -0.509033203125, -0.3892822265625, -0.26953125, -0.1497802734375, -0.030029296875, 0.0897216796875, 0.20947265625, 0.3292236328125, 0.448974609375, 0.5687255859375, 0.6884765625, 0.8082275390625, 0.927978515625, 1.0477294921875, 1.16748046875, 1.2872314453125, 1.406982421875, 1.5267333984375, 1.646484375, 1.7662353515625, 1.885986328125, 2.0057373046875, 2.12548828125, 2.2452392578125, 2.364990234375, 2.4847412109375, 2.6044921875, 2.7242431640625, 2.843994140625, 2.9637451171875, 3.08349609375, 3.2032470703125, 3.322998046875, 3.4427490234375, 3.5625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 8.0, 14.0, 12.0, 15.0, 38.0, 54.0, 69.0, 110.0, 156.0, 237.0, 333.0, 425.0, 689.0, 924.0, 1350.0, 1884.0, 2697.0, 3850.0, 5708.0, 8723.0, 13782.0, 22409.0, 38755.0, 70427.0, 142159.0, 333676.0, 192785.0, 86617.0, 46898.0, 26747.0, 16115.0, 10083.0, 6438.0, 4291.0, 3019.0, 2114.0, 1462.0, 987.0, 759.0, 482.0, 381.0, 300.0, 175.0, 130.0, 84.0, 54.0, 42.0, 31.0, 22.0, 11.0, 12.0, 5.0, 4.0, 2.0, 4.0, 3.0], "bins": [-13.765625, -13.356689453125, -12.94775390625, -12.538818359375, -12.1298828125, -11.720947265625, -11.31201171875, -10.903076171875, -10.494140625, -10.085205078125, -9.67626953125, -9.267333984375, -8.8583984375, -8.449462890625, -8.04052734375, -7.631591796875, -7.22265625, -6.813720703125, -6.40478515625, -5.995849609375, -5.5869140625, -5.177978515625, -4.76904296875, -4.360107421875, -3.951171875, -3.542236328125, -3.13330078125, -2.724365234375, -2.3154296875, -1.906494140625, -1.49755859375, -1.088623046875, -0.6796875, -0.270751953125, 0.13818359375, 0.547119140625, 0.9560546875, 1.364990234375, 1.77392578125, 2.182861328125, 2.591796875, 3.000732421875, 3.40966796875, 3.818603515625, 4.2275390625, 4.636474609375, 5.04541015625, 5.454345703125, 5.86328125, 6.272216796875, 6.68115234375, 7.090087890625, 7.4990234375, 7.907958984375, 8.31689453125, 8.725830078125, 9.134765625, 9.543701171875, 9.95263671875, 10.361572265625, 10.7705078125, 11.179443359375, 11.58837890625, 11.997314453125, 12.40625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 14.0, 14.0, 11.0, 14.0, 21.0, 20.0, 19.0, 26.0, 20.0, 26.0, 27.0, 28.0, 39.0, 18.0, 37.0, 36.0, 43.0, 30.0, 28.0, 1058.0, 29.0, 31.0, 28.0, 48.0, 34.0, 32.0, 29.0, 28.0, 20.0, 25.0, 29.0, 10.0, 14.0, 29.0, 10.0, 17.0, 13.0, 16.0, 11.0, 9.0, 3.0, 6.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.57421875, -3.46246337890625, -3.3507080078125, -3.23895263671875, -3.127197265625, -3.01544189453125, -2.9036865234375, -2.79193115234375, -2.68017578125, -2.56842041015625, -2.4566650390625, -2.34490966796875, -2.233154296875, -2.12139892578125, -2.0096435546875, -1.89788818359375, -1.7861328125, -1.67437744140625, -1.5626220703125, -1.45086669921875, -1.339111328125, -1.22735595703125, -1.1156005859375, -1.00384521484375, -0.89208984375, -0.78033447265625, -0.6685791015625, -0.55682373046875, -0.445068359375, -0.33331298828125, -0.2215576171875, -0.10980224609375, 0.001953125, 0.11370849609375, 0.2254638671875, 0.33721923828125, 0.448974609375, 0.56072998046875, 0.6724853515625, 0.78424072265625, 0.89599609375, 1.00775146484375, 1.1195068359375, 1.23126220703125, 1.343017578125, 1.45477294921875, 1.5665283203125, 1.67828369140625, 1.7900390625, 1.90179443359375, 2.0135498046875, 2.12530517578125, 2.237060546875, 2.34881591796875, 2.4605712890625, 2.57232666015625, 2.68408203125, 2.79583740234375, 2.9075927734375, 3.01934814453125, 3.131103515625, 3.24285888671875, 3.3546142578125, 3.46636962890625, 3.578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 9.0, 6.0, 11.0, 13.0, 24.0, 26.0, 51.0, 54.0, 81.0, 106.0, 154.0, 219.0, 273.0, 435.0, 561.0, 864.0, 1379.0, 2119.0, 3468.0, 5721.0, 10205.0, 20316.0, 47352.0, 169155.0, 1348353.0, 356214.0, 70817.0, 27314.0, 13216.0, 7121.0, 4081.0, 2513.0, 1547.0, 1005.0, 704.0, 451.0, 310.0, 238.0, 167.0, 121.0, 78.0, 83.0, 48.0, 39.0, 29.0, 15.0, 16.0, 16.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0], "bins": [-17.796875, -17.25244140625, -16.7080078125, -16.16357421875, -15.619140625, -15.07470703125, -14.5302734375, -13.98583984375, -13.44140625, -12.89697265625, -12.3525390625, -11.80810546875, -11.263671875, -10.71923828125, -10.1748046875, -9.63037109375, -9.0859375, -8.54150390625, -7.9970703125, -7.45263671875, -6.908203125, -6.36376953125, -5.8193359375, -5.27490234375, -4.73046875, -4.18603515625, -3.6416015625, -3.09716796875, -2.552734375, -2.00830078125, -1.4638671875, -0.91943359375, -0.375, 0.16943359375, 0.7138671875, 1.25830078125, 1.802734375, 2.34716796875, 2.8916015625, 3.43603515625, 3.98046875, 4.52490234375, 5.0693359375, 5.61376953125, 6.158203125, 6.70263671875, 7.2470703125, 7.79150390625, 8.3359375, 8.88037109375, 9.4248046875, 9.96923828125, 10.513671875, 11.05810546875, 11.6025390625, 12.14697265625, 12.69140625, 13.23583984375, 13.7802734375, 14.32470703125, 14.869140625, 15.41357421875, 15.9580078125, 16.50244140625, 17.046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 5.0, 14.0, 8.0, 15.0, 23.0, 35.0, 37.0, 59.0, 86.0, 187.0, 180.0, 80.0, 54.0, 51.0, 36.0, 23.0, 16.0, 18.0, 7.0, 8.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.95721435546875, -6.7464599609375, -6.53570556640625, -6.324951171875, -6.11419677734375, -5.9034423828125, -5.69268798828125, -5.48193359375, -5.27117919921875, -5.0604248046875, -4.84967041015625, -4.638916015625, -4.42816162109375, -4.2174072265625, -4.00665283203125, -3.7958984375, -3.58514404296875, -3.3743896484375, -3.16363525390625, -2.952880859375, -2.74212646484375, -2.5313720703125, -2.32061767578125, -2.10986328125, -1.89910888671875, -1.6883544921875, -1.47760009765625, -1.266845703125, -1.05609130859375, -0.8453369140625, -0.63458251953125, -0.423828125, -0.21307373046875, -0.0023193359375, 0.20843505859375, 0.419189453125, 0.62994384765625, 0.8406982421875, 1.05145263671875, 1.26220703125, 1.47296142578125, 1.6837158203125, 1.89447021484375, 2.105224609375, 2.31597900390625, 2.5267333984375, 2.73748779296875, 2.9482421875, 3.15899658203125, 3.3697509765625, 3.58050537109375, 3.791259765625, 4.00201416015625, 4.2127685546875, 4.42352294921875, 4.63427734375, 4.84503173828125, 5.0557861328125, 5.26654052734375, 5.477294921875, 5.68804931640625, 5.8988037109375, 6.10955810546875, 6.3203125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 3.0, 10.0, 12.0, 13.0, 23.0, 11.0, 25.0, 31.0, 57.0, 89.0, 122.0, 275.0, 638.0, 1743.0, 5806.0, 34230.0, 935610.0, 58650.0, 7508.0, 2108.0, 704.0, 330.0, 176.0, 101.0, 62.0, 32.0, 38.0, 29.0, 14.0, 12.0, 14.0, 9.0, 12.0, 7.0, 4.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-77.875, -75.556640625, -73.23828125, -70.919921875, -68.6015625, -66.283203125, -63.96484375, -61.646484375, -59.328125, -57.009765625, -54.69140625, -52.373046875, -50.0546875, -47.736328125, -45.41796875, -43.099609375, -40.78125, -38.462890625, -36.14453125, -33.826171875, -31.5078125, -29.189453125, -26.87109375, -24.552734375, -22.234375, -19.916015625, -17.59765625, -15.279296875, -12.9609375, -10.642578125, -8.32421875, -6.005859375, -3.6875, -1.369140625, 0.94921875, 3.267578125, 5.5859375, 7.904296875, 10.22265625, 12.541015625, 14.859375, 17.177734375, 19.49609375, 21.814453125, 24.1328125, 26.451171875, 28.76953125, 31.087890625, 33.40625, 35.724609375, 38.04296875, 40.361328125, 42.6796875, 44.998046875, 47.31640625, 49.634765625, 51.953125, 54.271484375, 56.58984375, 58.908203125, 61.2265625, 63.544921875, 65.86328125, 68.181640625, 70.5]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 7.0, 18.0, 38.0, 83.0, 172.0, 296.0, 219.0, 76.0, 44.0, 26.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.6009407043457, -37.73585891723633, -36.87077331542969, -36.00569152832031, -35.14060974121094, -34.2755241394043, -33.41044235229492, -32.54536056518555, -31.680274963378906, -30.8151912689209, -29.950109481811523, -29.085025787353516, -28.219942092895508, -27.3548583984375, -26.489776611328125, -25.624692916870117, -24.759611129760742, -23.894527435302734, -23.02944564819336, -22.16436195373535, -21.299278259277344, -20.43419647216797, -19.56911277770996, -18.704029083251953, -17.838947296142578, -16.97386360168457, -16.108781814575195, -15.243698120117188, -14.37861442565918, -13.513531684875488, -12.648448944091797, -11.783365249633789, -10.918281555175781, -10.05319881439209, -9.188115119934082, -8.32303237915039, -7.457949161529541, -6.592865943908691, -5.727783203125, -4.86269998550415, -3.997616767883301, -3.132533550262451, -2.2674505710601807, -1.4023675918579102, -0.5372843742370605, 0.32779884338378906, 1.1928815841674805, 2.05796480178833, 2.9230480194091797, 3.7881312370300293, 4.653214454650879, 5.51829719543457, 6.38338041305542, 7.2484636306762695, 8.113546371459961, 8.978630065917969, 9.84371280670166, 10.708795547485352, 11.57387924194336, 12.43896198272705, 13.304044723510742, 14.16912841796875, 15.034211158752441, 15.899293899536133, 16.76437759399414]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 9.0, 9.0, 15.0, 13.0, 20.0, 21.0, 29.0, 30.0, 45.0, 33.0, 43.0, 48.0, 41.0, 50.0, 50.0, 35.0, 49.0, 50.0, 60.0, 42.0, 28.0, 30.0, 38.0, 34.0, 21.0, 28.0, 20.0, 18.0, 16.0, 13.0, 8.0, 2.0, 4.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.751711845397949, -7.495659351348877, -7.239606857299805, -6.983554840087891, -6.727502346038818, -6.471449851989746, -6.215397834777832, -5.95934534072876, -5.7032928466796875, -5.447240352630615, -5.191187858581543, -4.935135841369629, -4.679083347320557, -4.423030853271484, -4.16697883605957, -3.910926342010498, -3.654873847961426, -3.3988213539123535, -3.1427690982818604, -2.886716842651367, -2.630664348602295, -2.3746118545532227, -2.1185595989227295, -1.8625072240829468, -1.606454849243164, -1.3504024744033813, -1.0943500995635986, -0.8382977247238159, -0.5822453498840332, -0.3261929750442505, -0.07014060020446777, 0.18591177463531494, 0.44196510314941406, 0.6980174779891968, 0.9540698528289795, 1.2101222276687622, 1.466174602508545, 1.7222269773483276, 1.9782793521881104, 2.2343316078186035, 2.490384101867676, 2.746436595916748, 3.002488851547241, 3.2585411071777344, 3.5145936012268066, 3.770646095275879, 4.026698112487793, 4.282750606536865, 4.5388031005859375, 4.79485559463501, 5.050908088684082, 5.306960105895996, 5.563012599945068, 5.819065093994141, 6.075117111206055, 6.331169605255127, 6.587222099304199, 6.8432745933532715, 7.099327087402344, 7.355379104614258, 7.61143159866333, 7.867484092712402, 8.123536109924316, 8.379589080810547, 8.635641098022461]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 5.0, 9.0, 5.0, 7.0, 14.0, 10.0, 21.0, 18.0, 16.0, 15.0, 32.0, 32.0, 39.0, 29.0, 27.0, 32.0, 47.0, 41.0, 41.0, 48.0, 44.0, 51.0, 38.0, 48.0, 44.0, 31.0, 38.0, 42.0, 14.0, 24.0, 22.0, 13.0, 21.0, 14.0, 11.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.171875, -4.048828125, -3.92578125, -3.802734375, -3.6796875, -3.556640625, -3.43359375, -3.310546875, -3.1875, -3.064453125, -2.94140625, -2.818359375, -2.6953125, -2.572265625, -2.44921875, -2.326171875, -2.203125, -2.080078125, -1.95703125, -1.833984375, -1.7109375, -1.587890625, -1.46484375, -1.341796875, -1.21875, -1.095703125, -0.97265625, -0.849609375, -0.7265625, -0.603515625, -0.48046875, -0.357421875, -0.234375, -0.111328125, 0.01171875, 0.134765625, 0.2578125, 0.380859375, 0.50390625, 0.626953125, 0.75, 0.873046875, 0.99609375, 1.119140625, 1.2421875, 1.365234375, 1.48828125, 1.611328125, 1.734375, 1.857421875, 1.98046875, 2.103515625, 2.2265625, 2.349609375, 2.47265625, 2.595703125, 2.71875, 2.841796875, 2.96484375, 3.087890625, 3.2109375, 3.333984375, 3.45703125, 3.580078125, 3.703125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 3.0, 9.0, 8.0, 6.0, 22.0, 27.0, 45.0, 45.0, 59.0, 81.0, 127.0, 195.0, 267.0, 343.0, 572.0, 833.0, 1319.0, 2013.0, 3428.0, 6325.0, 13207.0, 34600.0, 153613.0, 609483.0, 157813.0, 34988.0, 13398.0, 6244.0, 3373.0, 2132.0, 1302.0, 867.0, 548.0, 362.0, 267.0, 185.0, 140.0, 81.0, 63.0, 50.0, 39.0, 28.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.9296875, -9.6500244140625, -9.370361328125, -9.0906982421875, -8.81103515625, -8.5313720703125, -8.251708984375, -7.9720458984375, -7.6923828125, -7.4127197265625, -7.133056640625, -6.8533935546875, -6.57373046875, -6.2940673828125, -6.014404296875, -5.7347412109375, -5.455078125, -5.1754150390625, -4.895751953125, -4.6160888671875, -4.33642578125, -4.0567626953125, -3.777099609375, -3.4974365234375, -3.2177734375, -2.9381103515625, -2.658447265625, -2.3787841796875, -2.09912109375, -1.8194580078125, -1.539794921875, -1.2601318359375, -0.98046875, -0.7008056640625, -0.421142578125, -0.1414794921875, 0.13818359375, 0.4178466796875, 0.697509765625, 0.9771728515625, 1.2568359375, 1.5364990234375, 1.816162109375, 2.0958251953125, 2.37548828125, 2.6551513671875, 2.934814453125, 3.2144775390625, 3.494140625, 3.7738037109375, 4.053466796875, 4.3331298828125, 4.61279296875, 4.8924560546875, 5.172119140625, 5.4517822265625, 5.7314453125, 6.0111083984375, 6.290771484375, 6.5704345703125, 6.85009765625, 7.1297607421875, 7.409423828125, 7.6890869140625, 7.96875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 6.0, 5.0, 13.0, 8.0, 10.0, 15.0, 16.0, 30.0, 29.0, 27.0, 26.0, 38.0, 48.0, 40.0, 43.0, 69.0, 98.0, 176.0, 1443.0, 269.0, 118.0, 73.0, 65.0, 54.0, 38.0, 42.0, 34.0, 38.0, 26.0, 23.0, 16.0, 19.0, 24.0, 13.0, 14.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-19.390625, -18.8768310546875, -18.363037109375, -17.8492431640625, -17.33544921875, -16.8216552734375, -16.307861328125, -15.7940673828125, -15.2802734375, -14.7664794921875, -14.252685546875, -13.7388916015625, -13.22509765625, -12.7113037109375, -12.197509765625, -11.6837158203125, -11.169921875, -10.6561279296875, -10.142333984375, -9.6285400390625, -9.11474609375, -8.6009521484375, -8.087158203125, -7.5733642578125, -7.0595703125, -6.5457763671875, -6.031982421875, -5.5181884765625, -5.00439453125, -4.4906005859375, -3.976806640625, -3.4630126953125, -2.94921875, -2.4354248046875, -1.921630859375, -1.4078369140625, -0.89404296875, -0.3802490234375, 0.133544921875, 0.6473388671875, 1.1611328125, 1.6749267578125, 2.188720703125, 2.7025146484375, 3.21630859375, 3.7301025390625, 4.243896484375, 4.7576904296875, 5.271484375, 5.7852783203125, 6.299072265625, 6.8128662109375, 7.32666015625, 7.8404541015625, 8.354248046875, 8.8680419921875, 9.3818359375, 9.8956298828125, 10.409423828125, 10.9232177734375, 11.43701171875, 11.9508056640625, 12.464599609375, 12.9783935546875, 13.4921875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 16.0, 11.0, 16.0, 21.0, 45.0, 54.0, 90.0, 126.0, 211.0, 367.0, 661.0, 1255.0, 2470.0, 5339.0, 14505.0, 52043.0, 902408.0, 2064358.0, 71713.0, 17680.0, 6488.0, 2727.0, 1305.0, 697.0, 398.0, 234.0, 129.0, 115.0, 54.0, 44.0, 25.0, 17.0, 12.0, 18.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.84375, -23.076904296875, -22.31005859375, -21.543212890625, -20.7763671875, -20.009521484375, -19.24267578125, -18.475830078125, -17.708984375, -16.942138671875, -16.17529296875, -15.408447265625, -14.6416015625, -13.874755859375, -13.10791015625, -12.341064453125, -11.57421875, -10.807373046875, -10.04052734375, -9.273681640625, -8.5068359375, -7.739990234375, -6.97314453125, -6.206298828125, -5.439453125, -4.672607421875, -3.90576171875, -3.138916015625, -2.3720703125, -1.605224609375, -0.83837890625, -0.071533203125, 0.6953125, 1.462158203125, 2.22900390625, 2.995849609375, 3.7626953125, 4.529541015625, 5.29638671875, 6.063232421875, 6.830078125, 7.596923828125, 8.36376953125, 9.130615234375, 9.8974609375, 10.664306640625, 11.43115234375, 12.197998046875, 12.96484375, 13.731689453125, 14.49853515625, 15.265380859375, 16.0322265625, 16.799072265625, 17.56591796875, 18.332763671875, 19.099609375, 19.866455078125, 20.63330078125, 21.400146484375, 22.1669921875, 22.933837890625, 23.70068359375, 24.467529296875, 25.234375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 42.0, 330.0, 539.0, 93.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.393192291259766, -40.60619354248047, -32.819190979003906, -25.03219223022461, -17.245193481445312, -9.458194732666016, -1.6711921691894531, 6.115806579589844, 13.90280532836914, 21.689804077148438, 29.476804733276367, 37.2638053894043, 45.050804138183594, 52.83780288696289, 60.62480545043945, 68.41180419921875, 76.19880676269531, 83.98580932617188, 91.7728042602539, 99.55980682373047, 107.3468017578125, 115.13380432128906, 122.92080688476562, 130.7078094482422, 138.4947967529297, 146.28179931640625, 154.0688018798828, 161.85580444335938, 169.64279174804688, 177.42979431152344, 185.216796875, 193.00379943847656, 200.79080200195312, 208.5778045654297, 216.36480712890625, 224.15179443359375, 231.9387969970703, 239.72579956054688, 247.51280212402344, 255.2998046875, 263.0867919921875, 270.873779296875, 278.6607971191406, 286.4477844238281, 294.23480224609375, 302.02178955078125, 309.80877685546875, 317.5957946777344, 325.3828125, 333.1697998046875, 340.9568176269531, 348.7438049316406, 356.53082275390625, 364.31781005859375, 372.10479736328125, 379.8918151855469, 387.6788024902344, 395.4657897949219, 403.2528076171875, 411.039794921875, 418.8268127441406, 426.6138000488281, 434.40081787109375, 442.18780517578125, 449.97479248046875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 7.0, 2.0, 1.0, 3.0, 8.0, 7.0, 2.0, 11.0, 17.0, 21.0, 14.0, 25.0, 20.0, 23.0, 30.0, 30.0, 32.0, 23.0, 30.0, 39.0, 41.0, 49.0, 28.0, 39.0, 53.0, 44.0, 40.0, 33.0, 37.0, 41.0, 27.0, 27.0, 32.0, 24.0, 21.0, 22.0, 19.0, 12.0, 12.0, 15.0, 9.0, 6.0, 6.0, 7.0, 2.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28388214111328, -47.65742492675781, -46.030967712402344, -44.40451431274414, -42.77805709838867, -41.1515998840332, -39.525146484375, -37.89868927001953, -36.27223205566406, -34.645774841308594, -33.019317626953125, -31.392864227294922, -29.766407012939453, -28.139949798583984, -26.51349449157715, -24.887039184570312, -23.260581970214844, -21.634124755859375, -20.00766944885254, -18.381214141845703, -16.754756927490234, -15.128300666809082, -13.50184440612793, -11.875388145446777, -10.248931884765625, -8.622475624084473, -6.99601936340332, -5.369563102722168, -3.7431068420410156, -2.1166505813598633, -0.49019432067871094, 1.1362619400024414, 2.7627220153808594, 4.389178276062012, 6.015634536743164, 7.642090797424316, 9.268547058105469, 10.895003318786621, 12.521459579467773, 14.147915840148926, 15.774372100830078, 17.400829315185547, 19.027284622192383, 20.65373992919922, 22.280197143554688, 23.906654357910156, 25.533109664916992, 27.159564971923828, 28.786022186279297, 30.412479400634766, 32.03893280029297, 33.66539001464844, 35.291847229003906, 36.918304443359375, 38.544761657714844, 40.17121505737305, 41.797672271728516, 43.424129486083984, 45.05058288574219, 46.677040100097656, 48.303497314453125, 49.929954528808594, 51.55641174316406, 53.182865142822266, 54.809322357177734]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 3.0, 14.0, 13.0, 10.0, 11.0, 15.0, 20.0, 13.0, 26.0, 17.0, 28.0, 36.0, 36.0, 38.0, 42.0, 44.0, 45.0, 49.0, 41.0, 38.0, 59.0, 38.0, 39.0, 35.0, 43.0, 31.0, 35.0, 25.0, 20.0, 21.0, 12.0, 10.0, 7.0, 12.0, 9.0, 7.0, 6.0, 7.0, 6.0, 6.0, 7.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.8125, -3.68707275390625, -3.5616455078125, -3.43621826171875, -3.310791015625, -3.18536376953125, -3.0599365234375, -2.93450927734375, -2.80908203125, -2.68365478515625, -2.5582275390625, -2.43280029296875, -2.307373046875, -2.18194580078125, -2.0565185546875, -1.93109130859375, -1.8056640625, -1.68023681640625, -1.5548095703125, -1.42938232421875, -1.303955078125, -1.17852783203125, -1.0531005859375, -0.92767333984375, -0.80224609375, -0.67681884765625, -0.5513916015625, -0.42596435546875, -0.300537109375, -0.17510986328125, -0.0496826171875, 0.07574462890625, 0.201171875, 0.32659912109375, 0.4520263671875, 0.57745361328125, 0.702880859375, 0.82830810546875, 0.9537353515625, 1.07916259765625, 1.20458984375, 1.33001708984375, 1.4554443359375, 1.58087158203125, 1.706298828125, 1.83172607421875, 1.9571533203125, 2.08258056640625, 2.2080078125, 2.33343505859375, 2.4588623046875, 2.58428955078125, 2.709716796875, 2.83514404296875, 2.9605712890625, 3.08599853515625, 3.21142578125, 3.33685302734375, 3.4622802734375, 3.58770751953125, 3.713134765625, 3.83856201171875, 3.9639892578125, 4.08941650390625, 4.21484375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 13.0, 21.0, 30.0, 46.0, 62.0, 88.0, 129.0, 193.0, 293.0, 424.0, 660.0, 976.0, 1544.0, 2432.0, 4020.0, 6705.0, 11683.0, 23771.0, 72037.0, 1004143.0, 2831041.0, 160432.0, 34693.0, 15809.0, 8631.0, 5233.0, 3209.0, 1997.0, 1335.0, 842.0, 555.0, 380.0, 244.0, 177.0, 128.0, 82.0, 58.0, 44.0, 33.0, 10.0, 11.0, 14.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.609375, -13.173095703125, -12.73681640625, -12.300537109375, -11.8642578125, -11.427978515625, -10.99169921875, -10.555419921875, -10.119140625, -9.682861328125, -9.24658203125, -8.810302734375, -8.3740234375, -7.937744140625, -7.50146484375, -7.065185546875, -6.62890625, -6.192626953125, -5.75634765625, -5.320068359375, -4.8837890625, -4.447509765625, -4.01123046875, -3.574951171875, -3.138671875, -2.702392578125, -2.26611328125, -1.829833984375, -1.3935546875, -0.957275390625, -0.52099609375, -0.084716796875, 0.3515625, 0.787841796875, 1.22412109375, 1.660400390625, 2.0966796875, 2.532958984375, 2.96923828125, 3.405517578125, 3.841796875, 4.278076171875, 4.71435546875, 5.150634765625, 5.5869140625, 6.023193359375, 6.45947265625, 6.895751953125, 7.33203125, 7.768310546875, 8.20458984375, 8.640869140625, 9.0771484375, 9.513427734375, 9.94970703125, 10.385986328125, 10.822265625, 11.258544921875, 11.69482421875, 12.131103515625, 12.5673828125, 13.003662109375, 13.43994140625, 13.876220703125, 14.3125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 14.0, 15.0, 19.0, 18.0, 24.0, 41.0, 51.0, 63.0, 130.0, 260.0, 517.0, 1011.0, 866.0, 449.0, 218.0, 122.0, 62.0, 42.0, 38.0, 26.0, 16.0, 8.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.96875, -19.4268798828125, -18.885009765625, -18.3431396484375, -17.80126953125, -17.2593994140625, -16.717529296875, -16.1756591796875, -15.6337890625, -15.0919189453125, -14.550048828125, -14.0081787109375, -13.46630859375, -12.9244384765625, -12.382568359375, -11.8406982421875, -11.298828125, -10.7569580078125, -10.215087890625, -9.6732177734375, -9.13134765625, -8.5894775390625, -8.047607421875, -7.5057373046875, -6.9638671875, -6.4219970703125, -5.880126953125, -5.3382568359375, -4.79638671875, -4.2545166015625, -3.712646484375, -3.1707763671875, -2.62890625, -2.0870361328125, -1.545166015625, -1.0032958984375, -0.46142578125, 0.0804443359375, 0.622314453125, 1.1641845703125, 1.7060546875, 2.2479248046875, 2.789794921875, 3.3316650390625, 3.87353515625, 4.4154052734375, 4.957275390625, 5.4991455078125, 6.041015625, 6.5828857421875, 7.124755859375, 7.6666259765625, 8.20849609375, 8.7503662109375, 9.292236328125, 9.8341064453125, 10.3759765625, 10.9178466796875, 11.459716796875, 12.0015869140625, 12.54345703125, 13.0853271484375, 13.627197265625, 14.1690673828125, 14.7109375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 11.0, 13.0, 25.0, 30.0, 45.0, 61.0, 81.0, 144.0, 218.0, 382.0, 618.0, 1049.0, 1930.0, 3648.0, 7233.0, 16275.0, 44435.0, 210769.0, 3221001.0, 574513.0, 69341.0, 22516.0, 9696.0, 4539.0, 2468.0, 1341.0, 690.0, 435.0, 261.0, 166.0, 119.0, 73.0, 46.0, 22.0, 18.0, 20.0, 12.0, 9.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.552734375, -24.74609375, -23.939453125, -23.1328125, -22.326171875, -21.51953125, -20.712890625, -19.90625, -19.099609375, -18.29296875, -17.486328125, -16.6796875, -15.873046875, -15.06640625, -14.259765625, -13.453125, -12.646484375, -11.83984375, -11.033203125, -10.2265625, -9.419921875, -8.61328125, -7.806640625, -7.0, -6.193359375, -5.38671875, -4.580078125, -3.7734375, -2.966796875, -2.16015625, -1.353515625, -0.546875, 0.259765625, 1.06640625, 1.873046875, 2.6796875, 3.486328125, 4.29296875, 5.099609375, 5.90625, 6.712890625, 7.51953125, 8.326171875, 9.1328125, 9.939453125, 10.74609375, 11.552734375, 12.359375, 13.166015625, 13.97265625, 14.779296875, 15.5859375, 16.392578125, 17.19921875, 18.005859375, 18.8125, 19.619140625, 20.42578125, 21.232421875, 22.0390625, 22.845703125, 23.65234375, 24.458984375, 25.265625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 5.0, 4.0, 17.0, 17.0, 23.0, 45.0, 40.0, 87.0, 94.0, 118.0, 124.0, 133.0, 81.0, 52.0, 40.0, 30.0, 16.0, 11.0, 24.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.00122833251953, -68.87163543701172, -66.74203491210938, -64.61244201660156, -62.48284912109375, -60.35325622558594, -58.22365951538086, -56.09406280517578, -53.96446990966797, -51.834877014160156, -49.70528030395508, -47.57568359375, -45.44609069824219, -43.316497802734375, -41.1869010925293, -39.05730438232422, -36.927711486816406, -34.798118591308594, -32.668521881103516, -30.53892707824707, -28.409332275390625, -26.27973747253418, -24.150142669677734, -22.02054786682129, -19.890953063964844, -17.7613582611084, -15.631763458251953, -13.502168655395508, -11.372573852539062, -9.242979049682617, -7.113384246826172, -4.983789443969727, -2.8541946411132812, -0.7245998382568359, 1.4049949645996094, 3.5345897674560547, 5.6641845703125, 7.793779373168945, 9.92337417602539, 12.052968978881836, 14.182563781738281, 16.312158584594727, 18.441753387451172, 20.571348190307617, 22.700942993164062, 24.830537796020508, 26.960132598876953, 29.0897274017334, 31.219322204589844, 33.348915100097656, 35.478511810302734, 37.60810852050781, 39.737701416015625, 41.86729431152344, 43.996891021728516, 46.126487731933594, 48.256080627441406, 50.38567352294922, 52.5152702331543, 54.644866943359375, 56.77445983886719, 58.904052734375, 61.03364944458008, 63.163246154785156, 65.29283905029297]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 6.0, 7.0, 12.0, 18.0, 13.0, 14.0, 21.0, 18.0, 25.0, 23.0, 26.0, 27.0, 27.0, 38.0, 36.0, 34.0, 43.0, 37.0, 34.0, 45.0, 35.0, 33.0, 40.0, 18.0, 34.0, 38.0, 28.0, 33.0, 33.0, 13.0, 19.0, 24.0, 15.0, 18.0, 22.0, 6.0, 13.0, 9.0, 6.0, 9.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.73562240600586, -32.56083679199219, -31.38604736328125, -30.211259841918945, -29.03647232055664, -27.86168670654297, -26.686899185180664, -25.51211166381836, -24.337324142456055, -23.16253662109375, -21.987749099731445, -20.81296157836914, -19.63817596435547, -18.46338653564453, -17.28860092163086, -16.113813400268555, -14.93902587890625, -13.764238357543945, -12.58945083618164, -11.414664268493652, -10.239876747131348, -9.065089225769043, -7.8903021812438965, -6.71551513671875, -5.540727615356445, -4.365940093994141, -3.191153049468994, -2.0163657665252686, -0.841578483581543, 0.3332090377807617, 1.5079960823059082, 2.6827831268310547, 3.8575668334960938, 5.032354354858398, 6.207141399383545, 7.381928443908691, 8.556715965270996, 9.7315034866333, 10.906290054321289, 12.081077575683594, 13.255865097045898, 14.430652618408203, 15.605440139770508, 16.780227661132812, 17.955013275146484, 19.129802703857422, 20.304588317871094, 21.4793758392334, 22.654163360595703, 23.828950881958008, 25.003738403320312, 26.178525924682617, 27.353313446044922, 28.528099060058594, 29.7028865814209, 30.877674102783203, 32.052459716796875, 33.22724533081055, 34.402034759521484, 35.576820373535156, 36.751609802246094, 37.926395416259766, 39.1011848449707, 40.275970458984375, 41.45075988769531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 11.0, 16.0, 10.0, 17.0, 20.0, 17.0, 25.0, 28.0, 23.0, 28.0, 43.0, 37.0, 45.0, 46.0, 39.0, 44.0, 42.0, 59.0, 39.0, 28.0, 40.0, 39.0, 43.0, 37.0, 22.0, 26.0, 18.0, 13.0, 27.0, 9.0, 13.0, 10.0, 8.0, 12.0, 5.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.92578125, -3.79296875, -3.66015625, -3.52734375, -3.39453125, -3.26171875, -3.12890625, -2.99609375, -2.86328125, -2.73046875, -2.59765625, -2.46484375, -2.33203125, -2.19921875, -2.06640625, -1.93359375, -1.80078125, -1.66796875, -1.53515625, -1.40234375, -1.26953125, -1.13671875, -1.00390625, -0.87109375, -0.73828125, -0.60546875, -0.47265625, -0.33984375, -0.20703125, -0.07421875, 0.05859375, 0.19140625, 0.32421875, 0.45703125, 0.58984375, 0.72265625, 0.85546875, 0.98828125, 1.12109375, 1.25390625, 1.38671875, 1.51953125, 1.65234375, 1.78515625, 1.91796875, 2.05078125, 2.18359375, 2.31640625, 2.44921875, 2.58203125, 2.71484375, 2.84765625, 2.98046875, 3.11328125, 3.24609375, 3.37890625, 3.51171875, 3.64453125, 3.77734375, 3.91015625, 4.04296875, 4.17578125, 4.30859375, 4.44140625, 4.57421875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 12.0, 20.0, 15.0, 23.0, 32.0, 41.0, 80.0, 92.0, 130.0, 196.0, 231.0, 344.0, 479.0, 649.0, 954.0, 1277.0, 1958.0, 2704.0, 3821.0, 5651.0, 8651.0, 14154.0, 25638.0, 53767.0, 130186.0, 291747.0, 274042.0, 118223.0, 50105.0, 24097.0, 13176.0, 8244.0, 5386.0, 3588.0, 2651.0, 1809.0, 1256.0, 861.0, 638.0, 455.0, 321.0, 237.0, 177.0, 120.0, 75.0, 63.0, 45.0, 30.0, 34.0, 18.0, 12.0, 12.0, 9.0, 6.0, 8.0, 3.0, 0.0, 3.0], "bins": [-14.359375, -13.909912109375, -13.46044921875, -13.010986328125, -12.5615234375, -12.112060546875, -11.66259765625, -11.213134765625, -10.763671875, -10.314208984375, -9.86474609375, -9.415283203125, -8.9658203125, -8.516357421875, -8.06689453125, -7.617431640625, -7.16796875, -6.718505859375, -6.26904296875, -5.819580078125, -5.3701171875, -4.920654296875, -4.47119140625, -4.021728515625, -3.572265625, -3.122802734375, -2.67333984375, -2.223876953125, -1.7744140625, -1.324951171875, -0.87548828125, -0.426025390625, 0.0234375, 0.472900390625, 0.92236328125, 1.371826171875, 1.8212890625, 2.270751953125, 2.72021484375, 3.169677734375, 3.619140625, 4.068603515625, 4.51806640625, 4.967529296875, 5.4169921875, 5.866455078125, 6.31591796875, 6.765380859375, 7.21484375, 7.664306640625, 8.11376953125, 8.563232421875, 9.0126953125, 9.462158203125, 9.91162109375, 10.361083984375, 10.810546875, 11.260009765625, 11.70947265625, 12.158935546875, 12.6083984375, 13.057861328125, 13.50732421875, 13.956787109375, 14.40625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 3.0, 6.0, 6.0, 15.0, 11.0, 13.0, 22.0, 16.0, 22.0, 28.0, 42.0, 29.0, 26.0, 30.0, 50.0, 38.0, 44.0, 43.0, 1059.0, 39.0, 39.0, 39.0, 47.0, 41.0, 39.0, 37.0, 56.0, 32.0, 22.0, 22.0, 14.0, 16.0, 8.0, 8.0, 14.0, 8.0, 7.0, 4.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.51416015625, -4.3759765625, -4.23779296875, -4.099609375, -3.96142578125, -3.8232421875, -3.68505859375, -3.546875, -3.40869140625, -3.2705078125, -3.13232421875, -2.994140625, -2.85595703125, -2.7177734375, -2.57958984375, -2.44140625, -2.30322265625, -2.1650390625, -2.02685546875, -1.888671875, -1.75048828125, -1.6123046875, -1.47412109375, -1.3359375, -1.19775390625, -1.0595703125, -0.92138671875, -0.783203125, -0.64501953125, -0.5068359375, -0.36865234375, -0.23046875, -0.09228515625, 0.0458984375, 0.18408203125, 0.322265625, 0.46044921875, 0.5986328125, 0.73681640625, 0.875, 1.01318359375, 1.1513671875, 1.28955078125, 1.427734375, 1.56591796875, 1.7041015625, 1.84228515625, 1.98046875, 2.11865234375, 2.2568359375, 2.39501953125, 2.533203125, 2.67138671875, 2.8095703125, 2.94775390625, 3.0859375, 3.22412109375, 3.3623046875, 3.50048828125, 3.638671875, 3.77685546875, 3.9150390625, 4.05322265625, 4.19140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 17.0, 15.0, 29.0, 48.0, 61.0, 81.0, 102.0, 141.0, 258.0, 334.0, 474.0, 797.0, 1211.0, 2063.0, 3541.0, 6633.0, 14566.0, 42368.0, 307385.0, 1532911.0, 131985.0, 28143.0, 10864.0, 5349.0, 2936.0, 1660.0, 1063.0, 657.0, 435.0, 296.0, 206.0, 150.0, 98.0, 65.0, 43.0, 42.0, 19.0, 19.0, 12.0, 15.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.839111328125, -17.20947265625, -16.579833984375, -15.9501953125, -15.320556640625, -14.69091796875, -14.061279296875, -13.431640625, -12.802001953125, -12.17236328125, -11.542724609375, -10.9130859375, -10.283447265625, -9.65380859375, -9.024169921875, -8.39453125, -7.764892578125, -7.13525390625, -6.505615234375, -5.8759765625, -5.246337890625, -4.61669921875, -3.987060546875, -3.357421875, -2.727783203125, -2.09814453125, -1.468505859375, -0.8388671875, -0.209228515625, 0.42041015625, 1.050048828125, 1.6796875, 2.309326171875, 2.93896484375, 3.568603515625, 4.1982421875, 4.827880859375, 5.45751953125, 6.087158203125, 6.716796875, 7.346435546875, 7.97607421875, 8.605712890625, 9.2353515625, 9.864990234375, 10.49462890625, 11.124267578125, 11.75390625, 12.383544921875, 13.01318359375, 13.642822265625, 14.2724609375, 14.902099609375, 15.53173828125, 16.161376953125, 16.791015625, 17.420654296875, 18.05029296875, 18.679931640625, 19.3095703125, 19.939208984375, 20.56884765625, 21.198486328125, 21.828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 7.0, 20.0, 15.0, 29.0, 43.0, 67.0, 100.0, 111.0, 147.0, 113.0, 93.0, 68.0, 46.0, 32.0, 15.0, 16.0, 10.0, 9.0, 13.0, 4.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08099365234375, -3.9393310546875, -3.79766845703125, -3.656005859375, -3.51434326171875, -3.3726806640625, -3.23101806640625, -3.08935546875, -2.94769287109375, -2.8060302734375, -2.66436767578125, -2.522705078125, -2.38104248046875, -2.2393798828125, -2.09771728515625, -1.9560546875, -1.81439208984375, -1.6727294921875, -1.53106689453125, -1.389404296875, -1.24774169921875, -1.1060791015625, -0.96441650390625, -0.82275390625, -0.68109130859375, -0.5394287109375, -0.39776611328125, -0.256103515625, -0.11444091796875, 0.0272216796875, 0.16888427734375, 0.310546875, 0.45220947265625, 0.5938720703125, 0.73553466796875, 0.877197265625, 1.01885986328125, 1.1605224609375, 1.30218505859375, 1.44384765625, 1.58551025390625, 1.7271728515625, 1.86883544921875, 2.010498046875, 2.15216064453125, 2.2938232421875, 2.43548583984375, 2.5771484375, 2.71881103515625, 2.8604736328125, 3.00213623046875, 3.143798828125, 3.28546142578125, 3.4271240234375, 3.56878662109375, 3.71044921875, 3.85211181640625, 3.9937744140625, 4.13543701171875, 4.277099609375, 4.41876220703125, 4.5604248046875, 4.70208740234375, 4.84375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 29.0, 31.0, 33.0, 59.0, 102.0, 160.0, 323.0, 888.0, 2667.0, 19076.0, 929210.0, 88399.0, 5185.0, 1271.0, 466.0, 207.0, 117.0, 81.0, 53.0, 41.0, 28.0, 21.0, 16.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.91845703125, -46.3056640625, -44.69287109375, -43.080078125, -41.46728515625, -39.8544921875, -38.24169921875, -36.62890625, -35.01611328125, -33.4033203125, -31.79052734375, -30.177734375, -28.56494140625, -26.9521484375, -25.33935546875, -23.7265625, -22.11376953125, -20.5009765625, -18.88818359375, -17.275390625, -15.66259765625, -14.0498046875, -12.43701171875, -10.82421875, -9.21142578125, -7.5986328125, -5.98583984375, -4.373046875, -2.76025390625, -1.1474609375, 0.46533203125, 2.078125, 3.69091796875, 5.3037109375, 6.91650390625, 8.529296875, 10.14208984375, 11.7548828125, 13.36767578125, 14.98046875, 16.59326171875, 18.2060546875, 19.81884765625, 21.431640625, 23.04443359375, 24.6572265625, 26.27001953125, 27.8828125, 29.49560546875, 31.1083984375, 32.72119140625, 34.333984375, 35.94677734375, 37.5595703125, 39.17236328125, 40.78515625, 42.39794921875, 44.0107421875, 45.62353515625, 47.236328125, 48.84912109375, 50.4619140625, 52.07470703125, 53.6875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 19.0, 37.0, 99.0, 242.0, 331.0, 184.0, 51.0, 17.0, 12.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.259296417236328, -16.783069610595703, -16.306842803955078, -15.830615997314453, -15.354388236999512, -14.878161430358887, -14.401934623718262, -13.925707817077637, -13.449480056762695, -12.97325325012207, -12.497026443481445, -12.02079963684082, -11.544571876525879, -11.068345069885254, -10.592118263244629, -10.115891456604004, -9.639664649963379, -9.163437843322754, -8.687211036682129, -8.210983276367188, -7.7347564697265625, -7.2585296630859375, -6.7823028564453125, -6.3060760498046875, -5.829848766326904, -5.353621959686279, -4.877394676208496, -4.401167869567871, -3.924940824508667, -3.448713779449463, -2.972486972808838, -2.496259927749634, -2.0200319290161133, -1.5438048839569092, -1.0675779581069946, -0.5913510322570801, -0.11512398719787598, 0.3611030578613281, 0.8373298645019531, 1.3135569095611572, 1.7897839546203613, 2.2660109996795654, 2.7422380447387695, 3.2184648513793945, 3.6946918964385986, 4.170918941497803, 4.647145748138428, 5.123373031616211, 5.599599838256836, 6.075826644897461, 6.552053928375244, 7.028280735015869, 7.504508018493652, 7.980734825134277, 8.456961631774902, 8.933188438415527, 9.409416198730469, 9.885643005371094, 10.361869812011719, 10.838096618652344, 11.314324378967285, 11.79055118560791, 12.266777992248535, 12.74300479888916, 13.219231605529785]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 4.0, 3.0, 8.0, 10.0, 18.0, 16.0, 15.0, 16.0, 28.0, 34.0, 33.0, 30.0, 34.0, 37.0, 40.0, 51.0, 48.0, 43.0, 34.0, 50.0, 43.0, 43.0, 40.0, 37.0, 45.0, 36.0, 39.0, 22.0, 21.0, 20.0, 12.0, 15.0, 13.0, 15.0, 11.0, 13.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.073789119720459, -2.9723269939422607, -2.8708651065826416, -2.7694029808044434, -2.667940855026245, -2.566478729248047, -2.4650168418884277, -2.3635547161102295, -2.2620925903320312, -2.160630464553833, -2.059168577194214, -1.9577064514160156, -1.8562443256378174, -1.7547823190689087, -1.6533203125, -1.5518581867218018, -1.4503962993621826, -1.348934292793274, -1.2474721670150757, -1.146010160446167, -1.0445480346679688, -0.9430860280990601, -0.8416240215301514, -0.7401619553565979, -0.6386998891830444, -0.537237823009491, -0.4357757866382599, -0.3343137502670288, -0.23285168409347534, -0.13138961791992188, -0.029927611351013184, 0.07153445482254028, 0.17299628257751465, 0.2744583487510681, 0.3759203851222992, 0.4773824214935303, 0.5788444876670837, 0.6803065538406372, 0.7817685604095459, 0.8832306265830994, 0.9846926927566528, 1.0861546993255615, 1.1876168251037598, 1.2890788316726685, 1.3905408382415771, 1.4920029640197754, 1.593464970588684, 1.6949269771575928, 1.796389102935791, 1.8978511095046997, 1.999313235282898, 2.1007752418518066, 2.202237367630005, 2.303699493408203, 2.4051613807678223, 2.5066235065460205, 2.6080856323242188, 2.709547758102417, 2.811009645462036, 2.9124717712402344, 3.0139338970184326, 3.115396022796631, 3.21685791015625, 3.3183200359344482, 3.4197819232940674]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 6.0, 9.0, 10.0, 13.0, 12.0, 19.0, 11.0, 29.0, 12.0, 24.0, 28.0, 22.0, 33.0, 31.0, 25.0, 34.0, 47.0, 42.0, 35.0, 51.0, 35.0, 36.0, 39.0, 45.0, 35.0, 31.0, 46.0, 32.0, 23.0, 12.0, 23.0, 16.0, 22.0, 20.0, 13.0, 9.0, 16.0, 3.0, 8.0, 13.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.669921875, -3.543609619140625, -3.41729736328125, -3.290985107421875, -3.1646728515625, -3.038360595703125, -2.91204833984375, -2.785736083984375, -2.659423828125, -2.533111572265625, -2.40679931640625, -2.280487060546875, -2.1541748046875, -2.027862548828125, -1.90155029296875, -1.775238037109375, -1.64892578125, -1.522613525390625, -1.39630126953125, -1.269989013671875, -1.1436767578125, -1.017364501953125, -0.89105224609375, -0.764739990234375, -0.638427734375, -0.512115478515625, -0.38580322265625, -0.259490966796875, -0.1331787109375, -0.006866455078125, 0.11944580078125, 0.245758056640625, 0.3720703125, 0.498382568359375, 0.62469482421875, 0.751007080078125, 0.8773193359375, 1.003631591796875, 1.12994384765625, 1.256256103515625, 1.382568359375, 1.508880615234375, 1.63519287109375, 1.761505126953125, 1.8878173828125, 2.014129638671875, 2.14044189453125, 2.266754150390625, 2.39306640625, 2.519378662109375, 2.64569091796875, 2.772003173828125, 2.8983154296875, 3.024627685546875, 3.15093994140625, 3.277252197265625, 3.403564453125, 3.529876708984375, 3.65618896484375, 3.782501220703125, 3.9088134765625, 4.035125732421875, 4.16143798828125, 4.287750244140625, 4.4140625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 13.0, 12.0, 21.0, 27.0, 38.0, 46.0, 55.0, 84.0, 83.0, 133.0, 191.0, 264.0, 362.0, 442.0, 639.0, 869.0, 1331.0, 1816.0, 2757.0, 4349.0, 7969.0, 19427.0, 98191.0, 648804.0, 204308.0, 30577.0, 10150.0, 5202.0, 3188.0, 2089.0, 1421.0, 1020.0, 696.0, 502.0, 362.0, 288.0, 221.0, 159.0, 116.0, 93.0, 62.0, 26.0, 36.0, 38.0, 20.0, 16.0, 15.0, 4.0, 9.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.34234619140625, -7.0948486328125, -6.84735107421875, -6.599853515625, -6.35235595703125, -6.1048583984375, -5.85736083984375, -5.60986328125, -5.36236572265625, -5.1148681640625, -4.86737060546875, -4.619873046875, -4.37237548828125, -4.1248779296875, -3.87738037109375, -3.6298828125, -3.38238525390625, -3.1348876953125, -2.88739013671875, -2.639892578125, -2.39239501953125, -2.1448974609375, -1.89739990234375, -1.64990234375, -1.40240478515625, -1.1549072265625, -0.90740966796875, -0.659912109375, -0.41241455078125, -0.1649169921875, 0.08258056640625, 0.330078125, 0.57757568359375, 0.8250732421875, 1.07257080078125, 1.320068359375, 1.56756591796875, 1.8150634765625, 2.06256103515625, 2.31005859375, 2.55755615234375, 2.8050537109375, 3.05255126953125, 3.300048828125, 3.54754638671875, 3.7950439453125, 4.04254150390625, 4.2900390625, 4.53753662109375, 4.7850341796875, 5.03253173828125, 5.280029296875, 5.52752685546875, 5.7750244140625, 6.02252197265625, 6.27001953125, 6.51751708984375, 6.7650146484375, 7.01251220703125, 7.260009765625, 7.50750732421875, 7.7550048828125, 8.00250244140625, 8.25]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 19.0, 17.0, 18.0, 14.0, 22.0, 32.0, 31.0, 30.0, 39.0, 40.0, 63.0, 72.0, 70.0, 154.0, 1610.0, 298.0, 91.0, 82.0, 63.0, 41.0, 36.0, 33.0, 26.0, 24.0, 11.0, 16.0, 16.0, 13.0, 17.0, 7.0, 6.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.18896484375, -15.5341796875, -14.87939453125, -14.224609375, -13.56982421875, -12.9150390625, -12.26025390625, -11.60546875, -10.95068359375, -10.2958984375, -9.64111328125, -8.986328125, -8.33154296875, -7.6767578125, -7.02197265625, -6.3671875, -5.71240234375, -5.0576171875, -4.40283203125, -3.748046875, -3.09326171875, -2.4384765625, -1.78369140625, -1.12890625, -0.47412109375, 0.1806640625, 0.83544921875, 1.490234375, 2.14501953125, 2.7998046875, 3.45458984375, 4.109375, 4.76416015625, 5.4189453125, 6.07373046875, 6.728515625, 7.38330078125, 8.0380859375, 8.69287109375, 9.34765625, 10.00244140625, 10.6572265625, 11.31201171875, 11.966796875, 12.62158203125, 13.2763671875, 13.93115234375, 14.5859375, 15.24072265625, 15.8955078125, 16.55029296875, 17.205078125, 17.85986328125, 18.5146484375, 19.16943359375, 19.82421875, 20.47900390625, 21.1337890625, 21.78857421875, 22.443359375, 23.09814453125, 23.7529296875, 24.40771484375, 25.0625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 10.0, 14.0, 19.0, 25.0, 30.0, 34.0, 35.0, 76.0, 119.0, 255.0, 520.0, 1093.0, 2457.0, 6863.0, 25826.0, 333715.0, 2697464.0, 58419.0, 11747.0, 3821.0, 1543.0, 707.0, 343.0, 176.0, 108.0, 76.0, 42.0, 33.0, 29.0, 22.0, 14.0, 9.0, 7.0, 3.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.875, -28.005859375, -27.13671875, -26.267578125, -25.3984375, -24.529296875, -23.66015625, -22.791015625, -21.921875, -21.052734375, -20.18359375, -19.314453125, -18.4453125, -17.576171875, -16.70703125, -15.837890625, -14.96875, -14.099609375, -13.23046875, -12.361328125, -11.4921875, -10.623046875, -9.75390625, -8.884765625, -8.015625, -7.146484375, -6.27734375, -5.408203125, -4.5390625, -3.669921875, -2.80078125, -1.931640625, -1.0625, -0.193359375, 0.67578125, 1.544921875, 2.4140625, 3.283203125, 4.15234375, 5.021484375, 5.890625, 6.759765625, 7.62890625, 8.498046875, 9.3671875, 10.236328125, 11.10546875, 11.974609375, 12.84375, 13.712890625, 14.58203125, 15.451171875, 16.3203125, 17.189453125, 18.05859375, 18.927734375, 19.796875, 20.666015625, 21.53515625, 22.404296875, 23.2734375, 24.142578125, 25.01171875, 25.880859375, 26.75]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 26.0, 209.0, 537.0, 204.0, 27.0, 6.0], "bins": [-347.0757141113281, -341.3372497558594, -335.5987548828125, -329.86029052734375, -324.121826171875, -318.38336181640625, -312.6448669433594, -306.9064025878906, -301.1679382324219, -295.4294738769531, -289.69097900390625, -283.9525146484375, -278.21405029296875, -272.4755859375, -266.7370910644531, -260.9986267089844, -255.26016235351562, -249.5216827392578, -243.78321838378906, -238.04473876953125, -232.3062744140625, -226.5677947998047, -220.82933044433594, -215.09085083007812, -209.3523712158203, -203.6138916015625, -197.87542724609375, -192.13694763183594, -186.3984832763672, -180.66000366210938, -174.92153930664062, -169.1830596923828, -163.44459533691406, -157.70611572265625, -151.9676513671875, -146.2291717529297, -140.49070739746094, -134.75222778320312, -129.01376342773438, -123.27528381347656, -117.53681945800781, -111.79834747314453, -106.05987548828125, -100.32140350341797, -94.58293151855469, -88.8444595336914, -83.10598754882812, -77.36750793457031, -71.62904357910156, -65.89057159423828, -60.152099609375, -54.41362762451172, -48.67515563964844, -42.936683654785156, -37.19820785522461, -31.459735870361328, -25.72126007080078, -19.9827880859375, -14.244315147399902, -8.505842208862305, -2.7673702239990234, 2.971101760864258, 8.709575653076172, 14.448047637939453, 20.186519622802734]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 9.0, 8.0, 5.0, 10.0, 8.0, 9.0, 17.0, 22.0, 29.0, 23.0, 24.0, 30.0, 24.0, 32.0, 37.0, 43.0, 38.0, 52.0, 34.0, 41.0, 36.0, 28.0, 34.0, 36.0, 39.0, 34.0, 42.0, 32.0, 24.0, 31.0, 27.0, 15.0, 27.0, 17.0, 16.0, 13.0, 10.0, 10.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.22519302368164, -56.46272659301758, -54.70025634765625, -52.93778991699219, -51.175323486328125, -49.41285705566406, -47.650390625, -45.88792037963867, -44.12545394897461, -42.36298751831055, -40.60051727294922, -38.838050842285156, -37.075584411621094, -35.31311798095703, -33.55065155029297, -31.78818130493164, -30.025714874267578, -28.263248443603516, -26.50078010559082, -24.738311767578125, -22.975845336914062, -21.21337890625, -19.450910568237305, -17.68844223022461, -15.925975799560547, -14.163508415222168, -12.401041030883789, -10.63857364654541, -8.876106262207031, -7.113638877868652, -5.351171493530273, -3.5887041091918945, -1.8262367248535156, -0.06376934051513672, 1.6986980438232422, 3.461165428161621, 5.2236328125, 6.986100196838379, 8.748567581176758, 10.511034965515137, 12.273502349853516, 14.035969734191895, 15.798437118530273, 17.56090545654297, 19.32337188720703, 21.085838317871094, 22.84830665588379, 24.610774993896484, 26.373241424560547, 28.13570785522461, 29.898176193237305, 31.66064453125, 33.42311096191406, 35.185577392578125, 36.94804382324219, 38.710514068603516, 40.47298049926758, 42.23544692993164, 43.99791717529297, 45.76038360595703, 47.522850036621094, 49.285316467285156, 51.04778289794922, 52.81025314331055, 54.57271957397461]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 10.0, 10.0, 13.0, 21.0, 8.0, 26.0, 28.0, 29.0, 23.0, 26.0, 29.0, 20.0, 46.0, 30.0, 42.0, 36.0, 35.0, 44.0, 51.0, 39.0, 39.0, 41.0, 38.0, 33.0, 29.0, 30.0, 28.0, 19.0, 21.0, 20.0, 16.0, 15.0, 13.0, 10.0, 6.0, 8.0, 7.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.08203125, -3.94866943359375, -3.8153076171875, -3.68194580078125, -3.548583984375, -3.41522216796875, -3.2818603515625, -3.14849853515625, -3.01513671875, -2.88177490234375, -2.7484130859375, -2.61505126953125, -2.481689453125, -2.34832763671875, -2.2149658203125, -2.08160400390625, -1.9482421875, -1.81488037109375, -1.6815185546875, -1.54815673828125, -1.414794921875, -1.28143310546875, -1.1480712890625, -1.01470947265625, -0.88134765625, -0.74798583984375, -0.6146240234375, -0.48126220703125, -0.347900390625, -0.21453857421875, -0.0811767578125, 0.05218505859375, 0.185546875, 0.31890869140625, 0.4522705078125, 0.58563232421875, 0.718994140625, 0.85235595703125, 0.9857177734375, 1.11907958984375, 1.25244140625, 1.38580322265625, 1.5191650390625, 1.65252685546875, 1.785888671875, 1.91925048828125, 2.0526123046875, 2.18597412109375, 2.3193359375, 2.45269775390625, 2.5860595703125, 2.71942138671875, 2.852783203125, 2.98614501953125, 3.1195068359375, 3.25286865234375, 3.38623046875, 3.51959228515625, 3.6529541015625, 3.78631591796875, 3.919677734375, 4.05303955078125, 4.1864013671875, 4.31976318359375, 4.453125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 6.0, 8.0, 16.0, 14.0, 16.0, 35.0, 49.0, 68.0, 90.0, 117.0, 155.0, 262.0, 294.0, 451.0, 639.0, 847.0, 1075.0, 1581.0, 2099.0, 2981.0, 4278.0, 6241.0, 9674.0, 15547.0, 28343.0, 74312.0, 460999.0, 2657066.0, 743620.0, 100308.0, 32624.0, 17114.0, 10293.0, 6749.0, 4546.0, 3191.0, 2225.0, 1704.0, 1213.0, 904.0, 664.0, 490.0, 370.0, 272.0, 205.0, 153.0, 97.0, 81.0, 62.0, 50.0, 30.0, 21.0, 15.0, 10.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-9.6015625, -9.287841796875, -8.97412109375, -8.660400390625, -8.3466796875, -8.032958984375, -7.71923828125, -7.405517578125, -7.091796875, -6.778076171875, -6.46435546875, -6.150634765625, -5.8369140625, -5.523193359375, -5.20947265625, -4.895751953125, -4.58203125, -4.268310546875, -3.95458984375, -3.640869140625, -3.3271484375, -3.013427734375, -2.69970703125, -2.385986328125, -2.072265625, -1.758544921875, -1.44482421875, -1.131103515625, -0.8173828125, -0.503662109375, -0.18994140625, 0.123779296875, 0.4375, 0.751220703125, 1.06494140625, 1.378662109375, 1.6923828125, 2.006103515625, 2.31982421875, 2.633544921875, 2.947265625, 3.260986328125, 3.57470703125, 3.888427734375, 4.2021484375, 4.515869140625, 4.82958984375, 5.143310546875, 5.45703125, 5.770751953125, 6.08447265625, 6.398193359375, 6.7119140625, 7.025634765625, 7.33935546875, 7.653076171875, 7.966796875, 8.280517578125, 8.59423828125, 8.907958984375, 9.2216796875, 9.535400390625, 9.84912109375, 10.162841796875, 10.4765625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 10.0, 8.0, 5.0, 19.0, 14.0, 23.0, 39.0, 56.0, 74.0, 134.0, 237.0, 556.0, 968.0, 897.0, 448.0, 222.0, 100.0, 76.0, 41.0, 25.0, 17.0, 16.0, 12.0, 14.0, 10.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8472900390625, -13.311767578125, -12.7762451171875, -12.24072265625, -11.7052001953125, -11.169677734375, -10.6341552734375, -10.0986328125, -9.5631103515625, -9.027587890625, -8.4920654296875, -7.95654296875, -7.4210205078125, -6.885498046875, -6.3499755859375, -5.814453125, -5.2789306640625, -4.743408203125, -4.2078857421875, -3.67236328125, -3.1368408203125, -2.601318359375, -2.0657958984375, -1.5302734375, -0.9947509765625, -0.459228515625, 0.0762939453125, 0.61181640625, 1.1473388671875, 1.682861328125, 2.2183837890625, 2.75390625, 3.2894287109375, 3.824951171875, 4.3604736328125, 4.89599609375, 5.4315185546875, 5.967041015625, 6.5025634765625, 7.0380859375, 7.5736083984375, 8.109130859375, 8.6446533203125, 9.18017578125, 9.7156982421875, 10.251220703125, 10.7867431640625, 11.322265625, 11.8577880859375, 12.393310546875, 12.9288330078125, 13.46435546875, 13.9998779296875, 14.535400390625, 15.0709228515625, 15.6064453125, 16.1419677734375, 16.677490234375, 17.2130126953125, 17.74853515625, 18.2840576171875, 18.819580078125, 19.3551025390625, 19.890625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 8.0, 2.0, 11.0, 7.0, 13.0, 14.0, 27.0, 44.0, 62.0, 72.0, 137.0, 261.0, 361.0, 639.0, 1008.0, 1765.0, 3114.0, 5718.0, 11974.0, 28444.0, 99341.0, 1362363.0, 2475696.0, 139465.0, 34995.0, 13664.0, 6683.0, 3536.0, 1953.0, 1160.0, 661.0, 387.0, 262.0, 154.0, 105.0, 72.0, 37.0, 29.0, 19.0, 7.0, 11.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.437255859375, -17.70263671875, -16.968017578125, -16.2333984375, -15.498779296875, -14.76416015625, -14.029541015625, -13.294921875, -12.560302734375, -11.82568359375, -11.091064453125, -10.3564453125, -9.621826171875, -8.88720703125, -8.152587890625, -7.41796875, -6.683349609375, -5.94873046875, -5.214111328125, -4.4794921875, -3.744873046875, -3.01025390625, -2.275634765625, -1.541015625, -0.806396484375, -0.07177734375, 0.662841796875, 1.3974609375, 2.132080078125, 2.86669921875, 3.601318359375, 4.3359375, 5.070556640625, 5.80517578125, 6.539794921875, 7.2744140625, 8.009033203125, 8.74365234375, 9.478271484375, 10.212890625, 10.947509765625, 11.68212890625, 12.416748046875, 13.1513671875, 13.885986328125, 14.62060546875, 15.355224609375, 16.08984375, 16.824462890625, 17.55908203125, 18.293701171875, 19.0283203125, 19.762939453125, 20.49755859375, 21.232177734375, 21.966796875, 22.701416015625, 23.43603515625, 24.170654296875, 24.9052734375, 25.639892578125, 26.37451171875, 27.109130859375, 27.84375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 12.0, 14.0, 17.0, 27.0, 33.0, 60.0, 125.0, 159.0, 161.0, 121.0, 107.0, 55.0, 46.0, 24.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.55537414550781, -113.7451400756836, -110.9349136352539, -108.12467956542969, -105.31444549560547, -102.50421142578125, -99.69398498535156, -96.88375091552734, -94.07351684570312, -91.2632827758789, -88.45305633544922, -85.642822265625, -82.83258819580078, -80.02235412597656, -77.21212768554688, -74.40189361572266, -71.59166717529297, -68.78143310546875, -65.97120666503906, -63.160972595214844, -60.350738525390625, -57.54050827026367, -54.73027801513672, -51.9200439453125, -49.10981369018555, -46.299583435058594, -43.489349365234375, -40.67911911010742, -37.86888885498047, -35.05865478515625, -32.2484245300293, -29.43819236755371, -26.62795639038086, -23.817724227905273, -21.007492065429688, -18.197261810302734, -15.387029647827148, -12.576797485351562, -9.76656723022461, -6.956335067749023, -4.1461029052734375, -1.3358712196350098, 1.474360466003418, 4.2845916748046875, 7.094823837280273, 9.90505599975586, 12.715286254882812, 15.525518417358398, 18.335750579833984, 21.14598274230957, 23.956214904785156, 26.76644515991211, 29.576677322387695, 32.38690948486328, 35.197139739990234, 38.00736999511719, 40.817604064941406, 43.62783432006836, 46.43806838989258, 49.24829864501953, 52.05853271484375, 54.8687629699707, 57.678993225097656, 60.489227294921875, 63.29945755004883]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 6.0, 12.0, 19.0, 15.0, 21.0, 22.0, 30.0, 32.0, 23.0, 31.0, 35.0, 36.0, 39.0, 26.0, 43.0, 41.0, 45.0, 43.0, 44.0, 46.0, 39.0, 46.0, 28.0, 30.0, 36.0, 25.0, 27.0, 17.0, 11.0, 19.0, 19.0, 7.0, 9.0, 12.0, 10.0, 2.0, 3.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.914405822753906, -40.61658477783203, -39.31876754760742, -38.02094650268555, -36.72312927246094, -35.42530822753906, -34.12748718261719, -32.82966613769531, -31.531848907470703, -30.23402976989746, -28.93621063232422, -27.638389587402344, -26.3405704498291, -25.04275131225586, -23.744930267333984, -22.447111129760742, -21.1492919921875, -19.851472854614258, -18.553653717041016, -17.25583267211914, -15.958013534545898, -14.660194396972656, -13.362374305725098, -12.064554214477539, -10.766735076904297, -9.468915939331055, -8.171095848083496, -6.873276233673096, -5.575456619262695, -4.277637004852295, -2.9798173904418945, -1.681997299194336, -0.38417816162109375, 0.9136414527893066, 2.211461067199707, 3.5092806816101074, 4.807100296020508, 6.104919910430908, 7.402739524841309, 8.700559616088867, 9.99837875366211, 11.296197891235352, 12.59401798248291, 13.891838073730469, 15.189657211303711, 16.487476348876953, 17.785297393798828, 19.08311653137207, 20.380935668945312, 21.678754806518555, 22.976573944091797, 24.274394989013672, 25.572214126586914, 26.870033264160156, 28.16785430908203, 29.465673446655273, 30.763492584228516, 32.06131362915039, 33.359130859375, 34.656951904296875, 35.95477294921875, 37.25259017944336, 38.550411224365234, 39.848228454589844, 41.14604949951172]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 0.0, 4.0, 7.0, 5.0, 9.0, 13.0, 14.0, 17.0, 19.0, 17.0, 24.0, 40.0, 23.0, 30.0, 32.0, 30.0, 36.0, 41.0, 40.0, 36.0, 46.0, 37.0, 47.0, 46.0, 39.0, 50.0, 42.0, 32.0, 28.0, 27.0, 23.0, 27.0, 14.0, 17.0, 9.0, 11.0, 12.0, 4.0, 15.0, 2.0, 8.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.7265625, -4.58050537109375, -4.4344482421875, -4.28839111328125, -4.142333984375, -3.99627685546875, -3.8502197265625, -3.70416259765625, -3.55810546875, -3.41204833984375, -3.2659912109375, -3.11993408203125, -2.973876953125, -2.82781982421875, -2.6817626953125, -2.53570556640625, -2.3896484375, -2.24359130859375, -2.0975341796875, -1.95147705078125, -1.805419921875, -1.65936279296875, -1.5133056640625, -1.36724853515625, -1.22119140625, -1.07513427734375, -0.9290771484375, -0.78302001953125, -0.636962890625, -0.49090576171875, -0.3448486328125, -0.19879150390625, -0.052734375, 0.09332275390625, 0.2393798828125, 0.38543701171875, 0.531494140625, 0.67755126953125, 0.8236083984375, 0.96966552734375, 1.11572265625, 1.26177978515625, 1.4078369140625, 1.55389404296875, 1.699951171875, 1.84600830078125, 1.9920654296875, 2.13812255859375, 2.2841796875, 2.43023681640625, 2.5762939453125, 2.72235107421875, 2.868408203125, 3.01446533203125, 3.1605224609375, 3.30657958984375, 3.45263671875, 3.59869384765625, 3.7447509765625, 3.89080810546875, 4.036865234375, 4.18292236328125, 4.3289794921875, 4.47503662109375, 4.62109375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 17.0, 27.0, 29.0, 58.0, 61.0, 114.0, 171.0, 205.0, 317.0, 416.0, 583.0, 895.0, 1338.0, 2103.0, 3336.0, 5653.0, 9637.0, 17588.0, 34077.0, 74546.0, 210079.0, 425354.0, 142520.0, 57078.0, 26979.0, 14216.0, 8095.0, 4715.0, 2792.0, 1803.0, 1124.0, 786.0, 571.0, 371.0, 277.0, 184.0, 145.0, 84.0, 68.0, 46.0, 27.0, 21.0, 13.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.98193359375, -19.3232421875, -18.66455078125, -18.005859375, -17.34716796875, -16.6884765625, -16.02978515625, -15.37109375, -14.71240234375, -14.0537109375, -13.39501953125, -12.736328125, -12.07763671875, -11.4189453125, -10.76025390625, -10.1015625, -9.44287109375, -8.7841796875, -8.12548828125, -7.466796875, -6.80810546875, -6.1494140625, -5.49072265625, -4.83203125, -4.17333984375, -3.5146484375, -2.85595703125, -2.197265625, -1.53857421875, -0.8798828125, -0.22119140625, 0.4375, 1.09619140625, 1.7548828125, 2.41357421875, 3.072265625, 3.73095703125, 4.3896484375, 5.04833984375, 5.70703125, 6.36572265625, 7.0244140625, 7.68310546875, 8.341796875, 9.00048828125, 9.6591796875, 10.31787109375, 10.9765625, 11.63525390625, 12.2939453125, 12.95263671875, 13.611328125, 14.27001953125, 14.9287109375, 15.58740234375, 16.24609375, 16.90478515625, 17.5634765625, 18.22216796875, 18.880859375, 19.53955078125, 20.1982421875, 20.85693359375, 21.515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 12.0, 10.0, 10.0, 12.0, 23.0, 20.0, 26.0, 28.0, 30.0, 43.0, 40.0, 49.0, 42.0, 43.0, 39.0, 50.0, 1068.0, 43.0, 37.0, 40.0, 39.0, 38.0, 35.0, 38.0, 15.0, 19.0, 23.0, 19.0, 18.0, 17.0, 14.0, 15.0, 6.0, 11.0, 3.0, 3.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.58050537109375, -4.4422607421875, -4.30401611328125, -4.165771484375, -4.02752685546875, -3.8892822265625, -3.75103759765625, -3.61279296875, -3.47454833984375, -3.3363037109375, -3.19805908203125, -3.059814453125, -2.92156982421875, -2.7833251953125, -2.64508056640625, -2.5068359375, -2.36859130859375, -2.2303466796875, -2.09210205078125, -1.953857421875, -1.81561279296875, -1.6773681640625, -1.53912353515625, -1.40087890625, -1.26263427734375, -1.1243896484375, -0.98614501953125, -0.847900390625, -0.70965576171875, -0.5714111328125, -0.43316650390625, -0.294921875, -0.15667724609375, -0.0184326171875, 0.11981201171875, 0.258056640625, 0.39630126953125, 0.5345458984375, 0.67279052734375, 0.81103515625, 0.94927978515625, 1.0875244140625, 1.22576904296875, 1.364013671875, 1.50225830078125, 1.6405029296875, 1.77874755859375, 1.9169921875, 2.05523681640625, 2.1934814453125, 2.33172607421875, 2.469970703125, 2.60821533203125, 2.7464599609375, 2.88470458984375, 3.02294921875, 3.16119384765625, 3.2994384765625, 3.43768310546875, 3.575927734375, 3.71417236328125, 3.8524169921875, 3.99066162109375, 4.12890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 10.0, 14.0, 15.0, 32.0, 34.0, 55.0, 76.0, 135.0, 158.0, 255.0, 391.0, 589.0, 857.0, 1493.0, 2369.0, 4536.0, 8284.0, 17497.0, 44073.0, 181516.0, 1406804.0, 321766.0, 61369.0, 21870.0, 10113.0, 5166.0, 2924.0, 1677.0, 1024.0, 692.0, 393.0, 305.0, 192.0, 153.0, 81.0, 58.0, 51.0, 31.0, 16.0, 17.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.263916015625, -14.73095703125, -14.197998046875, -13.6650390625, -13.132080078125, -12.59912109375, -12.066162109375, -11.533203125, -11.000244140625, -10.46728515625, -9.934326171875, -9.4013671875, -8.868408203125, -8.33544921875, -7.802490234375, -7.26953125, -6.736572265625, -6.20361328125, -5.670654296875, -5.1376953125, -4.604736328125, -4.07177734375, -3.538818359375, -3.005859375, -2.472900390625, -1.93994140625, -1.406982421875, -0.8740234375, -0.341064453125, 0.19189453125, 0.724853515625, 1.2578125, 1.790771484375, 2.32373046875, 2.856689453125, 3.3896484375, 3.922607421875, 4.45556640625, 4.988525390625, 5.521484375, 6.054443359375, 6.58740234375, 7.120361328125, 7.6533203125, 8.186279296875, 8.71923828125, 9.252197265625, 9.78515625, 10.318115234375, 10.85107421875, 11.384033203125, 11.9169921875, 12.449951171875, 12.98291015625, 13.515869140625, 14.048828125, 14.581787109375, 15.11474609375, 15.647705078125, 16.1806640625, 16.713623046875, 17.24658203125, 17.779541015625, 18.3125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 9.0, 8.0, 21.0, 15.0, 10.0, 13.0, 21.0, 21.0, 38.0, 39.0, 42.0, 60.0, 81.0, 107.0, 111.0, 87.0, 54.0, 37.0, 42.0, 23.0, 31.0, 24.0, 13.0, 13.0, 11.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.376953125, -2.288330078125, -2.19970703125, -2.111083984375, -2.0224609375, -1.933837890625, -1.84521484375, -1.756591796875, -1.66796875, -1.579345703125, -1.49072265625, -1.402099609375, -1.3134765625, -1.224853515625, -1.13623046875, -1.047607421875, -0.958984375, -0.870361328125, -0.78173828125, -0.693115234375, -0.6044921875, -0.515869140625, -0.42724609375, -0.338623046875, -0.25, -0.161376953125, -0.07275390625, 0.015869140625, 0.1044921875, 0.193115234375, 0.28173828125, 0.370361328125, 0.458984375, 0.547607421875, 0.63623046875, 0.724853515625, 0.8134765625, 0.902099609375, 0.99072265625, 1.079345703125, 1.16796875, 1.256591796875, 1.34521484375, 1.433837890625, 1.5224609375, 1.611083984375, 1.69970703125, 1.788330078125, 1.876953125, 1.965576171875, 2.05419921875, 2.142822265625, 2.2314453125, 2.320068359375, 2.40869140625, 2.497314453125, 2.5859375, 2.674560546875, 2.76318359375, 2.851806640625, 2.9404296875, 3.029052734375, 3.11767578125, 3.206298828125, 3.294921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 8.0, 11.0, 14.0, 11.0, 17.0, 22.0, 32.0, 39.0, 42.0, 68.0, 90.0, 123.0, 173.0, 293.0, 635.0, 1894.0, 9636.0, 131758.0, 854315.0, 42151.0, 4787.0, 1156.0, 448.0, 211.0, 163.0, 99.0, 68.0, 77.0, 46.0, 34.0, 34.0, 23.0, 14.0, 10.0, 13.0, 10.0, 5.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.96875, -33.85205078125, -32.7353515625, -31.61865234375, -30.501953125, -29.38525390625, -28.2685546875, -27.15185546875, -26.03515625, -24.91845703125, -23.8017578125, -22.68505859375, -21.568359375, -20.45166015625, -19.3349609375, -18.21826171875, -17.1015625, -15.98486328125, -14.8681640625, -13.75146484375, -12.634765625, -11.51806640625, -10.4013671875, -9.28466796875, -8.16796875, -7.05126953125, -5.9345703125, -4.81787109375, -3.701171875, -2.58447265625, -1.4677734375, -0.35107421875, 0.765625, 1.88232421875, 2.9990234375, 4.11572265625, 5.232421875, 6.34912109375, 7.4658203125, 8.58251953125, 9.69921875, 10.81591796875, 11.9326171875, 13.04931640625, 14.166015625, 15.28271484375, 16.3994140625, 17.51611328125, 18.6328125, 19.74951171875, 20.8662109375, 21.98291015625, 23.099609375, 24.21630859375, 25.3330078125, 26.44970703125, 27.56640625, 28.68310546875, 29.7998046875, 30.91650390625, 32.033203125, 33.14990234375, 34.2666015625, 35.38330078125, 36.5]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 8.0, 8.0, 14.0, 15.0, 26.0, 52.0, 85.0, 144.0, 152.0, 161.0, 129.0, 78.0, 58.0, 27.0, 18.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.857371807098389, -7.584421634674072, -7.311471462249756, -7.0385212898254395, -6.765571117401123, -6.492620944976807, -6.219671249389648, -5.946721076965332, -5.673770904541016, -5.400820732116699, -5.127870559692383, -4.854920387268066, -4.58197021484375, -4.309020042419434, -4.036069869995117, -3.76311993598938, -3.4901695251464844, -3.217219352722168, -2.9442691802978516, -2.671319007873535, -2.3983688354492188, -2.1254186630249023, -1.852468729019165, -1.5795185565948486, -1.3065683841705322, -1.0336182117462158, -0.7606680989265442, -0.48771798610687256, -0.21476781368255615, 0.058182358741760254, 0.3311324119567871, 0.6040825843811035, 0.8770332336425781, 1.1499834060668945, 1.422933578491211, 1.6958836317062378, 1.9688338041305542, 2.24178409576416, 2.5147340297698975, 2.787684202194214, 3.0606343746185303, 3.3335845470428467, 3.606534719467163, 3.8794846534729004, 4.152434825897217, 4.425384998321533, 4.69833517074585, 4.971285343170166, 5.244235515594482, 5.517185688018799, 5.790135860443115, 6.063086032867432, 6.336036205291748, 6.6089863777160645, 6.881936073303223, 7.154886245727539, 7.4278364181518555, 7.700786590576172, 7.973736763000488, 8.246686935424805, 8.519637107849121, 8.792587280273438, 9.065537452697754, 9.33848762512207, 9.611437797546387]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 10.0, 14.0, 8.0, 13.0, 15.0, 20.0, 32.0, 37.0, 30.0, 38.0, 40.0, 34.0, 43.0, 45.0, 51.0, 46.0, 44.0, 43.0, 56.0, 38.0, 46.0, 34.0, 28.0, 34.0, 21.0, 38.0, 32.0, 22.0, 25.0, 10.0, 16.0, 8.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.479132652282715, -4.336423397064209, -4.193713665008545, -4.051004409790039, -3.908295154571533, -3.7655856609344482, -3.6228761672973633, -3.4801669120788574, -3.3374576568603516, -3.1947481632232666, -3.0520389080047607, -2.909329414367676, -2.76662015914917, -2.623910665512085, -2.481201171875, -2.338491916656494, -2.195782423019409, -2.053072929382324, -1.9103636741638184, -1.7676541805267334, -1.6249449253082275, -1.4822354316711426, -1.3395260572433472, -1.1968166828155518, -1.0541073083877563, -0.9113979339599609, -0.7686885595321655, -0.6259791254997253, -0.48326975107192993, -0.3405603766441345, -0.19785094261169434, -0.055141568183898926, 0.08756780624389648, 0.2302771955728531, 0.3729865849018097, 0.5156959891319275, 0.6584053635597229, 0.8011147379875183, 0.9438241720199585, 1.086533546447754, 1.2292429208755493, 1.3719522953033447, 1.5146616697311401, 1.6573710441589355, 1.8000805377960205, 1.9427897930145264, 2.0854992866516113, 2.228208541870117, 2.370918035507202, 2.513627529144287, 2.656336784362793, 2.799046277999878, 2.941755533218384, 3.0844650268554688, 3.2271742820739746, 3.3698837757110596, 3.5125932693481445, 3.6553027629852295, 3.7980120182037354, 3.9407215118408203, 4.083430767059326, 4.226140022277832, 4.368849754333496, 4.511559009552002, 4.654268264770508]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 7.0, 11.0, 13.0, 13.0, 15.0, 16.0, 25.0, 21.0, 25.0, 25.0, 37.0, 32.0, 36.0, 35.0, 35.0, 44.0, 33.0, 44.0, 55.0, 65.0, 41.0, 42.0, 51.0, 32.0, 28.0, 33.0, 18.0, 21.0, 28.0, 9.0, 10.0, 12.0, 12.0, 15.0, 11.0, 9.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.46484375, -4.31591796875, -4.1669921875, -4.01806640625, -3.869140625, -3.72021484375, -3.5712890625, -3.42236328125, -3.2734375, -3.12451171875, -2.9755859375, -2.82666015625, -2.677734375, -2.52880859375, -2.3798828125, -2.23095703125, -2.08203125, -1.93310546875, -1.7841796875, -1.63525390625, -1.486328125, -1.33740234375, -1.1884765625, -1.03955078125, -0.890625, -0.74169921875, -0.5927734375, -0.44384765625, -0.294921875, -0.14599609375, 0.0029296875, 0.15185546875, 0.30078125, 0.44970703125, 0.5986328125, 0.74755859375, 0.896484375, 1.04541015625, 1.1943359375, 1.34326171875, 1.4921875, 1.64111328125, 1.7900390625, 1.93896484375, 2.087890625, 2.23681640625, 2.3857421875, 2.53466796875, 2.68359375, 2.83251953125, 2.9814453125, 3.13037109375, 3.279296875, 3.42822265625, 3.5771484375, 3.72607421875, 3.875, 4.02392578125, 4.1728515625, 4.32177734375, 4.470703125, 4.61962890625, 4.7685546875, 4.91748046875, 5.06640625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 12.0, 28.0, 29.0, 44.0, 56.0, 103.0, 130.0, 196.0, 293.0, 448.0, 676.0, 1002.0, 1503.0, 2531.0, 4315.0, 7446.0, 14027.0, 31977.0, 109561.0, 580627.0, 203146.0, 48929.0, 18667.0, 9142.0, 5150.0, 3135.0, 1871.0, 1198.0, 756.0, 529.0, 324.0, 209.0, 138.0, 111.0, 75.0, 54.0, 30.0, 23.0, 17.0, 12.0, 3.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.0, -12.625244140625, -12.25048828125, -11.875732421875, -11.5009765625, -11.126220703125, -10.75146484375, -10.376708984375, -10.001953125, -9.627197265625, -9.25244140625, -8.877685546875, -8.5029296875, -8.128173828125, -7.75341796875, -7.378662109375, -7.00390625, -6.629150390625, -6.25439453125, -5.879638671875, -5.5048828125, -5.130126953125, -4.75537109375, -4.380615234375, -4.005859375, -3.631103515625, -3.25634765625, -2.881591796875, -2.5068359375, -2.132080078125, -1.75732421875, -1.382568359375, -1.0078125, -0.633056640625, -0.25830078125, 0.116455078125, 0.4912109375, 0.865966796875, 1.24072265625, 1.615478515625, 1.990234375, 2.364990234375, 2.73974609375, 3.114501953125, 3.4892578125, 3.864013671875, 4.23876953125, 4.613525390625, 4.98828125, 5.363037109375, 5.73779296875, 6.112548828125, 6.4873046875, 6.862060546875, 7.23681640625, 7.611572265625, 7.986328125, 8.361083984375, 8.73583984375, 9.110595703125, 9.4853515625, 9.860107421875, 10.23486328125, 10.609619140625, 10.984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 9.0, 12.0, 9.0, 16.0, 13.0, 19.0, 29.0, 17.0, 31.0, 22.0, 25.0, 30.0, 44.0, 39.0, 50.0, 63.0, 101.0, 128.0, 235.0, 1355.0, 149.0, 108.0, 82.0, 64.0, 51.0, 43.0, 31.0, 40.0, 23.0, 36.0, 22.0, 27.0, 15.0, 15.0, 15.0, 12.0, 16.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0], "bins": [-15.96875, -15.4891357421875, -15.009521484375, -14.5299072265625, -14.05029296875, -13.5706787109375, -13.091064453125, -12.6114501953125, -12.1318359375, -11.6522216796875, -11.172607421875, -10.6929931640625, -10.21337890625, -9.7337646484375, -9.254150390625, -8.7745361328125, -8.294921875, -7.8153076171875, -7.335693359375, -6.8560791015625, -6.37646484375, -5.8968505859375, -5.417236328125, -4.9376220703125, -4.4580078125, -3.9783935546875, -3.498779296875, -3.0191650390625, -2.53955078125, -2.0599365234375, -1.580322265625, -1.1007080078125, -0.62109375, -0.1414794921875, 0.338134765625, 0.8177490234375, 1.29736328125, 1.7769775390625, 2.256591796875, 2.7362060546875, 3.2158203125, 3.6954345703125, 4.175048828125, 4.6546630859375, 5.13427734375, 5.6138916015625, 6.093505859375, 6.5731201171875, 7.052734375, 7.5323486328125, 8.011962890625, 8.4915771484375, 8.97119140625, 9.4508056640625, 9.930419921875, 10.4100341796875, 10.8896484375, 11.3692626953125, 11.848876953125, 12.3284912109375, 12.80810546875, 13.2877197265625, 13.767333984375, 14.2469482421875, 14.7265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 7.0, 15.0, 21.0, 32.0, 36.0, 64.0, 132.0, 230.0, 475.0, 1375.0, 5778.0, 47222.0, 2824890.0, 246964.0, 14330.0, 2565.0, 813.0, 327.0, 146.0, 91.0, 54.0, 40.0, 21.0, 19.0, 10.0, 14.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.65625, -52.81884765625, -50.9814453125, -49.14404296875, -47.306640625, -45.46923828125, -43.6318359375, -41.79443359375, -39.95703125, -38.11962890625, -36.2822265625, -34.44482421875, -32.607421875, -30.77001953125, -28.9326171875, -27.09521484375, -25.2578125, -23.42041015625, -21.5830078125, -19.74560546875, -17.908203125, -16.07080078125, -14.2333984375, -12.39599609375, -10.55859375, -8.72119140625, -6.8837890625, -5.04638671875, -3.208984375, -1.37158203125, 0.4658203125, 2.30322265625, 4.140625, 5.97802734375, 7.8154296875, 9.65283203125, 11.490234375, 13.32763671875, 15.1650390625, 17.00244140625, 18.83984375, 20.67724609375, 22.5146484375, 24.35205078125, 26.189453125, 28.02685546875, 29.8642578125, 31.70166015625, 33.5390625, 35.37646484375, 37.2138671875, 39.05126953125, 40.888671875, 42.72607421875, 44.5634765625, 46.40087890625, 48.23828125, 50.07568359375, 51.9130859375, 53.75048828125, 55.587890625, 57.42529296875, 59.2626953125, 61.10009765625, 62.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 372.0, 626.0, 16.0], "bins": [-1310.8900146484375, -1289.771728515625, -1268.6534423828125, -1247.53515625, -1226.4168701171875, -1205.298583984375, -1184.1802978515625, -1163.06201171875, -1141.943603515625, -1120.8253173828125, -1099.70703125, -1078.5887451171875, -1057.470458984375, -1036.3521728515625, -1015.2338256835938, -994.1155395507812, -972.997314453125, -951.8790283203125, -930.7607421875, -909.6424560546875, -888.524169921875, -867.4058227539062, -846.2875366210938, -825.1692504882812, -804.0509643554688, -782.9326782226562, -761.8143920898438, -740.6961059570312, -719.5777587890625, -698.45947265625, -677.3411865234375, -656.222900390625, -635.1046752929688, -613.9863891601562, -592.8681030273438, -571.7498168945312, -550.6314697265625, -529.51318359375, -508.3948974609375, -487.276611328125, -466.1583251953125, -445.0400390625, -423.9217529296875, -402.8034362792969, -381.6851501464844, -360.5668640136719, -339.44854736328125, -318.33026123046875, -297.21197509765625, -276.09368896484375, -254.9753875732422, -233.85708618164062, -212.73880004882812, -191.62051391601562, -170.50221252441406, -149.3839111328125, -128.265625, -107.14733123779297, -86.02903747558594, -64.9107437133789, -43.792449951171875, -22.674156188964844, -1.5558624267578125, 19.56243896484375, 40.680728912353516]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 11.0, 12.0, 19.0, 9.0, 12.0, 16.0, 24.0, 24.0, 21.0, 36.0, 21.0, 35.0, 39.0, 35.0, 42.0, 41.0, 33.0, 53.0, 48.0, 32.0, 41.0, 25.0, 30.0, 46.0, 21.0, 40.0, 24.0, 28.0, 20.0, 17.0, 22.0, 15.0, 12.0, 13.0, 12.0, 11.0, 16.0, 8.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.19475173950195, -47.45106506347656, -45.707374572753906, -43.963687896728516, -42.21999740600586, -40.47631072998047, -38.73262023925781, -36.98893356323242, -35.245243072509766, -33.501556396484375, -31.75786590576172, -30.014177322387695, -28.270488739013672, -26.52680206298828, -24.783111572265625, -23.039424896240234, -21.29573631286621, -19.552047729492188, -17.808359146118164, -16.06467056274414, -14.320981979370117, -12.57729434967041, -10.833605766296387, -9.089917182922363, -7.34622859954834, -5.602540016174316, -3.858851671218872, -2.1151633262634277, -0.3714747428894043, 1.372213363647461, 3.1159019470214844, 4.859590530395508, 6.603279113769531, 8.346967697143555, 10.090656280517578, 11.834344863891602, 13.578033447265625, 15.321721076965332, 17.065410614013672, 18.809097290039062, 20.55278778076172, 22.296476364135742, 24.040164947509766, 25.78385353088379, 27.527542114257812, 29.271228790283203, 31.01491928100586, 32.75860595703125, 34.502296447753906, 36.2459831237793, 37.98967361450195, 39.733360290527344, 41.47705078125, 43.22073745727539, 44.96442794799805, 46.70811462402344, 48.45180130004883, 50.19548797607422, 51.939178466796875, 53.682865142822266, 55.42655563354492, 57.17024230957031, 58.91393280029297, 60.65761947631836, 62.401309967041016]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 9.0, 5.0, 13.0, 12.0, 18.0, 17.0, 10.0, 18.0, 21.0, 18.0, 34.0, 36.0, 27.0, 29.0, 36.0, 34.0, 42.0, 42.0, 34.0, 42.0, 41.0, 34.0, 41.0, 42.0, 43.0, 26.0, 31.0, 28.0, 26.0, 27.0, 18.0, 12.0, 19.0, 14.0, 16.0, 10.0, 11.0, 4.0, 12.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.16015625, -4.01263427734375, -3.8651123046875, -3.71759033203125, -3.570068359375, -3.42254638671875, -3.2750244140625, -3.12750244140625, -2.97998046875, -2.83245849609375, -2.6849365234375, -2.53741455078125, -2.389892578125, -2.24237060546875, -2.0948486328125, -1.94732666015625, -1.7998046875, -1.65228271484375, -1.5047607421875, -1.35723876953125, -1.209716796875, -1.06219482421875, -0.9146728515625, -0.76715087890625, -0.61962890625, -0.47210693359375, -0.3245849609375, -0.17706298828125, -0.029541015625, 0.11798095703125, 0.2655029296875, 0.41302490234375, 0.560546875, 0.70806884765625, 0.8555908203125, 1.00311279296875, 1.150634765625, 1.29815673828125, 1.4456787109375, 1.59320068359375, 1.74072265625, 1.88824462890625, 2.0357666015625, 2.18328857421875, 2.330810546875, 2.47833251953125, 2.6258544921875, 2.77337646484375, 2.9208984375, 3.06842041015625, 3.2159423828125, 3.36346435546875, 3.510986328125, 3.65850830078125, 3.8060302734375, 3.95355224609375, 4.10107421875, 4.24859619140625, 4.3961181640625, 4.54364013671875, 4.691162109375, 4.83868408203125, 4.9862060546875, 5.13372802734375, 5.28125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 11.0, 9.0, 12.0, 11.0, 18.0, 24.0, 48.0, 44.0, 66.0, 114.0, 171.0, 264.0, 495.0, 824.0, 1450.0, 2493.0, 4451.0, 9120.0, 20397.0, 66838.0, 1318048.0, 2609618.0, 109113.0, 26746.0, 11333.0, 5518.0, 2804.0, 1702.0, 985.0, 601.0, 356.0, 211.0, 122.0, 77.0, 55.0, 30.0, 27.0, 19.0, 11.0, 13.0, 11.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.46142578125, -15.8759765625, -15.29052734375, -14.705078125, -14.11962890625, -13.5341796875, -12.94873046875, -12.36328125, -11.77783203125, -11.1923828125, -10.60693359375, -10.021484375, -9.43603515625, -8.8505859375, -8.26513671875, -7.6796875, -7.09423828125, -6.5087890625, -5.92333984375, -5.337890625, -4.75244140625, -4.1669921875, -3.58154296875, -2.99609375, -2.41064453125, -1.8251953125, -1.23974609375, -0.654296875, -0.06884765625, 0.5166015625, 1.10205078125, 1.6875, 2.27294921875, 2.8583984375, 3.44384765625, 4.029296875, 4.61474609375, 5.2001953125, 5.78564453125, 6.37109375, 6.95654296875, 7.5419921875, 8.12744140625, 8.712890625, 9.29833984375, 9.8837890625, 10.46923828125, 11.0546875, 11.64013671875, 12.2255859375, 12.81103515625, 13.396484375, 13.98193359375, 14.5673828125, 15.15283203125, 15.73828125, 16.32373046875, 16.9091796875, 17.49462890625, 18.080078125, 18.66552734375, 19.2509765625, 19.83642578125, 20.421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 0.0, 8.0, 7.0, 13.0, 10.0, 8.0, 22.0, 32.0, 27.0, 28.0, 58.0, 79.0, 127.0, 261.0, 512.0, 817.0, 791.0, 517.0, 266.0, 154.0, 76.0, 55.0, 38.0, 36.0, 27.0, 17.0, 15.0, 9.0, 10.0, 11.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -14.924560546875, -14.42724609375, -13.929931640625, -13.4326171875, -12.935302734375, -12.43798828125, -11.940673828125, -11.443359375, -10.946044921875, -10.44873046875, -9.951416015625, -9.4541015625, -8.956787109375, -8.45947265625, -7.962158203125, -7.46484375, -6.967529296875, -6.47021484375, -5.972900390625, -5.4755859375, -4.978271484375, -4.48095703125, -3.983642578125, -3.486328125, -2.989013671875, -2.49169921875, -1.994384765625, -1.4970703125, -0.999755859375, -0.50244140625, -0.005126953125, 0.4921875, 0.989501953125, 1.48681640625, 1.984130859375, 2.4814453125, 2.978759765625, 3.47607421875, 3.973388671875, 4.470703125, 4.968017578125, 5.46533203125, 5.962646484375, 6.4599609375, 6.957275390625, 7.45458984375, 7.951904296875, 8.44921875, 8.946533203125, 9.44384765625, 9.941162109375, 10.4384765625, 10.935791015625, 11.43310546875, 11.930419921875, 12.427734375, 12.925048828125, 13.42236328125, 13.919677734375, 14.4169921875, 14.914306640625, 15.41162109375, 15.908935546875, 16.40625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 13.0, 19.0, 25.0, 26.0, 45.0, 60.0, 98.0, 117.0, 183.0, 245.0, 375.0, 621.0, 867.0, 1395.0, 2160.0, 3609.0, 5991.0, 10823.0, 21791.0, 53634.0, 212044.0, 2145841.0, 1486137.0, 159495.0, 45096.0, 19195.0, 9818.0, 5359.0, 3263.0, 2135.0, 1232.0, 787.0, 576.0, 367.0, 277.0, 165.0, 120.0, 85.0, 66.0, 37.0, 19.0, 26.0, 18.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-18.703125, -18.16748046875, -17.6318359375, -17.09619140625, -16.560546875, -16.02490234375, -15.4892578125, -14.95361328125, -14.41796875, -13.88232421875, -13.3466796875, -12.81103515625, -12.275390625, -11.73974609375, -11.2041015625, -10.66845703125, -10.1328125, -9.59716796875, -9.0615234375, -8.52587890625, -7.990234375, -7.45458984375, -6.9189453125, -6.38330078125, -5.84765625, -5.31201171875, -4.7763671875, -4.24072265625, -3.705078125, -3.16943359375, -2.6337890625, -2.09814453125, -1.5625, -1.02685546875, -0.4912109375, 0.04443359375, 0.580078125, 1.11572265625, 1.6513671875, 2.18701171875, 2.72265625, 3.25830078125, 3.7939453125, 4.32958984375, 4.865234375, 5.40087890625, 5.9365234375, 6.47216796875, 7.0078125, 7.54345703125, 8.0791015625, 8.61474609375, 9.150390625, 9.68603515625, 10.2216796875, 10.75732421875, 11.29296875, 11.82861328125, 12.3642578125, 12.89990234375, 13.435546875, 13.97119140625, 14.5068359375, 15.04248046875, 15.578125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 42.0, 120.0, 282.0, 318.0, 158.0, 52.0, 13.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.03076171875, -304.70758056640625, -298.3843688964844, -292.0611877441406, -285.73797607421875, -279.414794921875, -273.0915832519531, -266.7684020996094, -260.4451904296875, -254.1219940185547, -247.79879760742188, -241.47560119628906, -235.15240478515625, -228.82920837402344, -222.50601196289062, -216.1828155517578, -209.859619140625, -203.5364227294922, -197.21322631835938, -190.89002990722656, -184.56683349609375, -178.24363708496094, -171.92044067382812, -165.5972442626953, -159.27406311035156, -152.95086669921875, -146.62767028808594, -140.30447387695312, -133.9812774658203, -127.6580810546875, -121.33488464355469, -115.01168823242188, -108.68849182128906, -102.36529541015625, -96.04209899902344, -89.71890258789062, -83.39570617675781, -77.072509765625, -70.74931335449219, -64.42611694335938, -58.10292434692383, -51.779727935791016, -45.4565315246582, -39.133338928222656, -32.810142517089844, -26.4869441986084, -20.16374969482422, -13.840553283691406, -7.517356872558594, -1.1941609382629395, 5.129034996032715, 11.452230453491211, 17.775426864624023, 24.098623275756836, 30.421817779541016, 36.74501419067383, 43.06821060180664, 49.39140701293945, 55.714603424072266, 62.03779602050781, 68.36099243164062, 74.68418884277344, 81.00738525390625, 87.33058166503906, 93.65377807617188]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 9.0, 5.0, 3.0, 4.0, 9.0, 11.0, 8.0, 12.0, 8.0, 16.0, 26.0, 24.0, 24.0, 22.0, 26.0, 28.0, 37.0, 35.0, 40.0, 48.0, 38.0, 47.0, 49.0, 40.0, 33.0, 40.0, 30.0, 38.0, 40.0, 35.0, 32.0, 31.0, 26.0, 28.0, 25.0, 15.0, 14.0, 12.0, 10.0, 10.0, 6.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.6296272277832, -46.21665573120117, -44.803680419921875, -43.390708923339844, -41.97773742675781, -40.564762115478516, -39.151790618896484, -37.73881530761719, -36.325843811035156, -34.912872314453125, -33.49989700317383, -32.0869255065918, -30.673952102661133, -29.26097869873047, -27.848007202148438, -26.435033798217773, -25.022062301635742, -23.609088897705078, -22.196117401123047, -20.783143997192383, -19.37017059326172, -17.957199096679688, -16.544225692749023, -15.13125228881836, -13.718279838562012, -12.305307388305664, -10.892333984375, -9.479361534118652, -8.066389083862305, -6.653415679931641, -5.240443229675293, -3.827469825744629, -2.4144973754882812, -1.001524567604065, 0.41144824028015137, 1.8244209289550781, 3.237393856048584, 4.65036678314209, 6.0633392333984375, 7.476312637329102, 8.88928508758545, 10.302257537841797, 11.715230941772461, 13.128203392028809, 14.541175842285156, 15.95414924621582, 17.367122650146484, 18.780094146728516, 20.19306755065918, 21.606040954589844, 23.019012451171875, 24.43198585510254, 25.844959259033203, 27.257930755615234, 28.6709041595459, 30.083877563476562, 31.496849060058594, 32.909820556640625, 34.32279586791992, 35.73576736450195, 37.148738861083984, 38.56171417236328, 39.97468566894531, 41.387657165527344, 42.80063247680664]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 11.0, 10.0, 13.0, 8.0, 19.0, 16.0, 14.0, 20.0, 15.0, 29.0, 22.0, 20.0, 29.0, 36.0, 36.0, 39.0, 51.0, 37.0, 34.0, 51.0, 33.0, 32.0, 40.0, 52.0, 34.0, 35.0, 29.0, 30.0, 25.0, 21.0, 23.0, 21.0, 14.0, 17.0, 14.0, 15.0, 6.0, 6.0, 3.0, 3.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.416748046875, -4.26708984375, -4.117431640625, -3.9677734375, -3.818115234375, -3.66845703125, -3.518798828125, -3.369140625, -3.219482421875, -3.06982421875, -2.920166015625, -2.7705078125, -2.620849609375, -2.47119140625, -2.321533203125, -2.171875, -2.022216796875, -1.87255859375, -1.722900390625, -1.5732421875, -1.423583984375, -1.27392578125, -1.124267578125, -0.974609375, -0.824951171875, -0.67529296875, -0.525634765625, -0.3759765625, -0.226318359375, -0.07666015625, 0.072998046875, 0.22265625, 0.372314453125, 0.52197265625, 0.671630859375, 0.8212890625, 0.970947265625, 1.12060546875, 1.270263671875, 1.419921875, 1.569580078125, 1.71923828125, 1.868896484375, 2.0185546875, 2.168212890625, 2.31787109375, 2.467529296875, 2.6171875, 2.766845703125, 2.91650390625, 3.066162109375, 3.2158203125, 3.365478515625, 3.51513671875, 3.664794921875, 3.814453125, 3.964111328125, 4.11376953125, 4.263427734375, 4.4130859375, 4.562744140625, 4.71240234375, 4.862060546875, 5.01171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 13.0, 16.0, 14.0, 30.0, 35.0, 52.0, 62.0, 82.0, 130.0, 175.0, 279.0, 340.0, 521.0, 714.0, 1053.0, 1600.0, 2622.0, 4285.0, 7936.0, 16150.0, 41155.0, 172410.0, 634156.0, 104066.0, 30465.0, 12980.0, 6571.0, 3727.0, 2216.0, 1436.0, 1006.0, 650.0, 434.0, 344.0, 242.0, 154.0, 111.0, 102.0, 61.0, 35.0, 39.0, 26.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-25.421875, -24.63623046875, -23.8505859375, -23.06494140625, -22.279296875, -21.49365234375, -20.7080078125, -19.92236328125, -19.13671875, -18.35107421875, -17.5654296875, -16.77978515625, -15.994140625, -15.20849609375, -14.4228515625, -13.63720703125, -12.8515625, -12.06591796875, -11.2802734375, -10.49462890625, -9.708984375, -8.92333984375, -8.1376953125, -7.35205078125, -6.56640625, -5.78076171875, -4.9951171875, -4.20947265625, -3.423828125, -2.63818359375, -1.8525390625, -1.06689453125, -0.28125, 0.50439453125, 1.2900390625, 2.07568359375, 2.861328125, 3.64697265625, 4.4326171875, 5.21826171875, 6.00390625, 6.78955078125, 7.5751953125, 8.36083984375, 9.146484375, 9.93212890625, 10.7177734375, 11.50341796875, 12.2890625, 13.07470703125, 13.8603515625, 14.64599609375, 15.431640625, 16.21728515625, 17.0029296875, 17.78857421875, 18.57421875, 19.35986328125, 20.1455078125, 20.93115234375, 21.716796875, 22.50244140625, 23.2880859375, 24.07373046875, 24.859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 7.0, 9.0, 9.0, 11.0, 12.0, 12.0, 21.0, 20.0, 24.0, 27.0, 24.0, 28.0, 17.0, 33.0, 27.0, 31.0, 32.0, 38.0, 40.0, 34.0, 1063.0, 42.0, 45.0, 44.0, 46.0, 34.0, 34.0, 35.0, 32.0, 18.0, 22.0, 23.0, 19.0, 23.0, 14.0, 12.0, 14.0, 12.0, 9.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.47705078125, -4.3330078125, -4.18896484375, -4.044921875, -3.90087890625, -3.7568359375, -3.61279296875, -3.46875, -3.32470703125, -3.1806640625, -3.03662109375, -2.892578125, -2.74853515625, -2.6044921875, -2.46044921875, -2.31640625, -2.17236328125, -2.0283203125, -1.88427734375, -1.740234375, -1.59619140625, -1.4521484375, -1.30810546875, -1.1640625, -1.02001953125, -0.8759765625, -0.73193359375, -0.587890625, -0.44384765625, -0.2998046875, -0.15576171875, -0.01171875, 0.13232421875, 0.2763671875, 0.42041015625, 0.564453125, 0.70849609375, 0.8525390625, 0.99658203125, 1.140625, 1.28466796875, 1.4287109375, 1.57275390625, 1.716796875, 1.86083984375, 2.0048828125, 2.14892578125, 2.29296875, 2.43701171875, 2.5810546875, 2.72509765625, 2.869140625, 3.01318359375, 3.1572265625, 3.30126953125, 3.4453125, 3.58935546875, 3.7333984375, 3.87744140625, 4.021484375, 4.16552734375, 4.3095703125, 4.45361328125, 4.59765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 14.0, 16.0, 30.0, 39.0, 41.0, 89.0, 103.0, 173.0, 270.0, 365.0, 562.0, 882.0, 1339.0, 2363.0, 4003.0, 7381.0, 15467.0, 39038.0, 210448.0, 1658620.0, 101336.0, 27875.0, 11918.0, 6026.0, 3334.0, 1965.0, 1241.0, 736.0, 462.0, 355.0, 216.0, 130.0, 83.0, 71.0, 48.0, 26.0, 23.0, 7.0, 15.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -25.045654296875, -24.29443359375, -23.543212890625, -22.7919921875, -22.040771484375, -21.28955078125, -20.538330078125, -19.787109375, -19.035888671875, -18.28466796875, -17.533447265625, -16.7822265625, -16.031005859375, -15.27978515625, -14.528564453125, -13.77734375, -13.026123046875, -12.27490234375, -11.523681640625, -10.7724609375, -10.021240234375, -9.27001953125, -8.518798828125, -7.767578125, -7.016357421875, -6.26513671875, -5.513916015625, -4.7626953125, -4.011474609375, -3.26025390625, -2.509033203125, -1.7578125, -1.006591796875, -0.25537109375, 0.495849609375, 1.2470703125, 1.998291015625, 2.74951171875, 3.500732421875, 4.251953125, 5.003173828125, 5.75439453125, 6.505615234375, 7.2568359375, 8.008056640625, 8.75927734375, 9.510498046875, 10.26171875, 11.012939453125, 11.76416015625, 12.515380859375, 13.2666015625, 14.017822265625, 14.76904296875, 15.520263671875, 16.271484375, 17.022705078125, 17.77392578125, 18.525146484375, 19.2763671875, 20.027587890625, 20.77880859375, 21.530029296875, 22.28125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 6.0, 9.0, 13.0, 23.0, 26.0, 36.0, 90.0, 382.0, 212.0, 60.0, 43.0, 15.0, 18.0, 12.0, 6.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0318603515625, -7.719970703125, -7.4080810546875, -7.09619140625, -6.7843017578125, -6.472412109375, -6.1605224609375, -5.8486328125, -5.5367431640625, -5.224853515625, -4.9129638671875, -4.60107421875, -4.2891845703125, -3.977294921875, -3.6654052734375, -3.353515625, -3.0416259765625, -2.729736328125, -2.4178466796875, -2.10595703125, -1.7940673828125, -1.482177734375, -1.1702880859375, -0.8583984375, -0.5465087890625, -0.234619140625, 0.0772705078125, 0.38916015625, 0.7010498046875, 1.012939453125, 1.3248291015625, 1.63671875, 1.9486083984375, 2.260498046875, 2.5723876953125, 2.88427734375, 3.1961669921875, 3.508056640625, 3.8199462890625, 4.1318359375, 4.4437255859375, 4.755615234375, 5.0675048828125, 5.37939453125, 5.6912841796875, 6.003173828125, 6.3150634765625, 6.626953125, 6.9388427734375, 7.250732421875, 7.5626220703125, 7.87451171875, 8.1864013671875, 8.498291015625, 8.8101806640625, 9.1220703125, 9.4339599609375, 9.745849609375, 10.0577392578125, 10.36962890625, 10.6815185546875, 10.993408203125, 11.3052978515625, 11.6171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 5.0, 7.0, 12.0, 13.0, 11.0, 15.0, 19.0, 15.0, 50.0, 84.0, 137.0, 447.0, 1712.0, 12632.0, 1009161.0, 21154.0, 2093.0, 509.0, 176.0, 101.0, 59.0, 32.0, 21.0, 14.0, 15.0, 17.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-141.375, -137.2861328125, -133.197265625, -129.1083984375, -125.01953125, -120.9306640625, -116.841796875, -112.7529296875, -108.6640625, -104.5751953125, -100.486328125, -96.3974609375, -92.30859375, -88.2197265625, -84.130859375, -80.0419921875, -75.953125, -71.8642578125, -67.775390625, -63.6865234375, -59.59765625, -55.5087890625, -51.419921875, -47.3310546875, -43.2421875, -39.1533203125, -35.064453125, -30.9755859375, -26.88671875, -22.7978515625, -18.708984375, -14.6201171875, -10.53125, -6.4423828125, -2.353515625, 1.7353515625, 5.82421875, 9.9130859375, 14.001953125, 18.0908203125, 22.1796875, 26.2685546875, 30.357421875, 34.4462890625, 38.53515625, 42.6240234375, 46.712890625, 50.8017578125, 54.890625, 58.9794921875, 63.068359375, 67.1572265625, 71.24609375, 75.3349609375, 79.423828125, 83.5126953125, 87.6015625, 91.6904296875, 95.779296875, 99.8681640625, 103.95703125, 108.0458984375, 112.134765625, 116.2236328125, 120.3125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 16.0, 18.0, 37.0, 73.0, 111.0, 245.0, 215.0, 111.0, 64.0, 32.0, 29.0, 13.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.527434349060059, -13.045394897460938, -12.563356399536133, -12.081316947937012, -11.599278450012207, -11.117238998413086, -10.635200500488281, -10.15316104888916, -9.671121597290039, -9.189082145690918, -8.707043647766113, -8.225004196166992, -7.7429656982421875, -7.260926246643066, -6.7788872718811035, -6.296848297119141, -5.814809799194336, -5.332770824432373, -4.85073184967041, -4.368692398071289, -3.8866536617279053, -3.4046146869659424, -2.9225754737854004, -2.4405364990234375, -1.9584975242614746, -1.4764585494995117, -0.9944194555282593, -0.5123803615570068, -0.030341386795043945, 0.45169758796691895, 0.9337368011474609, 1.4157757759094238, 1.8978157043457031, 2.379854679107666, 2.861893653869629, 3.343932867050171, 3.825971841812134, 4.308011054992676, 4.790050029754639, 5.272089004516602, 5.7541279792785645, 6.236166954040527, 6.71820592880249, 7.200244903564453, 7.682284355163574, 8.164322853088379, 8.6463623046875, 9.128400802612305, 9.610440254211426, 10.092479705810547, 10.574518203735352, 11.056557655334473, 11.538596153259277, 12.020635604858398, 12.502674102783203, 12.984713554382324, 13.466753005981445, 13.948792457580566, 14.430830955505371, 14.912870407104492, 15.394908905029297, 15.876948356628418, 16.35898780822754, 16.841026306152344, 17.32306480407715]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 13.0, 16.0, 24.0, 14.0, 19.0, 24.0, 28.0, 29.0, 29.0, 37.0, 42.0, 43.0, 39.0, 42.0, 44.0, 32.0, 44.0, 49.0, 45.0, 61.0, 35.0, 42.0, 28.0, 28.0, 23.0, 20.0, 13.0, 14.0, 19.0, 12.0, 9.0, 10.0, 8.0, 7.0, 5.0, 6.0, 4.0, 7.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.91430139541626, -7.684327602386475, -7.4543538093566895, -7.224379539489746, -6.994405746459961, -6.764431953430176, -6.534458160400391, -6.3044843673706055, -6.07451057434082, -5.844536781311035, -5.61456298828125, -5.384589195251465, -5.1546149253845215, -4.924641132354736, -4.694667339324951, -4.464693546295166, -4.234719276428223, -4.0047454833984375, -3.7747714519500732, -3.544797658920288, -3.314823865890503, -3.0848498344421387, -2.8548760414123535, -2.6249022483825684, -2.394928455352783, -2.164954662322998, -1.9349807500839233, -1.7050068378448486, -1.4750330448150635, -1.2450591325759888, -1.015085220336914, -0.7851114273071289, -0.5551376342773438, -0.3251637816429138, -0.0951898992061615, 0.13478398323059082, 0.36475783586502075, 0.5947316884994507, 0.8247056007385254, 1.0546793937683105, 1.2846533060073853, 1.51462721824646, 1.7446010112762451, 1.9745749235153198, 2.2045488357543945, 2.4345226287841797, 2.664496421813965, 2.89447021484375, 3.1244442462921143, 3.3544180393218994, 3.5843920707702637, 3.814365863800049, 4.044339656829834, 4.274313449859619, 4.5042877197265625, 4.734261512756348, 4.964235305786133, 5.194209098815918, 5.424182891845703, 5.654156684875488, 5.884130954742432, 6.114104747772217, 6.344078540802002, 6.574052333831787, 6.804026126861572]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 11.0, 10.0, 8.0, 11.0, 16.0, 17.0, 18.0, 20.0, 23.0, 19.0, 26.0, 32.0, 33.0, 40.0, 34.0, 47.0, 42.0, 41.0, 38.0, 46.0, 35.0, 37.0, 34.0, 40.0, 29.0, 30.0, 32.0, 24.0, 31.0, 26.0, 24.0, 24.0, 7.0, 13.0, 14.0, 10.0, 12.0, 3.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.82421875, -4.66864013671875, -4.5130615234375, -4.35748291015625, -4.201904296875, -4.04632568359375, -3.8907470703125, -3.73516845703125, -3.57958984375, -3.42401123046875, -3.2684326171875, -3.11285400390625, -2.957275390625, -2.80169677734375, -2.6461181640625, -2.49053955078125, -2.3349609375, -2.17938232421875, -2.0238037109375, -1.86822509765625, -1.712646484375, -1.55706787109375, -1.4014892578125, -1.24591064453125, -1.09033203125, -0.93475341796875, -0.7791748046875, -0.62359619140625, -0.468017578125, -0.31243896484375, -0.1568603515625, -0.00128173828125, 0.154296875, 0.30987548828125, 0.4654541015625, 0.62103271484375, 0.776611328125, 0.93218994140625, 1.0877685546875, 1.24334716796875, 1.39892578125, 1.55450439453125, 1.7100830078125, 1.86566162109375, 2.021240234375, 2.17681884765625, 2.3323974609375, 2.48797607421875, 2.6435546875, 2.79913330078125, 2.9547119140625, 3.11029052734375, 3.265869140625, 3.42144775390625, 3.5770263671875, 3.73260498046875, 3.88818359375, 4.04376220703125, 4.1993408203125, 4.35491943359375, 4.510498046875, 4.66607666015625, 4.8216552734375, 4.97723388671875, 5.1328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 8.0, 9.0, 12.0, 20.0, 33.0, 40.0, 57.0, 73.0, 97.0, 131.0, 181.0, 264.0, 324.0, 515.0, 697.0, 1019.0, 1520.0, 2266.0, 3592.0, 5797.0, 10543.0, 19890.0, 50151.0, 264947.0, 546203.0, 80121.0, 27019.0, 13097.0, 7180.0, 4302.0, 2811.0, 1614.0, 1209.0, 792.0, 596.0, 381.0, 287.0, 179.0, 170.0, 103.0, 81.0, 66.0, 44.0, 37.0, 21.0, 16.0, 12.0, 6.0, 10.0, 5.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.359375, -11.975341796875, -11.59130859375, -11.207275390625, -10.8232421875, -10.439208984375, -10.05517578125, -9.671142578125, -9.287109375, -8.903076171875, -8.51904296875, -8.135009765625, -7.7509765625, -7.366943359375, -6.98291015625, -6.598876953125, -6.21484375, -5.830810546875, -5.44677734375, -5.062744140625, -4.6787109375, -4.294677734375, -3.91064453125, -3.526611328125, -3.142578125, -2.758544921875, -2.37451171875, -1.990478515625, -1.6064453125, -1.222412109375, -0.83837890625, -0.454345703125, -0.0703125, 0.313720703125, 0.69775390625, 1.081787109375, 1.4658203125, 1.849853515625, 2.23388671875, 2.617919921875, 3.001953125, 3.385986328125, 3.77001953125, 4.154052734375, 4.5380859375, 4.922119140625, 5.30615234375, 5.690185546875, 6.07421875, 6.458251953125, 6.84228515625, 7.226318359375, 7.6103515625, 7.994384765625, 8.37841796875, 8.762451171875, 9.146484375, 9.530517578125, 9.91455078125, 10.298583984375, 10.6826171875, 11.066650390625, 11.45068359375, 11.834716796875, 12.21875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 7.0, 10.0, 7.0, 9.0, 12.0, 10.0, 11.0, 17.0, 23.0, 30.0, 22.0, 38.0, 31.0, 44.0, 59.0, 71.0, 106.0, 135.0, 263.0, 1381.0, 206.0, 105.0, 84.0, 55.0, 53.0, 44.0, 34.0, 35.0, 26.0, 20.0, 12.0, 17.0, 12.0, 9.0, 11.0, 4.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.28125, -19.6103515625, -18.939453125, -18.2685546875, -17.59765625, -16.9267578125, -16.255859375, -15.5849609375, -14.9140625, -14.2431640625, -13.572265625, -12.9013671875, -12.23046875, -11.5595703125, -10.888671875, -10.2177734375, -9.546875, -8.8759765625, -8.205078125, -7.5341796875, -6.86328125, -6.1923828125, -5.521484375, -4.8505859375, -4.1796875, -3.5087890625, -2.837890625, -2.1669921875, -1.49609375, -0.8251953125, -0.154296875, 0.5166015625, 1.1875, 1.8583984375, 2.529296875, 3.2001953125, 3.87109375, 4.5419921875, 5.212890625, 5.8837890625, 6.5546875, 7.2255859375, 7.896484375, 8.5673828125, 9.23828125, 9.9091796875, 10.580078125, 11.2509765625, 11.921875, 12.5927734375, 13.263671875, 13.9345703125, 14.60546875, 15.2763671875, 15.947265625, 16.6181640625, 17.2890625, 17.9599609375, 18.630859375, 19.3017578125, 19.97265625, 20.6435546875, 21.314453125, 21.9853515625, 22.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 2.0, 2.0, 5.0, 10.0, 11.0, 19.0, 25.0, 31.0, 35.0, 58.0, 77.0, 104.0, 210.0, 419.0, 929.0, 3537.0, 28912.0, 2674659.0, 418830.0, 14112.0, 2176.0, 707.0, 321.0, 155.0, 91.0, 67.0, 54.0, 38.0, 34.0, 23.0, 11.0, 18.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.59375, -49.67236328125, -47.7509765625, -45.82958984375, -43.908203125, -41.98681640625, -40.0654296875, -38.14404296875, -36.22265625, -34.30126953125, -32.3798828125, -30.45849609375, -28.537109375, -26.61572265625, -24.6943359375, -22.77294921875, -20.8515625, -18.93017578125, -17.0087890625, -15.08740234375, -13.166015625, -11.24462890625, -9.3232421875, -7.40185546875, -5.48046875, -3.55908203125, -1.6376953125, 0.28369140625, 2.205078125, 4.12646484375, 6.0478515625, 7.96923828125, 9.890625, 11.81201171875, 13.7333984375, 15.65478515625, 17.576171875, 19.49755859375, 21.4189453125, 23.34033203125, 25.26171875, 27.18310546875, 29.1044921875, 31.02587890625, 32.947265625, 34.86865234375, 36.7900390625, 38.71142578125, 40.6328125, 42.55419921875, 44.4755859375, 46.39697265625, 48.318359375, 50.23974609375, 52.1611328125, 54.08251953125, 56.00390625, 57.92529296875, 59.8466796875, 61.76806640625, 63.689453125, 65.61083984375, 67.5322265625, 69.45361328125, 71.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 80.0, 345.0, 435.0, 113.0, 27.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.848388671875, -251.2611083984375, -243.673828125, -236.0865478515625, -228.499267578125, -220.9119873046875, -213.32470703125, -205.7374267578125, -198.150146484375, -190.5628662109375, -182.9755859375, -175.3883056640625, -167.801025390625, -160.2137451171875, -152.62646484375, -145.0391845703125, -137.451904296875, -129.8646240234375, -122.27734375, -114.6900634765625, -107.102783203125, -99.5155029296875, -91.92822265625, -84.3409423828125, -76.753662109375, -69.1663818359375, -61.5791015625, -53.9918212890625, -46.404541015625, -38.8172607421875, -31.22998046875, -23.6427001953125, -16.055404663085938, -8.468124389648438, -0.8808441162109375, 6.7064361572265625, 14.293716430664062, 21.880996704101562, 29.468276977539062, 37.05555725097656, 44.64283752441406, 52.23011779785156, 59.81739807128906, 67.40467834472656, 74.99195861816406, 82.57923889160156, 90.16651916503906, 97.75379943847656, 105.34107971191406, 112.92835998535156, 120.51564025878906, 128.10292053222656, 135.69020080566406, 143.27748107910156, 150.86476135253906, 158.45204162597656, 166.03932189941406, 173.62660217285156, 181.21388244628906, 188.80116271972656, 196.38844299316406, 203.97572326660156, 211.56300354003906, 219.15028381347656, 226.73756408691406]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 12.0, 9.0, 7.0, 12.0, 11.0, 19.0, 24.0, 21.0, 32.0, 29.0, 25.0, 25.0, 33.0, 31.0, 40.0, 33.0, 35.0, 37.0, 51.0, 35.0, 40.0, 37.0, 42.0, 26.0, 41.0, 28.0, 31.0, 24.0, 29.0, 19.0, 29.0, 21.0, 16.0, 8.0, 21.0, 11.0, 8.0, 6.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-56.27058410644531, -54.56818771362305, -52.86579132080078, -51.16339111328125, -49.460994720458984, -47.75859832763672, -46.05620193481445, -44.35380554199219, -42.65140914916992, -40.949012756347656, -39.24661636352539, -37.544219970703125, -35.841819763183594, -34.13942337036133, -32.43702697753906, -30.734630584716797, -29.0322322845459, -27.329835891723633, -25.627437591552734, -23.92504119873047, -22.222644805908203, -20.520248413085938, -18.81785011291504, -17.115453720092773, -15.413056373596191, -13.71065902709961, -12.008262634277344, -10.305865287780762, -8.60346794128418, -6.901071548461914, -5.198674201965332, -3.4962778091430664, -1.7938804626464844, -0.091483473777771, 1.6109135150909424, 3.3133106231689453, 5.015707492828369, 6.718104362487793, 8.420501708984375, 10.12289810180664, 11.825295448303223, 13.527692794799805, 15.23008918762207, 16.93248748779297, 18.634883880615234, 20.3372802734375, 22.039676666259766, 23.74207305908203, 25.44447135925293, 27.146867752075195, 28.849266052246094, 30.55166244506836, 32.254058837890625, 33.95645523071289, 35.658851623535156, 37.36125183105469, 39.06364822387695, 40.76604461669922, 42.468441009521484, 44.17083740234375, 45.87323760986328, 47.57563400268555, 49.27803039550781, 50.98042678833008, 52.682823181152344]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 3.0, 9.0, 8.0, 13.0, 17.0, 14.0, 15.0, 20.0, 18.0, 15.0, 22.0, 26.0, 32.0, 35.0, 31.0, 38.0, 40.0, 43.0, 42.0, 40.0, 57.0, 46.0, 35.0, 36.0, 34.0, 35.0, 22.0, 27.0, 34.0, 19.0, 30.0, 11.0, 18.0, 27.0, 16.0, 8.0, 12.0, 10.0, 8.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.7235107421875, -4.556396484375, -4.3892822265625, -4.22216796875, -4.0550537109375, -3.887939453125, -3.7208251953125, -3.5537109375, -3.3865966796875, -3.219482421875, -3.0523681640625, -2.88525390625, -2.7181396484375, -2.551025390625, -2.3839111328125, -2.216796875, -2.0496826171875, -1.882568359375, -1.7154541015625, -1.54833984375, -1.3812255859375, -1.214111328125, -1.0469970703125, -0.8798828125, -0.7127685546875, -0.545654296875, -0.3785400390625, -0.21142578125, -0.0443115234375, 0.122802734375, 0.2899169921875, 0.45703125, 0.6241455078125, 0.791259765625, 0.9583740234375, 1.12548828125, 1.2926025390625, 1.459716796875, 1.6268310546875, 1.7939453125, 1.9610595703125, 2.128173828125, 2.2952880859375, 2.46240234375, 2.6295166015625, 2.796630859375, 2.9637451171875, 3.130859375, 3.2979736328125, 3.465087890625, 3.6322021484375, 3.79931640625, 3.9664306640625, 4.133544921875, 4.3006591796875, 4.4677734375, 4.6348876953125, 4.802001953125, 4.9691162109375, 5.13623046875, 5.3033447265625, 5.470458984375, 5.6375732421875, 5.8046875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 11.0, 7.0, 20.0, 23.0, 30.0, 43.0, 70.0, 85.0, 160.0, 241.0, 345.0, 617.0, 1025.0, 1758.0, 3231.0, 6336.0, 13990.0, 39965.0, 430359.0, 3292319.0, 337706.0, 38046.0, 13928.0, 6261.0, 3342.0, 1728.0, 1019.0, 609.0, 332.0, 237.0, 153.0, 85.0, 63.0, 44.0, 29.0, 13.0, 18.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.4208984375, -18.857421875, -18.2939453125, -17.73046875, -17.1669921875, -16.603515625, -16.0400390625, -15.4765625, -14.9130859375, -14.349609375, -13.7861328125, -13.22265625, -12.6591796875, -12.095703125, -11.5322265625, -10.96875, -10.4052734375, -9.841796875, -9.2783203125, -8.71484375, -8.1513671875, -7.587890625, -7.0244140625, -6.4609375, -5.8974609375, -5.333984375, -4.7705078125, -4.20703125, -3.6435546875, -3.080078125, -2.5166015625, -1.953125, -1.3896484375, -0.826171875, -0.2626953125, 0.30078125, 0.8642578125, 1.427734375, 1.9912109375, 2.5546875, 3.1181640625, 3.681640625, 4.2451171875, 4.80859375, 5.3720703125, 5.935546875, 6.4990234375, 7.0625, 7.6259765625, 8.189453125, 8.7529296875, 9.31640625, 9.8798828125, 10.443359375, 11.0068359375, 11.5703125, 12.1337890625, 12.697265625, 13.2607421875, 13.82421875, 14.3876953125, 14.951171875, 15.5146484375, 16.078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 12.0, 9.0, 11.0, 14.0, 13.0, 21.0, 38.0, 63.0, 97.0, 170.0, 366.0, 795.0, 1054.0, 679.0, 295.0, 153.0, 94.0, 48.0, 29.0, 29.0, 20.0, 10.0, 10.0, 9.0, 8.0, 9.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -21.08642578125, -20.4541015625, -19.82177734375, -19.189453125, -18.55712890625, -17.9248046875, -17.29248046875, -16.66015625, -16.02783203125, -15.3955078125, -14.76318359375, -14.130859375, -13.49853515625, -12.8662109375, -12.23388671875, -11.6015625, -10.96923828125, -10.3369140625, -9.70458984375, -9.072265625, -8.43994140625, -7.8076171875, -7.17529296875, -6.54296875, -5.91064453125, -5.2783203125, -4.64599609375, -4.013671875, -3.38134765625, -2.7490234375, -2.11669921875, -1.484375, -0.85205078125, -0.2197265625, 0.41259765625, 1.044921875, 1.67724609375, 2.3095703125, 2.94189453125, 3.57421875, 4.20654296875, 4.8388671875, 5.47119140625, 6.103515625, 6.73583984375, 7.3681640625, 8.00048828125, 8.6328125, 9.26513671875, 9.8974609375, 10.52978515625, 11.162109375, 11.79443359375, 12.4267578125, 13.05908203125, 13.69140625, 14.32373046875, 14.9560546875, 15.58837890625, 16.220703125, 16.85302734375, 17.4853515625, 18.11767578125, 18.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 23.0, 27.0, 68.0, 131.0, 272.0, 659.0, 1693.0, 4891.0, 18342.0, 126145.0, 3683125.0, 319751.0, 28330.0, 6977.0, 2276.0, 846.0, 365.0, 148.0, 82.0, 39.0, 21.0, 11.0, 9.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.08740234375, -33.8623046875, -32.63720703125, -31.412109375, -30.18701171875, -28.9619140625, -27.73681640625, -26.51171875, -25.28662109375, -24.0615234375, -22.83642578125, -21.611328125, -20.38623046875, -19.1611328125, -17.93603515625, -16.7109375, -15.48583984375, -14.2607421875, -13.03564453125, -11.810546875, -10.58544921875, -9.3603515625, -8.13525390625, -6.91015625, -5.68505859375, -4.4599609375, -3.23486328125, -2.009765625, -0.78466796875, 0.4404296875, 1.66552734375, 2.890625, 4.11572265625, 5.3408203125, 6.56591796875, 7.791015625, 9.01611328125, 10.2412109375, 11.46630859375, 12.69140625, 13.91650390625, 15.1416015625, 16.36669921875, 17.591796875, 18.81689453125, 20.0419921875, 21.26708984375, 22.4921875, 23.71728515625, 24.9423828125, 26.16748046875, 27.392578125, 28.61767578125, 29.8427734375, 31.06787109375, 32.29296875, 33.51806640625, 34.7431640625, 35.96826171875, 37.193359375, 38.41845703125, 39.6435546875, 40.86865234375, 42.09375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 27.0, 111.0, 336.0, 324.0, 133.0, 51.0, 13.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.24896240234375, -238.44882202148438, -231.648681640625, -224.84854125976562, -218.04840087890625, -211.24826049804688, -204.4481201171875, -197.6479949951172, -190.8478546142578, -184.04771423339844, -177.24757385253906, -170.4474334716797, -163.6472930908203, -156.84716796875, -150.04702758789062, -143.24688720703125, -136.44674682617188, -129.6466064453125, -122.84646606445312, -116.04632568359375, -109.2461929321289, -102.44605255126953, -95.64591217041016, -88.84577941894531, -82.04562377929688, -75.2454833984375, -68.44534301757812, -61.645206451416016, -54.845069885253906, -48.04492950439453, -41.244789123535156, -34.44465255737305, -27.644515991210938, -20.844377517700195, -14.044238090515137, -7.244098663330078, -0.44396018981933594, 6.356178283691406, 13.156318664550781, 19.95645523071289, 26.756595611572266, 33.55673599243164, 40.35687255859375, 47.157012939453125, 53.9571533203125, 60.75728988647461, 67.55743408203125, 74.3575668334961, 81.15770721435547, 87.95784759521484, 94.75798797607422, 101.55812072753906, 108.35826110839844, 115.15840148925781, 121.95854187011719, 128.75868225097656, 135.55882263183594, 142.3589630126953, 149.1591033935547, 155.95924377441406, 162.75938415527344, 169.55950927734375, 176.35964965820312, 183.1597900390625, 189.95993041992188]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 12.0, 6.0, 18.0, 5.0, 12.0, 18.0, 15.0, 27.0, 27.0, 28.0, 29.0, 32.0, 41.0, 48.0, 38.0, 42.0, 39.0, 47.0, 29.0, 50.0, 39.0, 37.0, 34.0, 36.0, 37.0, 32.0, 35.0, 20.0, 31.0, 23.0, 19.0, 18.0, 16.0, 9.0, 6.0, 3.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.95659637451172, -40.59119415283203, -39.22578811645508, -37.86038589477539, -36.4949836730957, -35.129581451416016, -33.76417541503906, -32.398773193359375, -31.033370971679688, -29.667966842651367, -28.30256462097168, -26.93716049194336, -25.571758270263672, -24.20635414123535, -22.84095001220703, -21.475547790527344, -20.110143661499023, -18.744739532470703, -17.379337310791016, -16.013933181762695, -14.648530960083008, -13.283126831054688, -11.917723655700684, -10.55232048034668, -9.186917304992676, -7.821514129638672, -6.456110954284668, -5.090707302093506, -3.725304126739502, -2.359900951385498, -0.9944972991943359, 0.37090587615966797, 1.7363090515136719, 3.101712226867676, 4.46711540222168, 5.832519054412842, 7.197922229766846, 8.563325881958008, 9.928729057312012, 11.294132232666016, 12.65953540802002, 14.024938583374023, 15.390341758728027, 16.75574493408203, 18.12114906311035, 19.48655128479004, 20.85195541381836, 22.217357635498047, 23.582761764526367, 24.948165893554688, 26.313568115234375, 27.678972244262695, 29.044374465942383, 30.409778594970703, 31.77518081665039, 33.140586853027344, 34.50598907470703, 35.87139129638672, 37.23679733276367, 38.60219955444336, 39.96760177612305, 41.333003997802734, 42.69841003417969, 44.063812255859375, 45.42921447753906]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 8.0, 7.0, 17.0, 15.0, 19.0, 17.0, 14.0, 23.0, 22.0, 25.0, 26.0, 36.0, 34.0, 44.0, 45.0, 40.0, 50.0, 50.0, 45.0, 51.0, 39.0, 36.0, 34.0, 22.0, 31.0, 39.0, 22.0, 32.0, 23.0, 10.0, 17.0, 17.0, 16.0, 15.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.42657470703125, -4.2554931640625, -4.08441162109375, -3.913330078125, -3.74224853515625, -3.5711669921875, -3.40008544921875, -3.22900390625, -3.05792236328125, -2.8868408203125, -2.71575927734375, -2.544677734375, -2.37359619140625, -2.2025146484375, -2.03143310546875, -1.8603515625, -1.68927001953125, -1.5181884765625, -1.34710693359375, -1.176025390625, -1.00494384765625, -0.8338623046875, -0.66278076171875, -0.49169921875, -0.32061767578125, -0.1495361328125, 0.02154541015625, 0.192626953125, 0.36370849609375, 0.5347900390625, 0.70587158203125, 0.876953125, 1.04803466796875, 1.2191162109375, 1.39019775390625, 1.561279296875, 1.73236083984375, 1.9034423828125, 2.07452392578125, 2.24560546875, 2.41668701171875, 2.5877685546875, 2.75885009765625, 2.929931640625, 3.10101318359375, 3.2720947265625, 3.44317626953125, 3.6142578125, 3.78533935546875, 3.9564208984375, 4.12750244140625, 4.298583984375, 4.46966552734375, 4.6407470703125, 4.81182861328125, 4.98291015625, 5.15399169921875, 5.3250732421875, 5.49615478515625, 5.667236328125, 5.83831787109375, 6.0093994140625, 6.18048095703125, 6.3515625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 10.0, 14.0, 20.0, 24.0, 46.0, 58.0, 78.0, 112.0, 138.0, 218.0, 312.0, 493.0, 775.0, 1101.0, 1780.0, 2781.0, 4496.0, 7457.0, 12494.0, 22096.0, 42138.0, 96348.0, 544265.0, 180636.0, 60112.0, 29609.0, 16093.0, 9358.0, 5577.0, 3544.0, 2182.0, 1319.0, 927.0, 630.0, 365.0, 275.0, 198.0, 140.0, 102.0, 78.0, 42.0, 25.0, 27.0, 22.0, 14.0, 6.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-20.171875, -19.5556640625, -18.939453125, -18.3232421875, -17.70703125, -17.0908203125, -16.474609375, -15.8583984375, -15.2421875, -14.6259765625, -14.009765625, -13.3935546875, -12.77734375, -12.1611328125, -11.544921875, -10.9287109375, -10.3125, -9.6962890625, -9.080078125, -8.4638671875, -7.84765625, -7.2314453125, -6.615234375, -5.9990234375, -5.3828125, -4.7666015625, -4.150390625, -3.5341796875, -2.91796875, -2.3017578125, -1.685546875, -1.0693359375, -0.453125, 0.1630859375, 0.779296875, 1.3955078125, 2.01171875, 2.6279296875, 3.244140625, 3.8603515625, 4.4765625, 5.0927734375, 5.708984375, 6.3251953125, 6.94140625, 7.5576171875, 8.173828125, 8.7900390625, 9.40625, 10.0224609375, 10.638671875, 11.2548828125, 11.87109375, 12.4873046875, 13.103515625, 13.7197265625, 14.3359375, 14.9521484375, 15.568359375, 16.1845703125, 16.80078125, 17.4169921875, 18.033203125, 18.6494140625, 19.265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 1.0, 3.0, 8.0, 6.0, 9.0, 10.0, 10.0, 5.0, 17.0, 12.0, 16.0, 19.0, 19.0, 31.0, 39.0, 25.0, 27.0, 51.0, 43.0, 39.0, 47.0, 31.0, 1056.0, 40.0, 34.0, 32.0, 32.0, 38.0, 25.0, 41.0, 23.0, 33.0, 29.0, 20.0, 24.0, 21.0, 17.0, 16.0, 11.0, 13.0, 15.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 4.0], "bins": [-4.80078125, -4.667205810546875, -4.53363037109375, -4.400054931640625, -4.2664794921875, -4.132904052734375, -3.99932861328125, -3.865753173828125, -3.732177734375, -3.598602294921875, -3.46502685546875, -3.331451416015625, -3.1978759765625, -3.064300537109375, -2.93072509765625, -2.797149658203125, -2.66357421875, -2.529998779296875, -2.39642333984375, -2.262847900390625, -2.1292724609375, -1.995697021484375, -1.86212158203125, -1.728546142578125, -1.594970703125, -1.461395263671875, -1.32781982421875, -1.194244384765625, -1.0606689453125, -0.927093505859375, -0.79351806640625, -0.659942626953125, -0.5263671875, -0.392791748046875, -0.25921630859375, -0.125640869140625, 0.0079345703125, 0.141510009765625, 0.27508544921875, 0.408660888671875, 0.542236328125, 0.675811767578125, 0.80938720703125, 0.942962646484375, 1.0765380859375, 1.210113525390625, 1.34368896484375, 1.477264404296875, 1.61083984375, 1.744415283203125, 1.87799072265625, 2.011566162109375, 2.1451416015625, 2.278717041015625, 2.41229248046875, 2.545867919921875, 2.679443359375, 2.813018798828125, 2.94659423828125, 3.080169677734375, 3.2137451171875, 3.347320556640625, 3.48089599609375, 3.614471435546875, 3.748046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 9.0, 11.0, 16.0, 18.0, 25.0, 34.0, 55.0, 62.0, 94.0, 140.0, 190.0, 281.0, 383.0, 568.0, 812.0, 1226.0, 1925.0, 3104.0, 5228.0, 9775.0, 20130.0, 61022.0, 1431395.0, 474495.0, 47339.0, 17377.0, 8451.0, 4684.0, 2890.0, 1744.0, 1089.0, 776.0, 556.0, 377.0, 238.0, 173.0, 118.0, 97.0, 51.0, 49.0, 39.0, 21.0, 17.0, 13.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-25.515625, -24.740234375, -23.96484375, -23.189453125, -22.4140625, -21.638671875, -20.86328125, -20.087890625, -19.3125, -18.537109375, -17.76171875, -16.986328125, -16.2109375, -15.435546875, -14.66015625, -13.884765625, -13.109375, -12.333984375, -11.55859375, -10.783203125, -10.0078125, -9.232421875, -8.45703125, -7.681640625, -6.90625, -6.130859375, -5.35546875, -4.580078125, -3.8046875, -3.029296875, -2.25390625, -1.478515625, -0.703125, 0.072265625, 0.84765625, 1.623046875, 2.3984375, 3.173828125, 3.94921875, 4.724609375, 5.5, 6.275390625, 7.05078125, 7.826171875, 8.6015625, 9.376953125, 10.15234375, 10.927734375, 11.703125, 12.478515625, 13.25390625, 14.029296875, 14.8046875, 15.580078125, 16.35546875, 17.130859375, 17.90625, 18.681640625, 19.45703125, 20.232421875, 21.0078125, 21.783203125, 22.55859375, 23.333984375, 24.109375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 16.0, 52.0, 133.0, 521.0, 130.0, 64.0, 23.0, 6.0, 4.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.3406982421875, -11.001708984375, -10.6627197265625, -10.32373046875, -9.9847412109375, -9.645751953125, -9.3067626953125, -8.9677734375, -8.6287841796875, -8.289794921875, -7.9508056640625, -7.61181640625, -7.2728271484375, -6.933837890625, -6.5948486328125, -6.255859375, -5.9168701171875, -5.577880859375, -5.2388916015625, -4.89990234375, -4.5609130859375, -4.221923828125, -3.8829345703125, -3.5439453125, -3.2049560546875, -2.865966796875, -2.5269775390625, -2.18798828125, -1.8489990234375, -1.510009765625, -1.1710205078125, -0.83203125, -0.4930419921875, -0.154052734375, 0.1849365234375, 0.52392578125, 0.8629150390625, 1.201904296875, 1.5408935546875, 1.8798828125, 2.2188720703125, 2.557861328125, 2.8968505859375, 3.23583984375, 3.5748291015625, 3.913818359375, 4.2528076171875, 4.591796875, 4.9307861328125, 5.269775390625, 5.6087646484375, 5.94775390625, 6.2867431640625, 6.625732421875, 6.9647216796875, 7.3037109375, 7.6427001953125, 7.981689453125, 8.3206787109375, 8.65966796875, 8.9986572265625, 9.337646484375, 9.6766357421875, 10.015625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 5.0, 9.0, 15.0, 17.0, 29.0, 31.0, 63.0, 135.0, 400.0, 1564.0, 11770.0, 1020983.0, 11206.0, 1603.0, 391.0, 116.0, 60.0, 35.0, 16.0, 13.0, 13.0, 12.0, 6.0, 11.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-125.3125, -121.0634765625, -116.814453125, -112.5654296875, -108.31640625, -104.0673828125, -99.818359375, -95.5693359375, -91.3203125, -87.0712890625, -82.822265625, -78.5732421875, -74.32421875, -70.0751953125, -65.826171875, -61.5771484375, -57.328125, -53.0791015625, -48.830078125, -44.5810546875, -40.33203125, -36.0830078125, -31.833984375, -27.5849609375, -23.3359375, -19.0869140625, -14.837890625, -10.5888671875, -6.33984375, -2.0908203125, 2.158203125, 6.4072265625, 10.65625, 14.9052734375, 19.154296875, 23.4033203125, 27.65234375, 31.9013671875, 36.150390625, 40.3994140625, 44.6484375, 48.8974609375, 53.146484375, 57.3955078125, 61.64453125, 65.8935546875, 70.142578125, 74.3916015625, 78.640625, 82.8896484375, 87.138671875, 91.3876953125, 95.63671875, 99.8857421875, 104.134765625, 108.3837890625, 112.6328125, 116.8818359375, 121.130859375, 125.3798828125, 129.62890625, 133.8779296875, 138.126953125, 142.3759765625, 146.625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 9.0, 25.0, 70.0, 324.0, 455.0, 93.0, 25.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.83820343017578, -39.603981018066406, -38.3697624206543, -37.13554000854492, -35.90131759643555, -34.66709518432617, -33.43287658691406, -32.19865417480469, -30.964431762695312, -29.73021125793457, -28.495988845825195, -27.261768341064453, -26.027545928955078, -24.793325424194336, -23.559104919433594, -22.32488250732422, -21.090662002563477, -19.856441497802734, -18.62221908569336, -17.387998580932617, -16.153776168823242, -14.9195556640625, -13.685334205627441, -12.451112747192383, -11.216891288757324, -9.982669830322266, -8.748448371887207, -7.514227390289307, -6.280005931854248, -5.0457844734191895, -3.811563491821289, -2.5773420333862305, -1.3431205749511719, -0.10889923572540283, 1.1253221035003662, 2.3595433235168457, 3.5937647819519043, 4.827986240386963, 6.062207221984863, 7.296428680419922, 8.53065013885498, 9.764871597290039, 10.999093055725098, 12.233314514160156, 13.467535018920898, 14.701757431030273, 15.935977935791016, 17.17020034790039, 18.404420852661133, 19.638641357421875, 20.87286376953125, 22.107084274291992, 23.341306686401367, 24.57552719116211, 25.809749603271484, 27.043970108032227, 28.27819061279297, 29.51241111755371, 30.746633529663086, 31.980854034423828, 33.2150764465332, 34.44929885864258, 35.68351745605469, 36.91773986816406, 38.15196228027344]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 6.0, 6.0, 14.0, 13.0, 6.0, 21.0, 24.0, 18.0, 21.0, 29.0, 28.0, 30.0, 19.0, 29.0, 42.0, 35.0, 45.0, 36.0, 37.0, 41.0, 39.0, 33.0, 45.0, 40.0, 27.0, 33.0, 45.0, 39.0, 24.0, 12.0, 22.0, 23.0, 21.0, 10.0, 11.0, 14.0, 7.0, 9.0, 11.0, 5.0, 3.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-6.155326843261719, -5.963757038116455, -5.77218770980835, -5.580617904663086, -5.3890485763549805, -5.197478771209717, -5.005909442901611, -4.814339637756348, -4.622770309448242, -4.4312005043029785, -4.239631175994873, -4.048061370849609, -3.856492042541504, -3.6649224758148193, -3.4733529090881348, -3.281783103942871, -3.0902135372161865, -2.898643970489502, -2.7070744037628174, -2.515504837036133, -2.3239352703094482, -2.1323657035827637, -1.9407960176467896, -1.749226450920105, -1.5576568841934204, -1.3660873174667358, -1.1745177507400513, -0.9829481244087219, -0.7913785576820374, -0.5998089909553528, -0.40823936462402344, -0.21666979789733887, -0.025100231170654297, 0.16646935045719147, 0.35803893208503723, 0.5496085286140442, 0.7411780953407288, 0.9327476620674133, 1.1243172883987427, 1.3158868551254272, 1.5074564218521118, 1.6990259885787964, 1.890595555305481, 2.082165241241455, 2.2737348079681396, 2.465304374694824, 2.656873941421509, 2.8484435081481934, 3.040013074874878, 3.2315826416015625, 3.423152208328247, 3.6147217750549316, 3.806291341781616, 3.997860908508301, 4.1894307136535645, 4.38100004196167, 4.572569847106934, 4.764139652252197, 4.955708980560303, 5.147278785705566, 5.338848114013672, 5.5304179191589355, 5.721987247467041, 5.913557052612305, 6.10512638092041]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 10.0, 12.0, 19.0, 10.0, 19.0, 26.0, 14.0, 17.0, 18.0, 26.0, 31.0, 30.0, 35.0, 35.0, 49.0, 57.0, 42.0, 54.0, 41.0, 46.0, 37.0, 32.0, 36.0, 34.0, 34.0, 20.0, 26.0, 25.0, 14.0, 22.0, 19.0, 18.0, 12.0, 7.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.536865234375, -4.36669921875, -4.196533203125, -4.0263671875, -3.856201171875, -3.68603515625, -3.515869140625, -3.345703125, -3.175537109375, -3.00537109375, -2.835205078125, -2.6650390625, -2.494873046875, -2.32470703125, -2.154541015625, -1.984375, -1.814208984375, -1.64404296875, -1.473876953125, -1.3037109375, -1.133544921875, -0.96337890625, -0.793212890625, -0.623046875, -0.452880859375, -0.28271484375, -0.112548828125, 0.0576171875, 0.227783203125, 0.39794921875, 0.568115234375, 0.73828125, 0.908447265625, 1.07861328125, 1.248779296875, 1.4189453125, 1.589111328125, 1.75927734375, 1.929443359375, 2.099609375, 2.269775390625, 2.43994140625, 2.610107421875, 2.7802734375, 2.950439453125, 3.12060546875, 3.290771484375, 3.4609375, 3.631103515625, 3.80126953125, 3.971435546875, 4.1416015625, 4.311767578125, 4.48193359375, 4.652099609375, 4.822265625, 4.992431640625, 5.16259765625, 5.332763671875, 5.5029296875, 5.673095703125, 5.84326171875, 6.013427734375, 6.18359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 19.0, 23.0, 29.0, 42.0, 50.0, 66.0, 97.0, 129.0, 189.0, 243.0, 374.0, 550.0, 760.0, 1186.0, 1831.0, 3056.0, 5048.0, 9091.0, 16814.0, 34421.0, 81751.0, 258111.0, 403688.0, 130604.0, 48781.0, 22580.0, 11689.0, 6638.0, 3738.0, 2399.0, 1483.0, 945.0, 617.0, 422.0, 322.0, 200.0, 138.0, 107.0, 97.0, 55.0, 39.0, 29.0, 28.0, 19.0, 14.0, 9.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.19921875, -6.96099853515625, -6.7227783203125, -6.48455810546875, -6.246337890625, -6.00811767578125, -5.7698974609375, -5.53167724609375, -5.29345703125, -5.05523681640625, -4.8170166015625, -4.57879638671875, -4.340576171875, -4.10235595703125, -3.8641357421875, -3.62591552734375, -3.3876953125, -3.14947509765625, -2.9112548828125, -2.67303466796875, -2.434814453125, -2.19659423828125, -1.9583740234375, -1.72015380859375, -1.48193359375, -1.24371337890625, -1.0054931640625, -0.76727294921875, -0.529052734375, -0.29083251953125, -0.0526123046875, 0.18560791015625, 0.423828125, 0.66204833984375, 0.9002685546875, 1.13848876953125, 1.376708984375, 1.61492919921875, 1.8531494140625, 2.09136962890625, 2.32958984375, 2.56781005859375, 2.8060302734375, 3.04425048828125, 3.282470703125, 3.52069091796875, 3.7589111328125, 3.99713134765625, 4.2353515625, 4.47357177734375, 4.7117919921875, 4.95001220703125, 5.188232421875, 5.42645263671875, 5.6646728515625, 5.90289306640625, 6.14111328125, 6.37933349609375, 6.6175537109375, 6.85577392578125, 7.093994140625, 7.33221435546875, 7.5704345703125, 7.80865478515625, 8.046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 7.0, 7.0, 10.0, 30.0, 21.0, 25.0, 32.0, 34.0, 36.0, 56.0, 59.0, 69.0, 97.0, 128.0, 317.0, 1418.0, 171.0, 90.0, 64.0, 57.0, 44.0, 44.0, 47.0, 25.0, 23.0, 25.0, 16.0, 10.0, 9.0, 11.0, 13.0, 4.0, 2.0, 4.0, 9.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-23.1875, -22.46630859375, -21.7451171875, -21.02392578125, -20.302734375, -19.58154296875, -18.8603515625, -18.13916015625, -17.41796875, -16.69677734375, -15.9755859375, -15.25439453125, -14.533203125, -13.81201171875, -13.0908203125, -12.36962890625, -11.6484375, -10.92724609375, -10.2060546875, -9.48486328125, -8.763671875, -8.04248046875, -7.3212890625, -6.60009765625, -5.87890625, -5.15771484375, -4.4365234375, -3.71533203125, -2.994140625, -2.27294921875, -1.5517578125, -0.83056640625, -0.109375, 0.61181640625, 1.3330078125, 2.05419921875, 2.775390625, 3.49658203125, 4.2177734375, 4.93896484375, 5.66015625, 6.38134765625, 7.1025390625, 7.82373046875, 8.544921875, 9.26611328125, 9.9873046875, 10.70849609375, 11.4296875, 12.15087890625, 12.8720703125, 13.59326171875, 14.314453125, 15.03564453125, 15.7568359375, 16.47802734375, 17.19921875, 17.92041015625, 18.6416015625, 19.36279296875, 20.083984375, 20.80517578125, 21.5263671875, 22.24755859375, 22.96875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 21.0, 31.0, 69.0, 180.0, 528.0, 2099.0, 92095.0, 3045063.0, 4299.0, 843.0, 250.0, 87.0, 45.0, 27.0, 18.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-177.75, -172.96875, -168.1875, -163.40625, -158.625, -153.84375, -149.0625, -144.28125, -139.5, -134.71875, -129.9375, -125.15625, -120.375, -115.59375, -110.8125, -106.03125, -101.25, -96.46875, -91.6875, -86.90625, -82.125, -77.34375, -72.5625, -67.78125, -63.0, -58.21875, -53.4375, -48.65625, -43.875, -39.09375, -34.3125, -29.53125, -24.75, -19.96875, -15.1875, -10.40625, -5.625, -0.84375, 3.9375, 8.71875, 13.5, 18.28125, 23.0625, 27.84375, 32.625, 37.40625, 42.1875, 46.96875, 51.75, 56.53125, 61.3125, 66.09375, 70.875, 75.65625, 80.4375, 85.21875, 90.0, 94.78125, 99.5625, 104.34375, 109.125, 113.90625, 118.6875, 123.46875, 128.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 29.0, 86.0, 221.0, 341.0, 200.0, 87.0, 28.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.52264404296875, -137.16053771972656, -132.79843139648438, -128.4363250732422, -124.07421875, -119.71211242675781, -115.35001373291016, -110.98790740966797, -106.62580108642578, -102.2636947631836, -97.9015884399414, -93.53948211669922, -89.17738342285156, -84.81527709960938, -80.45317077636719, -76.091064453125, -71.72895812988281, -67.36685180664062, -63.00474548339844, -58.642642974853516, -54.28053665161133, -49.91843032836914, -45.55632781982422, -41.19422149658203, -36.832115173339844, -32.470008850097656, -28.1079044342041, -23.745800018310547, -19.38369369506836, -15.021587371826172, -10.659482955932617, -6.2973785400390625, -1.9352569580078125, 2.4268484115600586, 6.78895378112793, 11.1510591506958, 15.513164520263672, 19.87527084350586, 24.237375259399414, 28.59947967529297, 32.961585998535156, 37.323692321777344, 41.68579864501953, 46.04790115356445, 50.41000747680664, 54.77211380004883, 59.13421630859375, 63.49632263183594, 67.85842895507812, 72.22053527832031, 76.5826416015625, 80.94474792480469, 85.30685424804688, 89.66896057128906, 94.03105926513672, 98.3931655883789, 102.7552719116211, 107.11737823486328, 111.47948455810547, 115.84159088134766, 120.20368957519531, 124.5657958984375, 128.9279022216797, 133.29000854492188, 137.65211486816406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 15.0, 14.0, 7.0, 10.0, 21.0, 17.0, 15.0, 19.0, 34.0, 33.0, 33.0, 37.0, 29.0, 33.0, 29.0, 40.0, 30.0, 46.0, 32.0, 37.0, 36.0, 32.0, 37.0, 36.0, 36.0, 21.0, 34.0, 25.0, 31.0, 27.0, 15.0, 14.0, 20.0, 13.0, 12.0, 16.0, 13.0, 6.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.63307189941406, -60.77549362182617, -58.917911529541016, -57.060333251953125, -55.20275115966797, -53.34517288208008, -51.48759460449219, -49.63001251220703, -47.77243423461914, -45.91485595703125, -44.057273864746094, -42.1996955871582, -40.34211730957031, -38.484535217285156, -36.626956939697266, -34.769378662109375, -32.91179656982422, -31.054216384887695, -29.196636199951172, -27.33905792236328, -25.481477737426758, -23.623897552490234, -21.766319274902344, -19.90873908996582, -18.051158905029297, -16.193578720092773, -14.335999488830566, -12.47842025756836, -10.620840072631836, -8.763259887695312, -6.9056806564331055, -5.048101425170898, -3.190521240234375, -1.3329415321350098, 0.5246381759643555, 2.3822178840637207, 4.239797592163086, 6.097377777099609, 7.954957008361816, 9.812536239624023, 11.670116424560547, 13.52769660949707, 15.385275840759277, 17.242855072021484, 19.100435256958008, 20.95801544189453, 22.815593719482422, 24.673173904418945, 26.53075408935547, 28.388334274291992, 30.245914459228516, 32.103492736816406, 33.96107482910156, 35.81865310668945, 37.676231384277344, 39.5338134765625, 41.39139175415039, 43.24897003173828, 45.10655212402344, 46.96413040161133, 48.82170867919922, 50.679290771484375, 52.536869049072266, 54.394447326660156, 56.25202941894531]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 11.0, 8.0, 19.0, 12.0, 22.0, 14.0, 23.0, 18.0, 22.0, 26.0, 28.0, 37.0, 29.0, 32.0, 43.0, 49.0, 45.0, 34.0, 53.0, 31.0, 42.0, 37.0, 34.0, 36.0, 30.0, 27.0, 22.0, 33.0, 22.0, 14.0, 18.0, 16.0, 23.0, 18.0, 7.0, 8.0, 11.0, 3.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.93438720703125, -4.7515869140625, -4.56878662109375, -4.385986328125, -4.20318603515625, -4.0203857421875, -3.83758544921875, -3.65478515625, -3.47198486328125, -3.2891845703125, -3.10638427734375, -2.923583984375, -2.74078369140625, -2.5579833984375, -2.37518310546875, -2.1923828125, -2.00958251953125, -1.8267822265625, -1.64398193359375, -1.461181640625, -1.27838134765625, -1.0955810546875, -0.91278076171875, -0.72998046875, -0.54718017578125, -0.3643798828125, -0.18157958984375, 0.001220703125, 0.18402099609375, 0.3668212890625, 0.54962158203125, 0.732421875, 0.91522216796875, 1.0980224609375, 1.28082275390625, 1.463623046875, 1.64642333984375, 1.8292236328125, 2.01202392578125, 2.19482421875, 2.37762451171875, 2.5604248046875, 2.74322509765625, 2.926025390625, 3.10882568359375, 3.2916259765625, 3.47442626953125, 3.6572265625, 3.84002685546875, 4.0228271484375, 4.20562744140625, 4.388427734375, 4.57122802734375, 4.7540283203125, 4.93682861328125, 5.11962890625, 5.30242919921875, 5.4852294921875, 5.66802978515625, 5.850830078125, 6.03363037109375, 6.2164306640625, 6.39923095703125, 6.58203125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 8.0, 11.0, 23.0, 21.0, 27.0, 50.0, 65.0, 84.0, 108.0, 166.0, 234.0, 319.0, 455.0, 681.0, 879.0, 1246.0, 1866.0, 2630.0, 4078.0, 6267.0, 10443.0, 19722.0, 50974.0, 241680.0, 1360900.0, 1960167.0, 394713.0, 76868.0, 25447.0, 12698.0, 7402.0, 4667.0, 2975.0, 2028.0, 1332.0, 888.0, 639.0, 450.0, 296.0, 230.0, 162.0, 107.0, 62.0, 67.0, 46.0, 32.0, 20.0, 9.0, 17.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8046875, -9.4996337890625, -9.194580078125, -8.8895263671875, -8.58447265625, -8.2794189453125, -7.974365234375, -7.6693115234375, -7.3642578125, -7.0592041015625, -6.754150390625, -6.4490966796875, -6.14404296875, -5.8389892578125, -5.533935546875, -5.2288818359375, -4.923828125, -4.6187744140625, -4.313720703125, -4.0086669921875, -3.70361328125, -3.3985595703125, -3.093505859375, -2.7884521484375, -2.4833984375, -2.1783447265625, -1.873291015625, -1.5682373046875, -1.26318359375, -0.9581298828125, -0.653076171875, -0.3480224609375, -0.04296875, 0.2620849609375, 0.567138671875, 0.8721923828125, 1.17724609375, 1.4822998046875, 1.787353515625, 2.0924072265625, 2.3974609375, 2.7025146484375, 3.007568359375, 3.3126220703125, 3.61767578125, 3.9227294921875, 4.227783203125, 4.5328369140625, 4.837890625, 5.1429443359375, 5.447998046875, 5.7530517578125, 6.05810546875, 6.3631591796875, 6.668212890625, 6.9732666015625, 7.2783203125, 7.5833740234375, 7.888427734375, 8.1934814453125, 8.49853515625, 8.8035888671875, 9.108642578125, 9.4136962890625, 9.71875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 2.0, 11.0, 5.0, 8.0, 11.0, 13.0, 14.0, 20.0, 28.0, 32.0, 61.0, 116.0, 169.0, 282.0, 496.0, 687.0, 712.0, 492.0, 321.0, 175.0, 105.0, 84.0, 58.0, 43.0, 25.0, 22.0, 11.0, 12.0, 8.0, 11.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.140625, -14.696533203125, -14.25244140625, -13.808349609375, -13.3642578125, -12.920166015625, -12.47607421875, -12.031982421875, -11.587890625, -11.143798828125, -10.69970703125, -10.255615234375, -9.8115234375, -9.367431640625, -8.92333984375, -8.479248046875, -8.03515625, -7.591064453125, -7.14697265625, -6.702880859375, -6.2587890625, -5.814697265625, -5.37060546875, -4.926513671875, -4.482421875, -4.038330078125, -3.59423828125, -3.150146484375, -2.7060546875, -2.261962890625, -1.81787109375, -1.373779296875, -0.9296875, -0.485595703125, -0.04150390625, 0.402587890625, 0.8466796875, 1.290771484375, 1.73486328125, 2.178955078125, 2.623046875, 3.067138671875, 3.51123046875, 3.955322265625, 4.3994140625, 4.843505859375, 5.28759765625, 5.731689453125, 6.17578125, 6.619873046875, 7.06396484375, 7.508056640625, 7.9521484375, 8.396240234375, 8.84033203125, 9.284423828125, 9.728515625, 10.172607421875, 10.61669921875, 11.060791015625, 11.5048828125, 11.948974609375, 12.39306640625, 12.837158203125, 13.28125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 10.0, 15.0, 29.0, 45.0, 50.0, 105.0, 137.0, 189.0, 314.0, 480.0, 738.0, 1232.0, 2215.0, 4150.0, 8818.0, 21260.0, 72136.0, 511546.0, 3043300.0, 425206.0, 64704.0, 20002.0, 8253.0, 3982.0, 2191.0, 1172.0, 690.0, 459.0, 278.0, 184.0, 122.0, 86.0, 57.0, 41.0, 29.0, 18.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.140625, -18.551025390625, -17.96142578125, -17.371826171875, -16.7822265625, -16.192626953125, -15.60302734375, -15.013427734375, -14.423828125, -13.834228515625, -13.24462890625, -12.655029296875, -12.0654296875, -11.475830078125, -10.88623046875, -10.296630859375, -9.70703125, -9.117431640625, -8.52783203125, -7.938232421875, -7.3486328125, -6.759033203125, -6.16943359375, -5.579833984375, -4.990234375, -4.400634765625, -3.81103515625, -3.221435546875, -2.6318359375, -2.042236328125, -1.45263671875, -0.863037109375, -0.2734375, 0.316162109375, 0.90576171875, 1.495361328125, 2.0849609375, 2.674560546875, 3.26416015625, 3.853759765625, 4.443359375, 5.032958984375, 5.62255859375, 6.212158203125, 6.8017578125, 7.391357421875, 7.98095703125, 8.570556640625, 9.16015625, 9.749755859375, 10.33935546875, 10.928955078125, 11.5185546875, 12.108154296875, 12.69775390625, 13.287353515625, 13.876953125, 14.466552734375, 15.05615234375, 15.645751953125, 16.2353515625, 16.824951171875, 17.41455078125, 18.004150390625, 18.59375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 35.0, 135.0, 423.0, 298.0, 85.0, 22.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-335.96075439453125, -327.9210510253906, -319.88134765625, -311.8416748046875, -303.8019714355469, -295.76226806640625, -287.72259521484375, -279.6828918457031, -271.6431884765625, -263.6034851074219, -255.5637969970703, -247.52410888671875, -239.48440551757812, -231.4447021484375, -223.40501403808594, -215.36532592773438, -207.32562255859375, -199.28591918945312, -191.24623107910156, -183.20654296875, -175.16683959960938, -167.12713623046875, -159.0874481201172, -151.04776000976562, -143.008056640625, -134.96835327148438, -126.92866516113281, -118.88896942138672, -110.84927368164062, -102.80957794189453, -94.76988220214844, -86.73018646240234, -78.69050598144531, -70.65081024169922, -62.611114501953125, -54.57141876220703, -46.53172302246094, -38.492027282714844, -30.45233154296875, -22.412635803222656, -14.372940063476562, -6.333244323730469, 1.706451416015625, 9.746147155761719, 17.785842895507812, 25.825538635253906, 33.865234375, 41.904930114746094, 49.94462585449219, 57.98432159423828, 66.02401733398438, 74.06371307373047, 82.10340881347656, 90.14310455322266, 98.18280029296875, 106.22249603271484, 114.26219177246094, 122.30188751220703, 130.34158325195312, 138.38128662109375, 146.4209747314453, 154.46066284179688, 162.5003662109375, 170.54006958007812, 178.5797576904297]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 8.0, 9.0, 15.0, 20.0, 12.0, 22.0, 16.0, 22.0, 34.0, 31.0, 31.0, 34.0, 36.0, 33.0, 42.0, 43.0, 43.0, 34.0, 46.0, 40.0, 41.0, 42.0, 43.0, 41.0, 38.0, 27.0, 24.0, 27.0, 17.0, 17.0, 16.0, 19.0, 14.0, 6.0, 11.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.966026306152344, -38.600746154785156, -37.235469818115234, -35.87018966674805, -34.504913330078125, -33.13963317871094, -31.774354934692383, -30.409076690673828, -29.043798446655273, -27.67852020263672, -26.313241958618164, -24.94796371459961, -23.582683563232422, -22.2174072265625, -20.852127075195312, -19.486848831176758, -18.121570587158203, -16.75629234313965, -15.391014099121094, -14.025734901428223, -12.660456657409668, -11.295178413391113, -9.929899215698242, -8.564620971679688, -7.199342727661133, -5.834064483642578, -4.468785762786865, -3.1035070419311523, -1.7382287979125977, -0.37295055389404297, 0.9923286437988281, 2.357606887817383, 3.722881317138672, 5.088159561157227, 6.4534382820129395, 7.818717002868652, 9.183995246887207, 10.549273490905762, 11.914552688598633, 13.279830932617188, 14.645109176635742, 16.010387420654297, 17.37566566467285, 18.740943908691406, 20.106224060058594, 21.471500396728516, 22.836780548095703, 24.202058792114258, 25.567337036132812, 26.932615280151367, 28.297893524169922, 29.66317367553711, 31.02845001220703, 32.39373016357422, 33.759010314941406, 35.12428665161133, 36.48956298828125, 37.85484313964844, 39.22011947631836, 40.58539962768555, 41.95067596435547, 43.315956115722656, 44.681236267089844, 46.046512603759766, 47.41179275512695]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 10.0, 14.0, 10.0, 12.0, 15.0, 28.0, 24.0, 24.0, 23.0, 22.0, 35.0, 37.0, 34.0, 41.0, 44.0, 56.0, 51.0, 50.0, 45.0, 38.0, 39.0, 31.0, 49.0, 27.0, 25.0, 34.0, 29.0, 20.0, 15.0, 12.0, 20.0, 15.0, 18.0, 13.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.5731201171875, -5.376708984375, -5.1802978515625, -4.98388671875, -4.7874755859375, -4.591064453125, -4.3946533203125, -4.1982421875, -4.0018310546875, -3.805419921875, -3.6090087890625, -3.41259765625, -3.2161865234375, -3.019775390625, -2.8233642578125, -2.626953125, -2.4305419921875, -2.234130859375, -2.0377197265625, -1.84130859375, -1.6448974609375, -1.448486328125, -1.2520751953125, -1.0556640625, -0.8592529296875, -0.662841796875, -0.4664306640625, -0.27001953125, -0.0736083984375, 0.122802734375, 0.3192138671875, 0.515625, 0.7120361328125, 0.908447265625, 1.1048583984375, 1.30126953125, 1.4976806640625, 1.694091796875, 1.8905029296875, 2.0869140625, 2.2833251953125, 2.479736328125, 2.6761474609375, 2.87255859375, 3.0689697265625, 3.265380859375, 3.4617919921875, 3.658203125, 3.8546142578125, 4.051025390625, 4.2474365234375, 4.44384765625, 4.6402587890625, 4.836669921875, 5.0330810546875, 5.2294921875, 5.4259033203125, 5.622314453125, 5.8187255859375, 6.01513671875, 6.2115478515625, 6.407958984375, 6.6043701171875, 6.80078125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 16.0, 19.0, 35.0, 51.0, 72.0, 79.0, 152.0, 229.0, 308.0, 423.0, 701.0, 941.0, 1624.0, 2652.0, 5013.0, 11095.0, 28341.0, 79143.0, 242806.0, 416950.0, 164109.0, 54927.0, 20218.0, 8309.0, 4023.0, 2177.0, 1355.0, 898.0, 623.0, 406.0, 255.0, 182.0, 113.0, 99.0, 60.0, 40.0, 36.0, 23.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.263671875, -3.1627197265625, -3.061767578125, -2.9608154296875, -2.85986328125, -2.7589111328125, -2.657958984375, -2.5570068359375, -2.4560546875, -2.3551025390625, -2.254150390625, -2.1531982421875, -2.05224609375, -1.9512939453125, -1.850341796875, -1.7493896484375, -1.6484375, -1.5474853515625, -1.446533203125, -1.3455810546875, -1.24462890625, -1.1436767578125, -1.042724609375, -0.9417724609375, -0.8408203125, -0.7398681640625, -0.638916015625, -0.5379638671875, -0.43701171875, -0.3360595703125, -0.235107421875, -0.1341552734375, -0.033203125, 0.0677490234375, 0.168701171875, 0.2696533203125, 0.37060546875, 0.4715576171875, 0.572509765625, 0.6734619140625, 0.7744140625, 0.8753662109375, 0.976318359375, 1.0772705078125, 1.17822265625, 1.2791748046875, 1.380126953125, 1.4810791015625, 1.58203125, 1.6829833984375, 1.783935546875, 1.8848876953125, 1.98583984375, 2.0867919921875, 2.187744140625, 2.2886962890625, 2.3896484375, 2.4906005859375, 2.591552734375, 2.6925048828125, 2.79345703125, 2.8944091796875, 2.995361328125, 3.0963134765625, 3.197265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 14.0, 9.0, 13.0, 10.0, 18.0, 17.0, 9.0, 27.0, 25.0, 40.0, 31.0, 38.0, 43.0, 29.0, 46.0, 43.0, 36.0, 1071.0, 47.0, 43.0, 42.0, 37.0, 40.0, 45.0, 32.0, 28.0, 31.0, 30.0, 20.0, 16.0, 22.0, 13.0, 17.0, 13.0, 8.0, 2.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.075927734375, -4.92919921875, -4.782470703125, -4.6357421875, -4.489013671875, -4.34228515625, -4.195556640625, -4.048828125, -3.902099609375, -3.75537109375, -3.608642578125, -3.4619140625, -3.315185546875, -3.16845703125, -3.021728515625, -2.875, -2.728271484375, -2.58154296875, -2.434814453125, -2.2880859375, -2.141357421875, -1.99462890625, -1.847900390625, -1.701171875, -1.554443359375, -1.40771484375, -1.260986328125, -1.1142578125, -0.967529296875, -0.82080078125, -0.674072265625, -0.52734375, -0.380615234375, -0.23388671875, -0.087158203125, 0.0595703125, 0.206298828125, 0.35302734375, 0.499755859375, 0.646484375, 0.793212890625, 0.93994140625, 1.086669921875, 1.2333984375, 1.380126953125, 1.52685546875, 1.673583984375, 1.8203125, 1.967041015625, 2.11376953125, 2.260498046875, 2.4072265625, 2.553955078125, 2.70068359375, 2.847412109375, 2.994140625, 3.140869140625, 3.28759765625, 3.434326171875, 3.5810546875, 3.727783203125, 3.87451171875, 4.021240234375, 4.16796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 12.0, 16.0, 21.0, 22.0, 43.0, 65.0, 85.0, 136.0, 213.0, 356.0, 560.0, 1076.0, 2247.0, 5562.0, 18863.0, 96657.0, 1252175.0, 628116.0, 67900.0, 14266.0, 4467.0, 1959.0, 902.0, 533.0, 300.0, 190.0, 115.0, 77.0, 57.0, 38.0, 23.0, 14.0, 12.0, 16.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.87646484375, -2.7802734375, -2.68408203125, -2.587890625, -2.49169921875, -2.3955078125, -2.29931640625, -2.203125, -2.10693359375, -2.0107421875, -1.91455078125, -1.818359375, -1.72216796875, -1.6259765625, -1.52978515625, -1.43359375, -1.33740234375, -1.2412109375, -1.14501953125, -1.048828125, -0.95263671875, -0.8564453125, -0.76025390625, -0.6640625, -0.56787109375, -0.4716796875, -0.37548828125, -0.279296875, -0.18310546875, -0.0869140625, 0.00927734375, 0.10546875, 0.20166015625, 0.2978515625, 0.39404296875, 0.490234375, 0.58642578125, 0.6826171875, 0.77880859375, 0.875, 0.97119140625, 1.0673828125, 1.16357421875, 1.259765625, 1.35595703125, 1.4521484375, 1.54833984375, 1.64453125, 1.74072265625, 1.8369140625, 1.93310546875, 2.029296875, 2.12548828125, 2.2216796875, 2.31787109375, 2.4140625, 2.51025390625, 2.6064453125, 2.70263671875, 2.798828125, 2.89501953125, 2.9912109375, 3.08740234375, 3.18359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 9.0, 7.0, 15.0, 12.0, 10.0, 15.0, 19.0, 25.0, 32.0, 47.0, 61.0, 100.0, 213.0, 137.0, 65.0, 49.0, 34.0, 39.0, 23.0, 13.0, 9.0, 13.0, 10.0, 5.0, 6.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.4719505310058594, -0.45708465576171875, -0.4422187805175781, -0.4273529052734375, -0.4124870300292969, -0.39762115478515625, -0.3827552795410156, -0.367889404296875, -0.3530235290527344, -0.33815765380859375, -0.3232917785644531, -0.3084259033203125, -0.2935600280761719, -0.27869415283203125, -0.2638282775878906, -0.24896240234375, -0.23409652709960938, -0.21923065185546875, -0.20436477661132812, -0.1894989013671875, -0.17463302612304688, -0.15976715087890625, -0.14490127563476562, -0.130035400390625, -0.11516952514648438, -0.10030364990234375, -0.08543777465820312, -0.0705718994140625, -0.055706024169921875, -0.04084014892578125, -0.025974273681640625, -0.0111083984375, 0.003757476806640625, 0.01862335205078125, 0.033489227294921875, 0.0483551025390625, 0.06322097778320312, 0.07808685302734375, 0.09295272827148438, 0.107818603515625, 0.12268447875976562, 0.13755035400390625, 0.15241622924804688, 0.1672821044921875, 0.18214797973632812, 0.19701385498046875, 0.21187973022460938, 0.22674560546875, 0.24161148071289062, 0.25647735595703125, 0.2713432312011719, 0.2862091064453125, 0.3010749816894531, 0.31594085693359375, 0.3308067321777344, 0.345672607421875, 0.3605384826660156, 0.37540435791015625, 0.3902702331542969, 0.4051361083984375, 0.4200019836425781, 0.43486785888671875, 0.4497337341308594, 0.464599609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 12.0, 9.0, 13.0, 24.0, 21.0, 40.0, 60.0, 107.0, 184.0, 492.0, 6451.0, 967647.0, 71477.0, 1293.0, 306.0, 151.0, 70.0, 42.0, 29.0, 16.0, 18.0, 19.0, 9.0, 10.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.2398681640625, -7.971923828125, -7.7039794921875, -7.43603515625, -7.1680908203125, -6.900146484375, -6.6322021484375, -6.3642578125, -6.0963134765625, -5.828369140625, -5.5604248046875, -5.29248046875, -5.0245361328125, -4.756591796875, -4.4886474609375, -4.220703125, -3.9527587890625, -3.684814453125, -3.4168701171875, -3.14892578125, -2.8809814453125, -2.613037109375, -2.3450927734375, -2.0771484375, -1.8092041015625, -1.541259765625, -1.2733154296875, -1.00537109375, -0.7374267578125, -0.469482421875, -0.2015380859375, 0.06640625, 0.3343505859375, 0.602294921875, 0.8702392578125, 1.13818359375, 1.4061279296875, 1.674072265625, 1.9420166015625, 2.2099609375, 2.4779052734375, 2.745849609375, 3.0137939453125, 3.28173828125, 3.5496826171875, 3.817626953125, 4.0855712890625, 4.353515625, 4.6214599609375, 4.889404296875, 5.1573486328125, 5.42529296875, 5.6932373046875, 5.961181640625, 6.2291259765625, 6.4970703125, 6.7650146484375, 7.032958984375, 7.3009033203125, 7.56884765625, 7.8367919921875, 8.104736328125, 8.3726806640625, 8.640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 13.0, 40.0, 79.0, 195.0, 263.0, 222.0, 113.0, 55.0, 22.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0071334838867188, -0.9535536170005798, -0.8999736905097961, -0.8463938236236572, -0.7928138971328735, -0.7392340302467346, -0.6856541633605957, -0.632074236869812, -0.5784943103790283, -0.5249144434928894, -0.4713345170021057, -0.4177546501159668, -0.3641747236251831, -0.3105948567390442, -0.2570149600505829, -0.20343506336212158, -0.14985519647598267, -0.09627529978752136, -0.042695410549640656, 0.010884478688240051, 0.06446437537670135, 0.11804425716400146, 0.17162415385246277, 0.22520405054092407, 0.2787839472293854, 0.3323638439178467, 0.385943740606308, 0.4395236372947693, 0.4931035041809082, 0.5466834306716919, 0.6002632975578308, 0.6538431644439697, 0.7074230909347534, 0.7610029578208923, 0.814582884311676, 0.8681627511978149, 0.9217426776885986, 0.9753225445747375, 1.0289024114608765, 1.0824823379516602, 1.1360622644424438, 1.1896421909332275, 1.2432219982147217, 1.2968019247055054, 1.350381851196289, 1.4039616584777832, 1.457541584968567, 1.5111215114593506, 1.5647013187408447, 1.6182812452316284, 1.6718610525131226, 1.7254409790039062, 1.77902090549469, 1.8326008319854736, 1.8861806392669678, 1.9397605657577515, 1.9933404922485352, 2.0469202995300293, 2.1005003452301025, 2.1540801525115967, 2.207659959793091, 2.261240005493164, 2.314819812774658, 2.3683996200561523, 2.4219796657562256]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 9.0, 13.0, 17.0, 22.0, 25.0, 29.0, 32.0, 28.0, 32.0, 31.0, 38.0, 39.0, 38.0, 43.0, 40.0, 43.0, 57.0, 38.0, 40.0, 43.0, 49.0, 33.0, 40.0, 26.0, 22.0, 20.0, 17.0, 20.0, 20.0, 16.0, 8.0, 9.0, 3.0, 6.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3933756351470947, -0.38143232464790344, -0.36948901414871216, -0.35754573345184326, -0.345602422952652, -0.3336591124534607, -0.3217158317565918, -0.3097725212574005, -0.29782921075820923, -0.28588590025901794, -0.27394258975982666, -0.26199930906295776, -0.2500559985637665, -0.2381126880645752, -0.2261693924665451, -0.21422609686851501, -0.20228278636932373, -0.19033947587013245, -0.17839618027210236, -0.16645288467407227, -0.15450957417488098, -0.1425662636756897, -0.1306229680776596, -0.11867966502904892, -0.10673636198043823, -0.09479305893182755, -0.08284975588321686, -0.07090645283460617, -0.05896314978599548, -0.047019846737384796, -0.03507654368877411, -0.02313324064016342, -0.011189937591552734, 0.0007533654570579529, 0.01269666850566864, 0.024639971554279327, 0.036583274602890015, 0.0485265776515007, 0.06046988070011139, 0.07241318374872208, 0.08435648679733276, 0.09629978984594345, 0.10824309289455414, 0.12018639594316483, 0.1321296989917755, 0.1440730094909668, 0.1560163050889969, 0.16795960068702698, 0.17990291118621826, 0.19184622168540955, 0.20378951728343964, 0.21573281288146973, 0.227676123380661, 0.2396194338798523, 0.2515627145767212, 0.2635060250759125, 0.27544933557510376, 0.28739264607429504, 0.29933595657348633, 0.3112792372703552, 0.3232225477695465, 0.3351658582687378, 0.3471091389656067, 0.359052449464798, 0.37099575996398926]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 8.0, 8.0, 4.0, 13.0, 12.0, 16.0, 23.0, 29.0, 20.0, 26.0, 33.0, 29.0, 42.0, 26.0, 47.0, 49.0, 43.0, 37.0, 52.0, 54.0, 29.0, 43.0, 35.0, 27.0, 39.0, 24.0, 31.0, 27.0, 16.0, 32.0, 15.0, 15.0, 16.0, 20.0, 16.0, 14.0, 5.0, 2.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.31964111328125, -5.1275634765625, -4.93548583984375, -4.743408203125, -4.55133056640625, -4.3592529296875, -4.16717529296875, -3.97509765625, -3.78302001953125, -3.5909423828125, -3.39886474609375, -3.206787109375, -3.01470947265625, -2.8226318359375, -2.63055419921875, -2.4384765625, -2.24639892578125, -2.0543212890625, -1.86224365234375, -1.670166015625, -1.47808837890625, -1.2860107421875, -1.09393310546875, -0.90185546875, -0.70977783203125, -0.5177001953125, -0.32562255859375, -0.133544921875, 0.05853271484375, 0.2506103515625, 0.44268798828125, 0.634765625, 0.82684326171875, 1.0189208984375, 1.21099853515625, 1.403076171875, 1.59515380859375, 1.7872314453125, 1.97930908203125, 2.17138671875, 2.36346435546875, 2.5555419921875, 2.74761962890625, 2.939697265625, 3.13177490234375, 3.3238525390625, 3.51593017578125, 3.7080078125, 3.90008544921875, 4.0921630859375, 4.28424072265625, 4.476318359375, 4.66839599609375, 4.8604736328125, 5.05255126953125, 5.24462890625, 5.43670654296875, 5.6287841796875, 5.82086181640625, 6.012939453125, 6.20501708984375, 6.3970947265625, 6.58917236328125, 6.78125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 12.0, 12.0, 27.0, 23.0, 53.0, 63.0, 73.0, 114.0, 157.0, 234.0, 393.0, 562.0, 899.0, 1374.0, 2242.0, 3727.0, 6216.0, 11309.0, 21033.0, 45567.0, 119477.0, 362080.0, 296458.0, 95287.0, 38057.0, 18496.0, 9989.0, 5557.0, 3302.0, 2037.0, 1260.0, 797.0, 527.0, 328.0, 237.0, 180.0, 118.0, 62.0, 44.0, 44.0, 41.0, 31.0, 14.0, 14.0, 9.0, 0.0, 4.0, 1.0], "bins": [-12.78125, -12.4439697265625, -12.106689453125, -11.7694091796875, -11.43212890625, -11.0948486328125, -10.757568359375, -10.4202880859375, -10.0830078125, -9.7457275390625, -9.408447265625, -9.0711669921875, -8.73388671875, -8.3966064453125, -8.059326171875, -7.7220458984375, -7.384765625, -7.0474853515625, -6.710205078125, -6.3729248046875, -6.03564453125, -5.6983642578125, -5.361083984375, -5.0238037109375, -4.6865234375, -4.3492431640625, -4.011962890625, -3.6746826171875, -3.33740234375, -3.0001220703125, -2.662841796875, -2.3255615234375, -1.98828125, -1.6510009765625, -1.313720703125, -0.9764404296875, -0.63916015625, -0.3018798828125, 0.035400390625, 0.3726806640625, 0.7099609375, 1.0472412109375, 1.384521484375, 1.7218017578125, 2.05908203125, 2.3963623046875, 2.733642578125, 3.0709228515625, 3.408203125, 3.7454833984375, 4.082763671875, 4.4200439453125, 4.75732421875, 5.0946044921875, 5.431884765625, 5.7691650390625, 6.1064453125, 6.4437255859375, 6.781005859375, 7.1182861328125, 7.45556640625, 7.7928466796875, 8.130126953125, 8.4674072265625, 8.8046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 8.0, 7.0, 19.0, 21.0, 21.0, 24.0, 27.0, 43.0, 43.0, 59.0, 68.0, 90.0, 112.0, 227.0, 1414.0, 260.0, 145.0, 83.0, 62.0, 45.0, 45.0, 28.0, 33.0, 37.0, 22.0, 21.0, 13.0, 14.0, 6.0, 8.0, 3.0, 5.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.625, -23.662109375, -22.69921875, -21.736328125, -20.7734375, -19.810546875, -18.84765625, -17.884765625, -16.921875, -15.958984375, -14.99609375, -14.033203125, -13.0703125, -12.107421875, -11.14453125, -10.181640625, -9.21875, -8.255859375, -7.29296875, -6.330078125, -5.3671875, -4.404296875, -3.44140625, -2.478515625, -1.515625, -0.552734375, 0.41015625, 1.373046875, 2.3359375, 3.298828125, 4.26171875, 5.224609375, 6.1875, 7.150390625, 8.11328125, 9.076171875, 10.0390625, 11.001953125, 11.96484375, 12.927734375, 13.890625, 14.853515625, 15.81640625, 16.779296875, 17.7421875, 18.705078125, 19.66796875, 20.630859375, 21.59375, 22.556640625, 23.51953125, 24.482421875, 25.4453125, 26.408203125, 27.37109375, 28.333984375, 29.296875, 30.259765625, 31.22265625, 32.185546875, 33.1484375, 34.111328125, 35.07421875, 36.037109375, 37.0]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 17.0, 28.0, 23.0, 78.0, 119.0, 237.0, 571.0, 1720.0, 9503.0, 2033407.0, 1088789.0, 8372.0, 1695.0, 569.0, 208.0, 128.0, 56.0, 24.0, 26.0, 20.0, 25.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-110.0625, -106.6201171875, -103.177734375, -99.7353515625, -96.29296875, -92.8505859375, -89.408203125, -85.9658203125, -82.5234375, -79.0810546875, -75.638671875, -72.1962890625, -68.75390625, -65.3115234375, -61.869140625, -58.4267578125, -54.984375, -51.5419921875, -48.099609375, -44.6572265625, -41.21484375, -37.7724609375, -34.330078125, -30.8876953125, -27.4453125, -24.0029296875, -20.560546875, -17.1181640625, -13.67578125, -10.2333984375, -6.791015625, -3.3486328125, 0.09375, 3.5361328125, 6.978515625, 10.4208984375, 13.86328125, 17.3056640625, 20.748046875, 24.1904296875, 27.6328125, 31.0751953125, 34.517578125, 37.9599609375, 41.40234375, 44.8447265625, 48.287109375, 51.7294921875, 55.171875, 58.6142578125, 62.056640625, 65.4990234375, 68.94140625, 72.3837890625, 75.826171875, 79.2685546875, 82.7109375, 86.1533203125, 89.595703125, 93.0380859375, 96.48046875, 99.9228515625, 103.365234375, 106.8076171875, 110.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 190.0, 804.0, 21.0, 1.0, 1.0, 3.0], "bins": [-1539.7672119140625, -1513.7623291015625, -1487.7574462890625, -1461.7525634765625, -1435.74755859375, -1409.74267578125, -1383.73779296875, -1357.73291015625, -1331.72802734375, -1305.72314453125, -1279.71826171875, -1253.71337890625, -1227.7083740234375, -1201.7034912109375, -1175.6986083984375, -1149.6937255859375, -1123.6888427734375, -1097.6839599609375, -1071.6790771484375, -1045.6741943359375, -1019.6692504882812, -993.664306640625, -967.659423828125, -941.654541015625, -915.6495971679688, -889.6447143554688, -863.6397705078125, -837.6348876953125, -811.6300048828125, -785.6251220703125, -759.6201782226562, -733.6152954101562, -707.6104125976562, -681.6055297851562, -655.6005859375, -629.595703125, -603.5908203125, -577.5859375, -551.5809936523438, -525.5761108398438, -499.57122802734375, -473.5663146972656, -447.5614318847656, -421.5565185546875, -395.5516357421875, -369.5467224121094, -343.54180908203125, -317.53692626953125, -291.53204345703125, -265.5271301269531, -239.52224731445312, -213.517333984375, -187.512451171875, -161.50753784179688, -135.5026397705078, -109.49774169921875, -83.49282836914062, -57.48793029785156, -31.483028411865234, -5.478126525878906, 20.526771545410156, 46.53167724609375, 72.53657531738281, 98.54147338867188, 124.54637145996094]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 3.0, 10.0, 16.0, 12.0, 16.0, 12.0, 15.0, 18.0, 24.0, 31.0, 23.0, 38.0, 33.0, 32.0, 40.0, 35.0, 49.0, 60.0, 39.0, 26.0, 55.0, 43.0, 50.0, 41.0, 33.0, 37.0, 41.0, 26.0, 21.0, 18.0, 25.0, 20.0, 12.0, 10.0, 5.0, 8.0, 11.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-82.3473129272461, -80.09688568115234, -77.8464584350586, -75.59603118896484, -73.3456039428711, -71.09517669677734, -68.8447494506836, -66.59432220458984, -64.3438949584961, -62.093467712402344, -59.843040466308594, -57.592613220214844, -55.342185974121094, -53.091758728027344, -50.841331481933594, -48.590904235839844, -46.340476989746094, -44.090049743652344, -41.839622497558594, -39.589195251464844, -37.338768005371094, -35.088340759277344, -32.837913513183594, -30.587486267089844, -28.337059020996094, -26.086631774902344, -23.836204528808594, -21.585777282714844, -19.335350036621094, -17.084922790527344, -14.834495544433594, -12.584068298339844, -10.333633422851562, -8.083206176757812, -5.8327789306640625, -3.5823516845703125, -1.3319244384765625, 0.9185028076171875, 3.1689300537109375, 5.4193572998046875, 7.6697845458984375, 9.920211791992188, 12.170639038085938, 14.421066284179688, 16.671493530273438, 18.921920776367188, 21.172348022460938, 23.422775268554688, 25.673202514648438, 27.923629760742188, 30.174057006835938, 32.42448425292969, 34.67491149902344, 36.92533874511719, 39.17576599121094, 41.42619323730469, 43.67662048339844, 45.92704772949219, 48.17747497558594, 50.42790222167969, 52.67832946777344, 54.92875671386719, 57.17918395996094, 59.42961120605469, 61.68003845214844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 17.0, 17.0, 18.0, 20.0, 24.0, 25.0, 28.0, 28.0, 38.0, 35.0, 42.0, 40.0, 48.0, 44.0, 44.0, 32.0, 46.0, 29.0, 56.0, 50.0, 36.0, 34.0, 20.0, 31.0, 23.0, 30.0, 21.0, 23.0, 18.0, 13.0, 5.0, 5.0, 8.0, 8.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.5596923828125, -5.338134765625, -5.1165771484375, -4.89501953125, -4.6734619140625, -4.451904296875, -4.2303466796875, -4.0087890625, -3.7872314453125, -3.565673828125, -3.3441162109375, -3.12255859375, -2.9010009765625, -2.679443359375, -2.4578857421875, -2.236328125, -2.0147705078125, -1.793212890625, -1.5716552734375, -1.35009765625, -1.1285400390625, -0.906982421875, -0.6854248046875, -0.4638671875, -0.2423095703125, -0.020751953125, 0.2008056640625, 0.42236328125, 0.6439208984375, 0.865478515625, 1.0870361328125, 1.30859375, 1.5301513671875, 1.751708984375, 1.9732666015625, 2.19482421875, 2.4163818359375, 2.637939453125, 2.8594970703125, 3.0810546875, 3.3026123046875, 3.524169921875, 3.7457275390625, 3.96728515625, 4.1888427734375, 4.410400390625, 4.6319580078125, 4.853515625, 5.0750732421875, 5.296630859375, 5.5181884765625, 5.73974609375, 5.9613037109375, 6.182861328125, 6.4044189453125, 6.6259765625, 6.8475341796875, 7.069091796875, 7.2906494140625, 7.51220703125, 7.7337646484375, 7.955322265625, 8.1768798828125, 8.3984375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 9.0, 20.0, 22.0, 31.0, 47.0, 78.0, 130.0, 225.0, 356.0, 589.0, 880.0, 1503.0, 2779.0, 5263.0, 10536.0, 24812.0, 99702.0, 1420023.0, 2400444.0, 168360.0, 31679.0, 12818.0, 5996.0, 3262.0, 1812.0, 1045.0, 649.0, 428.0, 277.0, 154.0, 128.0, 68.0, 39.0, 37.0, 25.0, 17.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.53125, -16.94921875, -16.3671875, -15.78515625, -15.203125, -14.62109375, -14.0390625, -13.45703125, -12.875, -12.29296875, -11.7109375, -11.12890625, -10.546875, -9.96484375, -9.3828125, -8.80078125, -8.21875, -7.63671875, -7.0546875, -6.47265625, -5.890625, -5.30859375, -4.7265625, -4.14453125, -3.5625, -2.98046875, -2.3984375, -1.81640625, -1.234375, -0.65234375, -0.0703125, 0.51171875, 1.09375, 1.67578125, 2.2578125, 2.83984375, 3.421875, 4.00390625, 4.5859375, 5.16796875, 5.75, 6.33203125, 6.9140625, 7.49609375, 8.078125, 8.66015625, 9.2421875, 9.82421875, 10.40625, 10.98828125, 11.5703125, 12.15234375, 12.734375, 13.31640625, 13.8984375, 14.48046875, 15.0625, 15.64453125, 16.2265625, 16.80859375, 17.390625, 17.97265625, 18.5546875, 19.13671875, 19.71875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 14.0, 17.0, 23.0, 29.0, 46.0, 51.0, 79.0, 117.0, 199.0, 400.0, 758.0, 955.0, 607.0, 321.0, 160.0, 76.0, 58.0, 39.0, 26.0, 22.0, 14.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.4375, -24.77294921875, -24.1083984375, -23.44384765625, -22.779296875, -22.11474609375, -21.4501953125, -20.78564453125, -20.12109375, -19.45654296875, -18.7919921875, -18.12744140625, -17.462890625, -16.79833984375, -16.1337890625, -15.46923828125, -14.8046875, -14.14013671875, -13.4755859375, -12.81103515625, -12.146484375, -11.48193359375, -10.8173828125, -10.15283203125, -9.48828125, -8.82373046875, -8.1591796875, -7.49462890625, -6.830078125, -6.16552734375, -5.5009765625, -4.83642578125, -4.171875, -3.50732421875, -2.8427734375, -2.17822265625, -1.513671875, -0.84912109375, -0.1845703125, 0.47998046875, 1.14453125, 1.80908203125, 2.4736328125, 3.13818359375, 3.802734375, 4.46728515625, 5.1318359375, 5.79638671875, 6.4609375, 7.12548828125, 7.7900390625, 8.45458984375, 9.119140625, 9.78369140625, 10.4482421875, 11.11279296875, 11.77734375, 12.44189453125, 13.1064453125, 13.77099609375, 14.435546875, 15.10009765625, 15.7646484375, 16.42919921875, 17.09375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 13.0, 24.0, 51.0, 63.0, 102.0, 207.0, 410.0, 799.0, 1648.0, 4178.0, 11848.0, 43938.0, 390650.0, 3479054.0, 213698.0, 31976.0, 9238.0, 3351.0, 1480.0, 717.0, 358.0, 197.0, 97.0, 68.0, 34.0, 22.0, 13.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.0, -26.97802734375, -25.9560546875, -24.93408203125, -23.912109375, -22.89013671875, -21.8681640625, -20.84619140625, -19.82421875, -18.80224609375, -17.7802734375, -16.75830078125, -15.736328125, -14.71435546875, -13.6923828125, -12.67041015625, -11.6484375, -10.62646484375, -9.6044921875, -8.58251953125, -7.560546875, -6.53857421875, -5.5166015625, -4.49462890625, -3.47265625, -2.45068359375, -1.4287109375, -0.40673828125, 0.615234375, 1.63720703125, 2.6591796875, 3.68115234375, 4.703125, 5.72509765625, 6.7470703125, 7.76904296875, 8.791015625, 9.81298828125, 10.8349609375, 11.85693359375, 12.87890625, 13.90087890625, 14.9228515625, 15.94482421875, 16.966796875, 17.98876953125, 19.0107421875, 20.03271484375, 21.0546875, 22.07666015625, 23.0986328125, 24.12060546875, 25.142578125, 26.16455078125, 27.1865234375, 28.20849609375, 29.23046875, 30.25244140625, 31.2744140625, 32.29638671875, 33.318359375, 34.34033203125, 35.3623046875, 36.38427734375, 37.40625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 13.0, 15.0, 41.0, 42.0, 93.0, 173.0, 218.0, 183.0, 100.0, 61.0, 32.0, 18.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.308170318603516, -54.06150436401367, -49.814842224121094, -45.56817626953125, -41.321510314941406, -37.07484817504883, -32.828182220458984, -28.581518173217773, -24.334854125976562, -20.08819007873535, -15.841525077819824, -11.594860076904297, -7.348196029663086, -3.101531982421875, 1.1451339721679688, 5.39179801940918, 9.63846206665039, 13.885126113891602, 18.131790161132812, 22.378456115722656, 26.625120162963867, 30.871784210205078, 35.11845016479492, 39.3651123046875, 43.611778259277344, 47.85844421386719, 52.105106353759766, 56.35177230834961, 60.59843444824219, 64.84510040283203, 69.09176635742188, 73.33843231201172, 77.5850830078125, 81.83174896240234, 86.07841491699219, 90.3250732421875, 94.57173919677734, 98.81840515136719, 103.06507110595703, 107.31173706054688, 111.55839538574219, 115.80506134033203, 120.05172729492188, 124.29838562011719, 128.54505920410156, 132.79171752929688, 137.03839111328125, 141.28504943847656, 145.53170776367188, 149.7783660888672, 154.02503967285156, 158.27169799804688, 162.51837158203125, 166.76502990722656, 171.01168823242188, 175.25836181640625, 179.50503540039062, 183.75169372558594, 187.9983673095703, 192.24502563476562, 196.49169921875, 200.7383575439453, 204.98501586914062, 209.231689453125, 213.4783477783203]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 6.0, 15.0, 8.0, 18.0, 17.0, 12.0, 16.0, 24.0, 22.0, 23.0, 39.0, 44.0, 38.0, 34.0, 29.0, 35.0, 48.0, 40.0, 51.0, 38.0, 36.0, 39.0, 34.0, 35.0, 34.0, 35.0, 26.0, 23.0, 17.0, 20.0, 22.0, 30.0, 11.0, 15.0, 10.0, 10.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.37556076049805, -50.801177978515625, -49.2267951965332, -47.65241241455078, -46.078033447265625, -44.5036506652832, -42.92926788330078, -41.35488510131836, -39.78050231933594, -38.206119537353516, -36.631736755371094, -35.05735397338867, -33.48297119140625, -31.90859031677246, -30.334209442138672, -28.75982666015625, -27.185443878173828, -25.611061096191406, -24.036678314208984, -22.462297439575195, -20.887914657592773, -19.31353187561035, -17.739151000976562, -16.16476821899414, -14.590385437011719, -13.016002655029297, -11.441620826721191, -9.867238998413086, -8.292856216430664, -6.7184739112854, -5.144091606140137, -3.5697097778320312, -1.9953269958496094, -0.4209446907043457, 1.153437614440918, 2.7278199195861816, 4.302202224731445, 5.876584529876709, 7.450966835021973, 9.025348663330078, 10.5997314453125, 12.174114227294922, 13.748496055603027, 15.322877883911133, 16.897260665893555, 18.471643447875977, 20.046024322509766, 21.620407104492188, 23.19478988647461, 24.76917266845703, 26.343555450439453, 27.917936325073242, 29.492319107055664, 31.066701889038086, 32.641082763671875, 34.2154655456543, 35.78984832763672, 37.36423110961914, 38.93861389160156, 40.512996673583984, 42.087379455566406, 43.66175842285156, 45.236141204833984, 46.810523986816406, 48.38490676879883]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 10.0, 8.0, 11.0, 9.0, 17.0, 21.0, 23.0, 31.0, 29.0, 35.0, 30.0, 39.0, 35.0, 28.0, 34.0, 48.0, 57.0, 37.0, 32.0, 34.0, 42.0, 38.0, 40.0, 41.0, 26.0, 31.0, 28.0, 26.0, 21.0, 18.0, 22.0, 15.0, 14.0, 11.0, 10.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53125, -5.333251953125, -5.13525390625, -4.937255859375, -4.7392578125, -4.541259765625, -4.34326171875, -4.145263671875, -3.947265625, -3.749267578125, -3.55126953125, -3.353271484375, -3.1552734375, -2.957275390625, -2.75927734375, -2.561279296875, -2.36328125, -2.165283203125, -1.96728515625, -1.769287109375, -1.5712890625, -1.373291015625, -1.17529296875, -0.977294921875, -0.779296875, -0.581298828125, -0.38330078125, -0.185302734375, 0.0126953125, 0.210693359375, 0.40869140625, 0.606689453125, 0.8046875, 1.002685546875, 1.20068359375, 1.398681640625, 1.5966796875, 1.794677734375, 1.99267578125, 2.190673828125, 2.388671875, 2.586669921875, 2.78466796875, 2.982666015625, 3.1806640625, 3.378662109375, 3.57666015625, 3.774658203125, 3.97265625, 4.170654296875, 4.36865234375, 4.566650390625, 4.7646484375, 4.962646484375, 5.16064453125, 5.358642578125, 5.556640625, 5.754638671875, 5.95263671875, 6.150634765625, 6.3486328125, 6.546630859375, 6.74462890625, 6.942626953125, 7.140625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 17.0, 17.0, 22.0, 33.0, 42.0, 67.0, 86.0, 126.0, 174.0, 274.0, 464.0, 716.0, 1157.0, 1973.0, 3882.0, 7820.0, 16549.0, 36443.0, 86278.0, 220071.0, 377060.0, 170295.0, 67986.0, 29413.0, 13250.0, 6460.0, 3313.0, 1750.0, 992.0, 621.0, 375.0, 248.0, 166.0, 108.0, 87.0, 59.0, 55.0, 24.0, 14.0, 9.0, 11.0, 5.0, 10.0, 5.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0], "bins": [-3.232421875, -3.13836669921875, -3.0443115234375, -2.95025634765625, -2.856201171875, -2.76214599609375, -2.6680908203125, -2.57403564453125, -2.47998046875, -2.38592529296875, -2.2918701171875, -2.19781494140625, -2.103759765625, -2.00970458984375, -1.9156494140625, -1.82159423828125, -1.7275390625, -1.63348388671875, -1.5394287109375, -1.44537353515625, -1.351318359375, -1.25726318359375, -1.1632080078125, -1.06915283203125, -0.97509765625, -0.88104248046875, -0.7869873046875, -0.69293212890625, -0.598876953125, -0.50482177734375, -0.4107666015625, -0.31671142578125, -0.22265625, -0.12860107421875, -0.0345458984375, 0.05950927734375, 0.153564453125, 0.24761962890625, 0.3416748046875, 0.43572998046875, 0.52978515625, 0.62384033203125, 0.7178955078125, 0.81195068359375, 0.906005859375, 1.00006103515625, 1.0941162109375, 1.18817138671875, 1.2822265625, 1.37628173828125, 1.4703369140625, 1.56439208984375, 1.658447265625, 1.75250244140625, 1.8465576171875, 1.94061279296875, 2.03466796875, 2.12872314453125, 2.2227783203125, 2.31683349609375, 2.410888671875, 2.50494384765625, 2.5989990234375, 2.69305419921875, 2.787109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 14.0, 5.0, 11.0, 10.0, 11.0, 12.0, 21.0, 18.0, 21.0, 26.0, 23.0, 23.0, 29.0, 31.0, 39.0, 30.0, 37.0, 38.0, 41.0, 1077.0, 51.0, 42.0, 41.0, 33.0, 44.0, 43.0, 31.0, 27.0, 26.0, 31.0, 25.0, 23.0, 13.0, 12.0, 15.0, 10.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.4029541015625, -4.255126953125, -4.1072998046875, -3.95947265625, -3.8116455078125, -3.663818359375, -3.5159912109375, -3.3681640625, -3.2203369140625, -3.072509765625, -2.9246826171875, -2.77685546875, -2.6290283203125, -2.481201171875, -2.3333740234375, -2.185546875, -2.0377197265625, -1.889892578125, -1.7420654296875, -1.59423828125, -1.4464111328125, -1.298583984375, -1.1507568359375, -1.0029296875, -0.8551025390625, -0.707275390625, -0.5594482421875, -0.41162109375, -0.2637939453125, -0.115966796875, 0.0318603515625, 0.1796875, 0.3275146484375, 0.475341796875, 0.6231689453125, 0.77099609375, 0.9188232421875, 1.066650390625, 1.2144775390625, 1.3623046875, 1.5101318359375, 1.657958984375, 1.8057861328125, 1.95361328125, 2.1014404296875, 2.249267578125, 2.3970947265625, 2.544921875, 2.6927490234375, 2.840576171875, 2.9884033203125, 3.13623046875, 3.2840576171875, 3.431884765625, 3.5797119140625, 3.7275390625, 3.8753662109375, 4.023193359375, 4.1710205078125, 4.31884765625, 4.4666748046875, 4.614501953125, 4.7623291015625, 4.91015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 5.0, 11.0, 13.0, 16.0, 24.0, 34.0, 50.0, 78.0, 144.0, 230.0, 335.0, 566.0, 956.0, 1815.0, 3430.0, 6937.0, 15399.0, 37702.0, 107564.0, 466267.0, 1155059.0, 197542.0, 59808.0, 22999.0, 9763.0, 4736.0, 2410.0, 1321.0, 721.0, 425.0, 284.0, 160.0, 137.0, 48.0, 45.0, 31.0, 13.0, 19.0, 8.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.938873291015625, -1.87872314453125, -1.818572998046875, -1.7584228515625, -1.698272705078125, -1.63812255859375, -1.577972412109375, -1.517822265625, -1.457672119140625, -1.39752197265625, -1.337371826171875, -1.2772216796875, -1.217071533203125, -1.15692138671875, -1.096771240234375, -1.03662109375, -0.976470947265625, -0.91632080078125, -0.856170654296875, -0.7960205078125, -0.735870361328125, -0.67572021484375, -0.615570068359375, -0.555419921875, -0.495269775390625, -0.43511962890625, -0.374969482421875, -0.3148193359375, -0.254669189453125, -0.19451904296875, -0.134368896484375, -0.07421875, -0.014068603515625, 0.04608154296875, 0.106231689453125, 0.1663818359375, 0.226531982421875, 0.28668212890625, 0.346832275390625, 0.406982421875, 0.467132568359375, 0.52728271484375, 0.587432861328125, 0.6475830078125, 0.707733154296875, 0.76788330078125, 0.828033447265625, 0.88818359375, 0.948333740234375, 1.00848388671875, 1.068634033203125, 1.1287841796875, 1.188934326171875, 1.24908447265625, 1.309234619140625, 1.369384765625, 1.429534912109375, 1.48968505859375, 1.549835205078125, 1.6099853515625, 1.670135498046875, 1.73028564453125, 1.790435791015625, 1.8505859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 5.0, 3.0, 2.0, 8.0, 5.0, 10.0, 15.0, 12.0, 14.0, 15.0, 23.0, 31.0, 39.0, 45.0, 76.0, 106.0, 116.0, 109.0, 80.0, 49.0, 44.0, 29.0, 22.0, 29.0, 28.0, 16.0, 11.0, 16.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.3499259948730469, -0.33632659912109375, -0.3227272033691406, -0.3091278076171875, -0.2955284118652344, -0.28192901611328125, -0.2683296203613281, -0.254730224609375, -0.24113082885742188, -0.22753143310546875, -0.21393203735351562, -0.2003326416015625, -0.18673324584960938, -0.17313385009765625, -0.15953445434570312, -0.14593505859375, -0.13233566284179688, -0.11873626708984375, -0.10513687133789062, -0.0915374755859375, -0.07793807983398438, -0.06433868408203125, -0.050739288330078125, -0.037139892578125, -0.023540496826171875, -0.00994110107421875, 0.003658294677734375, 0.0172576904296875, 0.030857086181640625, 0.04445648193359375, 0.058055877685546875, 0.0716552734375, 0.08525466918945312, 0.09885406494140625, 0.11245346069335938, 0.1260528564453125, 0.13965225219726562, 0.15325164794921875, 0.16685104370117188, 0.180450439453125, 0.19404983520507812, 0.20764923095703125, 0.22124862670898438, 0.2348480224609375, 0.24844741821289062, 0.26204681396484375, 0.2756462097167969, 0.28924560546875, 0.3028450012207031, 0.31644439697265625, 0.3300437927246094, 0.3436431884765625, 0.3572425842285156, 0.37084197998046875, 0.3844413757324219, 0.398040771484375, 0.4116401672363281, 0.42523956298828125, 0.4388389587402344, 0.4524383544921875, 0.4660377502441406, 0.47963714599609375, 0.4932365417480469, 0.5068359375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 10.0, 19.0, 24.0, 32.0, 25.0, 42.0, 81.0, 93.0, 147.0, 384.0, 2346.0, 54540.0, 963466.0, 25013.0, 1549.0, 302.0, 135.0, 79.0, 62.0, 42.0, 30.0, 21.0, 24.0, 14.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.984375, -8.744140625, -8.50390625, -8.263671875, -8.0234375, -7.783203125, -7.54296875, -7.302734375, -7.0625, -6.822265625, -6.58203125, -6.341796875, -6.1015625, -5.861328125, -5.62109375, -5.380859375, -5.140625, -4.900390625, -4.66015625, -4.419921875, -4.1796875, -3.939453125, -3.69921875, -3.458984375, -3.21875, -2.978515625, -2.73828125, -2.498046875, -2.2578125, -2.017578125, -1.77734375, -1.537109375, -1.296875, -1.056640625, -0.81640625, -0.576171875, -0.3359375, -0.095703125, 0.14453125, 0.384765625, 0.625, 0.865234375, 1.10546875, 1.345703125, 1.5859375, 1.826171875, 2.06640625, 2.306640625, 2.546875, 2.787109375, 3.02734375, 3.267578125, 3.5078125, 3.748046875, 3.98828125, 4.228515625, 4.46875, 4.708984375, 4.94921875, 5.189453125, 5.4296875, 5.669921875, 5.91015625, 6.150390625, 6.390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 23.0, 31.0, 46.0, 93.0, 106.0, 142.0, 142.0, 136.0, 122.0, 67.0, 44.0, 24.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5879830121994019, -1.5536115169525146, -1.519239902496338, -1.4848684072494507, -1.4504969120025635, -1.4161254167556763, -1.3817538022994995, -1.3473823070526123, -1.313010811805725, -1.278639316558838, -1.2442677021026611, -1.209896206855774, -1.1755247116088867, -1.1411532163619995, -1.1067816019058228, -1.0724101066589355, -1.0380384922027588, -1.0036669969558716, -0.9692954421043396, -0.9349238872528076, -0.9005523920059204, -0.8661808371543884, -0.8318092823028564, -0.7974377870559692, -0.763066291809082, -0.72869473695755, -0.6943232417106628, -0.6599516868591309, -0.6255801916122437, -0.5912086367607117, -0.5568370819091797, -0.5224655866622925, -0.4880940318107605, -0.4537225067615509, -0.4193509817123413, -0.3849794268608093, -0.3506079316139221, -0.31623637676239014, -0.28186485171318054, -0.24749332666397095, -0.21312180161476135, -0.17875027656555176, -0.14437875151634216, -0.11000721156597137, -0.07563568651676178, -0.041264161467552185, -0.0068926215171813965, 0.027478903532028198, 0.06185042858123779, 0.09622195363044739, 0.13059347867965698, 0.16496501863002777, 0.19933654367923737, 0.23370806872844696, 0.26807960867881775, 0.30245113372802734, 0.33682265877723694, 0.37119418382644653, 0.40556570887565613, 0.4399372339248657, 0.4743087887763977, 0.5086802840232849, 0.5430518388748169, 0.5774233341217041, 0.6117948889732361]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 8.0, 3.0, 10.0, 8.0, 8.0, 16.0, 16.0, 15.0, 20.0, 32.0, 42.0, 35.0, 39.0, 30.0, 38.0, 40.0, 42.0, 48.0, 44.0, 43.0, 38.0, 42.0, 49.0, 33.0, 38.0, 29.0, 25.0, 36.0, 26.0, 20.0, 21.0, 18.0, 21.0, 16.0, 9.0, 7.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4755464196205139, -0.4611012041568756, -0.4466559588909149, -0.4322107434272766, -0.4177654981613159, -0.4033202826976776, -0.3888750374317169, -0.3744298219680786, -0.3599845767021179, -0.3455393612384796, -0.3310941159725189, -0.3166489005088806, -0.3022036552429199, -0.2877584397792816, -0.2733131945133209, -0.2588679790496826, -0.24442274868488312, -0.22997751832008362, -0.21553228795528412, -0.20108705759048462, -0.18664182722568512, -0.17219659686088562, -0.15775138139724731, -0.14330613613128662, -0.12886092066764832, -0.11441569030284882, -0.09997045993804932, -0.08552522957324982, -0.07107999920845032, -0.056634776294231415, -0.042189545929431915, -0.027744315564632416, -0.01329907774925232, 0.0011461516842246056, 0.01559138111770153, 0.03003660961985588, 0.04448183998465538, 0.05892706662416458, 0.07337229698896408, 0.08781752735376358, 0.10226275771856308, 0.11670798808336258, 0.13115321099758148, 0.14559844136238098, 0.16004367172718048, 0.17448890209197998, 0.18893413245677948, 0.20337936282157898, 0.21782459318637848, 0.23226982355117798, 0.24671505391597748, 0.261160284280777, 0.2756054997444153, 0.290050745010376, 0.3044959604740143, 0.318941205739975, 0.3333864212036133, 0.3478316366672516, 0.3622768819332123, 0.3767220973968506, 0.3911673426628113, 0.4056125581264496, 0.4200578033924103, 0.4345030188560486, 0.4489482641220093]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 4.0, 10.0, 9.0, 13.0, 17.0, 18.0, 23.0, 23.0, 22.0, 28.0, 22.0, 36.0, 30.0, 36.0, 43.0, 39.0, 54.0, 32.0, 33.0, 43.0, 37.0, 32.0, 28.0, 44.0, 33.0, 39.0, 20.0, 24.0, 22.0, 24.0, 17.0, 22.0, 28.0, 12.0, 10.0, 12.0, 9.0, 4.0, 9.0, 4.0, 2.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.796875, -5.61517333984375, -5.4334716796875, -5.25177001953125, -5.070068359375, -4.88836669921875, -4.7066650390625, -4.52496337890625, -4.34326171875, -4.16156005859375, -3.9798583984375, -3.79815673828125, -3.616455078125, -3.43475341796875, -3.2530517578125, -3.07135009765625, -2.8896484375, -2.70794677734375, -2.5262451171875, -2.34454345703125, -2.162841796875, -1.98114013671875, -1.7994384765625, -1.61773681640625, -1.43603515625, -1.25433349609375, -1.0726318359375, -0.89093017578125, -0.709228515625, -0.52752685546875, -0.3458251953125, -0.16412353515625, 0.017578125, 0.19927978515625, 0.3809814453125, 0.56268310546875, 0.744384765625, 0.92608642578125, 1.1077880859375, 1.28948974609375, 1.47119140625, 1.65289306640625, 1.8345947265625, 2.01629638671875, 2.197998046875, 2.37969970703125, 2.5614013671875, 2.74310302734375, 2.9248046875, 3.10650634765625, 3.2882080078125, 3.46990966796875, 3.651611328125, 3.83331298828125, 4.0150146484375, 4.19671630859375, 4.37841796875, 4.56011962890625, 4.7418212890625, 4.92352294921875, 5.105224609375, 5.28692626953125, 5.4686279296875, 5.65032958984375, 5.83203125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 19.0, 22.0, 22.0, 31.0, 56.0, 78.0, 93.0, 142.0, 203.0, 269.0, 439.0, 567.0, 867.0, 1256.0, 1872.0, 3107.0, 5146.0, 9110.0, 17620.0, 38216.0, 101701.0, 389909.0, 318155.0, 88448.0, 33627.0, 15836.0, 8300.0, 4855.0, 2853.0, 1866.0, 1203.0, 813.0, 524.0, 384.0, 270.0, 190.0, 143.0, 93.0, 71.0, 43.0, 37.0, 26.0, 22.0, 10.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-12.9140625, -12.5096435546875, -12.105224609375, -11.7008056640625, -11.29638671875, -10.8919677734375, -10.487548828125, -10.0831298828125, -9.6787109375, -9.2742919921875, -8.869873046875, -8.4654541015625, -8.06103515625, -7.6566162109375, -7.252197265625, -6.8477783203125, -6.443359375, -6.0389404296875, -5.634521484375, -5.2301025390625, -4.82568359375, -4.4212646484375, -4.016845703125, -3.6124267578125, -3.2080078125, -2.8035888671875, -2.399169921875, -1.9947509765625, -1.59033203125, -1.1859130859375, -0.781494140625, -0.3770751953125, 0.02734375, 0.4317626953125, 0.836181640625, 1.2406005859375, 1.64501953125, 2.0494384765625, 2.453857421875, 2.8582763671875, 3.2626953125, 3.6671142578125, 4.071533203125, 4.4759521484375, 4.88037109375, 5.2847900390625, 5.689208984375, 6.0936279296875, 6.498046875, 6.9024658203125, 7.306884765625, 7.7113037109375, 8.11572265625, 8.5201416015625, 8.924560546875, 9.3289794921875, 9.7333984375, 10.1378173828125, 10.542236328125, 10.9466552734375, 11.35107421875, 11.7554931640625, 12.159912109375, 12.5643310546875, 12.96875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 10.0, 7.0, 12.0, 10.0, 26.0, 14.0, 19.0, 29.0, 24.0, 45.0, 42.0, 56.0, 74.0, 87.0, 143.0, 267.0, 1393.0, 182.0, 105.0, 87.0, 73.0, 55.0, 45.0, 22.0, 28.0, 30.0, 23.0, 21.0, 17.0, 17.0, 9.0, 16.0, 7.0, 11.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.282958984375, -19.61279296875, -18.942626953125, -18.2724609375, -17.602294921875, -16.93212890625, -16.261962890625, -15.591796875, -14.921630859375, -14.25146484375, -13.581298828125, -12.9111328125, -12.240966796875, -11.57080078125, -10.900634765625, -10.23046875, -9.560302734375, -8.89013671875, -8.219970703125, -7.5498046875, -6.879638671875, -6.20947265625, -5.539306640625, -4.869140625, -4.198974609375, -3.52880859375, -2.858642578125, -2.1884765625, -1.518310546875, -0.84814453125, -0.177978515625, 0.4921875, 1.162353515625, 1.83251953125, 2.502685546875, 3.1728515625, 3.843017578125, 4.51318359375, 5.183349609375, 5.853515625, 6.523681640625, 7.19384765625, 7.864013671875, 8.5341796875, 9.204345703125, 9.87451171875, 10.544677734375, 11.21484375, 11.885009765625, 12.55517578125, 13.225341796875, 13.8955078125, 14.565673828125, 15.23583984375, 15.906005859375, 16.576171875, 17.246337890625, 17.91650390625, 18.586669921875, 19.2568359375, 19.927001953125, 20.59716796875, 21.267333984375, 21.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 15.0, 16.0, 12.0, 22.0, 27.0, 34.0, 59.0, 70.0, 81.0, 136.0, 149.0, 276.0, 661.0, 2150.0, 12782.0, 446796.0, 2647053.0, 29774.0, 3549.0, 945.0, 376.0, 195.0, 119.0, 91.0, 64.0, 58.0, 32.0, 29.0, 25.0, 19.0, 18.0, 10.0, 5.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.75, -56.0087890625, -54.267578125, -52.5263671875, -50.78515625, -49.0439453125, -47.302734375, -45.5615234375, -43.8203125, -42.0791015625, -40.337890625, -38.5966796875, -36.85546875, -35.1142578125, -33.373046875, -31.6318359375, -29.890625, -28.1494140625, -26.408203125, -24.6669921875, -22.92578125, -21.1845703125, -19.443359375, -17.7021484375, -15.9609375, -14.2197265625, -12.478515625, -10.7373046875, -8.99609375, -7.2548828125, -5.513671875, -3.7724609375, -2.03125, -0.2900390625, 1.451171875, 3.1923828125, 4.93359375, 6.6748046875, 8.416015625, 10.1572265625, 11.8984375, 13.6396484375, 15.380859375, 17.1220703125, 18.86328125, 20.6044921875, 22.345703125, 24.0869140625, 25.828125, 27.5693359375, 29.310546875, 31.0517578125, 32.79296875, 34.5341796875, 36.275390625, 38.0166015625, 39.7578125, 41.4990234375, 43.240234375, 44.9814453125, 46.72265625, 48.4638671875, 50.205078125, 51.9462890625, 53.6875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 45.0, 839.0, 132.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.889549255371094, -43.596412658691406, -27.303272247314453, -11.0101318359375, 5.2830047607421875, 21.576141357421875, 37.869285583496094, 54.16242218017578, 70.45555877685547, 86.74869537353516, 103.04183959960938, 119.33497619628906, 135.62811279296875, 151.92124938964844, 168.21438598632812, 184.50753784179688, 200.8006591796875, 217.0937957763672, 233.38693237304688, 249.68008422851562, 265.97320556640625, 282.266357421875, 298.55950927734375, 314.8526306152344, 331.1457824707031, 347.4389343261719, 363.7320556640625, 380.02520751953125, 396.3183288574219, 412.6114807128906, 428.90460205078125, 445.19775390625, 461.49090576171875, 477.7840576171875, 494.0771789550781, 510.3703308105469, 526.6634521484375, 542.9566040039062, 559.249755859375, 575.5428466796875, 591.8359985351562, 608.129150390625, 624.4223022460938, 640.7153930664062, 657.008544921875, 673.3016967773438, 689.5948486328125, 705.887939453125, 722.18115234375, 738.4743041992188, 754.7674560546875, 771.060546875, 787.3536987304688, 803.6468505859375, 819.9400024414062, 836.233154296875, 852.5262451171875, 868.8193969726562, 885.112548828125, 901.4056396484375, 917.6987915039062, 933.991943359375, 950.2850952148438, 966.5782470703125, 982.871337890625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 18.0, 18.0, 25.0, 19.0, 27.0, 31.0, 35.0, 43.0, 42.0, 55.0, 53.0, 64.0, 54.0, 47.0, 38.0, 46.0, 47.0, 52.0, 34.0, 37.0, 35.0, 22.0, 30.0, 22.0, 17.0, 12.0, 15.0, 19.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.81705474853516, -89.38529205322266, -86.95352935791016, -84.52176666259766, -82.09000396728516, -79.65824127197266, -77.22647857666016, -74.79470825195312, -72.36294555664062, -69.93118286132812, -67.49942016601562, -65.06765747070312, -62.635894775390625, -60.204132080078125, -57.77236557006836, -55.34060287475586, -52.908843994140625, -50.477081298828125, -48.045318603515625, -45.613555908203125, -43.181793212890625, -40.750030517578125, -38.31826400756836, -35.88650131225586, -33.45473861694336, -31.02297592163086, -28.59121322631836, -26.159448623657227, -23.727685928344727, -21.295923233032227, -18.864158630371094, -16.432395935058594, -14.000640869140625, -11.568878173828125, -9.137114524841309, -6.70535135269165, -4.273588180541992, -1.8418254852294922, 0.5899381637573242, 3.0217018127441406, 5.453464508056641, 7.885227680206299, 10.316990852355957, 12.748754501342773, 15.180517196655273, 17.612279891967773, 20.044044494628906, 22.475807189941406, 24.907569885253906, 27.339332580566406, 29.771095275878906, 32.202857971191406, 34.634620666503906, 37.066383361816406, 39.49814987182617, 41.92991256713867, 44.36167526245117, 46.79343795776367, 49.22520065307617, 51.65696334838867, 54.08872985839844, 56.52049255371094, 58.95225524902344, 61.38401794433594, 63.81578063964844]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 18.0, 12.0, 22.0, 22.0, 23.0, 20.0, 32.0, 18.0, 25.0, 30.0, 41.0, 38.0, 42.0, 37.0, 36.0, 56.0, 45.0, 33.0, 35.0, 30.0, 38.0, 27.0, 40.0, 33.0, 37.0, 20.0, 20.0, 17.0, 14.0, 19.0, 19.0, 14.0, 11.0, 11.0, 10.0, 4.0, 7.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.9140625, -6.70556640625, -6.4970703125, -6.28857421875, -6.080078125, -5.87158203125, -5.6630859375, -5.45458984375, -5.24609375, -5.03759765625, -4.8291015625, -4.62060546875, -4.412109375, -4.20361328125, -3.9951171875, -3.78662109375, -3.578125, -3.36962890625, -3.1611328125, -2.95263671875, -2.744140625, -2.53564453125, -2.3271484375, -2.11865234375, -1.91015625, -1.70166015625, -1.4931640625, -1.28466796875, -1.076171875, -0.86767578125, -0.6591796875, -0.45068359375, -0.2421875, -0.03369140625, 0.1748046875, 0.38330078125, 0.591796875, 0.80029296875, 1.0087890625, 1.21728515625, 1.42578125, 1.63427734375, 1.8427734375, 2.05126953125, 2.259765625, 2.46826171875, 2.6767578125, 2.88525390625, 3.09375, 3.30224609375, 3.5107421875, 3.71923828125, 3.927734375, 4.13623046875, 4.3447265625, 4.55322265625, 4.76171875, 4.97021484375, 5.1787109375, 5.38720703125, 5.595703125, 5.80419921875, 6.0126953125, 6.22119140625, 6.4296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 7.0, 1.0, 5.0, 10.0, 7.0, 15.0, 16.0, 16.0, 29.0, 40.0, 50.0, 89.0, 135.0, 276.0, 464.0, 948.0, 1913.0, 4384.0, 10871.0, 35451.0, 275703.0, 2865015.0, 899636.0, 69266.0, 17705.0, 6523.0, 2764.0, 1316.0, 731.0, 321.0, 187.0, 128.0, 58.0, 56.0, 40.0, 24.0, 17.0, 10.0, 5.0, 9.0, 12.0, 4.0, 2.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-19.890625, -19.300537109375, -18.71044921875, -18.120361328125, -17.5302734375, -16.940185546875, -16.35009765625, -15.760009765625, -15.169921875, -14.579833984375, -13.98974609375, -13.399658203125, -12.8095703125, -12.219482421875, -11.62939453125, -11.039306640625, -10.44921875, -9.859130859375, -9.26904296875, -8.678955078125, -8.0888671875, -7.498779296875, -6.90869140625, -6.318603515625, -5.728515625, -5.138427734375, -4.54833984375, -3.958251953125, -3.3681640625, -2.778076171875, -2.18798828125, -1.597900390625, -1.0078125, -0.417724609375, 0.17236328125, 0.762451171875, 1.3525390625, 1.942626953125, 2.53271484375, 3.122802734375, 3.712890625, 4.302978515625, 4.89306640625, 5.483154296875, 6.0732421875, 6.663330078125, 7.25341796875, 7.843505859375, 8.43359375, 9.023681640625, 9.61376953125, 10.203857421875, 10.7939453125, 11.384033203125, 11.97412109375, 12.564208984375, 13.154296875, 13.744384765625, 14.33447265625, 14.924560546875, 15.5146484375, 16.104736328125, 16.69482421875, 17.284912109375, 17.875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 13.0, 10.0, 12.0, 15.0, 17.0, 30.0, 32.0, 55.0, 53.0, 75.0, 118.0, 218.0, 339.0, 460.0, 615.0, 579.0, 434.0, 283.0, 185.0, 120.0, 94.0, 69.0, 48.0, 37.0, 23.0, 19.0, 15.0, 16.0, 6.0, 9.0, 9.0, 11.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.828125, -12.397705078125, -11.96728515625, -11.536865234375, -11.1064453125, -10.676025390625, -10.24560546875, -9.815185546875, -9.384765625, -8.954345703125, -8.52392578125, -8.093505859375, -7.6630859375, -7.232666015625, -6.80224609375, -6.371826171875, -5.94140625, -5.510986328125, -5.08056640625, -4.650146484375, -4.2197265625, -3.789306640625, -3.35888671875, -2.928466796875, -2.498046875, -2.067626953125, -1.63720703125, -1.206787109375, -0.7763671875, -0.345947265625, 0.08447265625, 0.514892578125, 0.9453125, 1.375732421875, 1.80615234375, 2.236572265625, 2.6669921875, 3.097412109375, 3.52783203125, 3.958251953125, 4.388671875, 4.819091796875, 5.24951171875, 5.679931640625, 6.1103515625, 6.540771484375, 6.97119140625, 7.401611328125, 7.83203125, 8.262451171875, 8.69287109375, 9.123291015625, 9.5537109375, 9.984130859375, 10.41455078125, 10.844970703125, 11.275390625, 11.705810546875, 12.13623046875, 12.566650390625, 12.9970703125, 13.427490234375, 13.85791015625, 14.288330078125, 14.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 9.0, 12.0, 17.0, 10.0, 18.0, 30.0, 41.0, 42.0, 102.0, 174.0, 431.0, 1079.0, 4076.0, 19297.0, 188276.0, 3689107.0, 261755.0, 23021.0, 4652.0, 1275.0, 403.0, 162.0, 101.0, 48.0, 35.0, 26.0, 12.0, 14.0, 10.0, 11.0, 8.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-45.46875, -44.2578125, -43.046875, -41.8359375, -40.625, -39.4140625, -38.203125, -36.9921875, -35.78125, -34.5703125, -33.359375, -32.1484375, -30.9375, -29.7265625, -28.515625, -27.3046875, -26.09375, -24.8828125, -23.671875, -22.4609375, -21.25, -20.0390625, -18.828125, -17.6171875, -16.40625, -15.1953125, -13.984375, -12.7734375, -11.5625, -10.3515625, -9.140625, -7.9296875, -6.71875, -5.5078125, -4.296875, -3.0859375, -1.875, -0.6640625, 0.546875, 1.7578125, 2.96875, 4.1796875, 5.390625, 6.6015625, 7.8125, 9.0234375, 10.234375, 11.4453125, 12.65625, 13.8671875, 15.078125, 16.2890625, 17.5, 18.7109375, 19.921875, 21.1328125, 22.34375, 23.5546875, 24.765625, 25.9765625, 27.1875, 28.3984375, 29.609375, 30.8203125, 32.03125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 6.0, 12.0, 21.0, 31.0, 49.0, 53.0, 84.0, 119.0, 139.0, 135.0, 128.0, 77.0, 53.0, 30.0, 22.0, 9.0, 12.0, 5.0, 8.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.667724609375, -75.27259826660156, -72.87747192382812, -70.48235321044922, -68.08722686767578, -65.69210052490234, -63.296974182128906, -60.90184783935547, -58.5067253112793, -56.11159896850586, -53.71647644042969, -51.32135009765625, -48.92622375488281, -46.53110122680664, -44.1359748840332, -41.74085235595703, -39.345726013183594, -36.950599670410156, -34.555477142333984, -32.16035079956055, -29.765226364135742, -27.370101928710938, -24.9749755859375, -22.579851150512695, -20.18472671508789, -17.789602279663086, -15.394476890563965, -12.999351501464844, -10.604227066040039, -8.209102630615234, -5.813977241516113, -3.418851852416992, -1.0237197875976562, 1.3714051246643066, 3.7665300369262695, 6.161654949188232, 8.556779861450195, 10.951904296875, 13.347029685974121, 15.742155075073242, 18.137279510498047, 20.53240394592285, 22.927528381347656, 25.322654724121094, 27.7177791595459, 30.112903594970703, 32.50802993774414, 34.90315246582031, 37.29827880859375, 39.69340515136719, 42.08852767944336, 44.4836540222168, 46.87877655029297, 49.273902893066406, 51.669029235839844, 54.06415557861328, 56.45927810668945, 58.85440444946289, 61.24952697753906, 63.6446533203125, 66.03977966308594, 68.43490600585938, 70.83002471923828, 73.22515106201172, 75.62027740478516]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 8.0, 10.0, 8.0, 14.0, 21.0, 18.0, 16.0, 18.0, 21.0, 26.0, 40.0, 22.0, 32.0, 34.0, 41.0, 38.0, 45.0, 29.0, 37.0, 34.0, 45.0, 33.0, 50.0, 53.0, 37.0, 41.0, 32.0, 33.0, 21.0, 22.0, 20.0, 15.0, 16.0, 14.0, 9.0, 10.0, 7.0, 3.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-48.651527404785156, -47.16160202026367, -45.67168045043945, -44.18175506591797, -42.69183349609375, -41.201908111572266, -39.71198654174805, -38.22206115722656, -36.732139587402344, -35.24221420288086, -33.75229263305664, -32.262367248535156, -30.772445678710938, -29.282522201538086, -27.792598724365234, -26.30267333984375, -24.8127498626709, -23.322826385498047, -21.832902908325195, -20.342979431152344, -18.853055953979492, -17.36313247680664, -15.873208045959473, -14.383284568786621, -12.89336109161377, -11.403437614440918, -9.913514137268066, -8.423589706420898, -6.933666706085205, -5.4437432289123535, -3.9538192749023438, -2.463895797729492, -0.9739723205566406, 0.5159512758255005, 2.0058748722076416, 3.4957985877990723, 4.985722064971924, 6.475645542144775, 7.965569496154785, 9.455492973327637, 10.945416450500488, 12.43533992767334, 13.925263404846191, 15.41518783569336, 16.90511131286621, 18.395034790039062, 19.884958267211914, 21.374881744384766, 22.864805221557617, 24.35472869873047, 25.84465217590332, 27.334575653076172, 28.824499130249023, 30.314422607421875, 31.80434799194336, 33.29426956176758, 34.78419494628906, 36.27412033081055, 37.764041900634766, 39.25396728515625, 40.74388885498047, 42.23381423950195, 43.72373580932617, 45.213661193847656, 46.703582763671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 8.0, 11.0, 18.0, 4.0, 15.0, 11.0, 16.0, 26.0, 29.0, 19.0, 29.0, 39.0, 27.0, 30.0, 35.0, 42.0, 38.0, 32.0, 35.0, 46.0, 37.0, 43.0, 39.0, 29.0, 24.0, 39.0, 26.0, 24.0, 27.0, 19.0, 24.0, 22.0, 18.0, 12.0, 13.0, 9.0, 11.0, 13.0, 6.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.3145751953125, -5.133056640625, -4.9515380859375, -4.77001953125, -4.5885009765625, -4.406982421875, -4.2254638671875, -4.0439453125, -3.8624267578125, -3.680908203125, -3.4993896484375, -3.31787109375, -3.1363525390625, -2.954833984375, -2.7733154296875, -2.591796875, -2.4102783203125, -2.228759765625, -2.0472412109375, -1.86572265625, -1.6842041015625, -1.502685546875, -1.3211669921875, -1.1396484375, -0.9581298828125, -0.776611328125, -0.5950927734375, -0.41357421875, -0.2320556640625, -0.050537109375, 0.1309814453125, 0.3125, 0.4940185546875, 0.675537109375, 0.8570556640625, 1.03857421875, 1.2200927734375, 1.401611328125, 1.5831298828125, 1.7646484375, 1.9461669921875, 2.127685546875, 2.3092041015625, 2.49072265625, 2.6722412109375, 2.853759765625, 3.0352783203125, 3.216796875, 3.3983154296875, 3.579833984375, 3.7613525390625, 3.94287109375, 4.1243896484375, 4.305908203125, 4.4874267578125, 4.6689453125, 4.8504638671875, 5.031982421875, 5.2135009765625, 5.39501953125, 5.5765380859375, 5.758056640625, 5.9395751953125, 6.12109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 11.0, 7.0, 16.0, 10.0, 32.0, 26.0, 44.0, 62.0, 72.0, 126.0, 176.0, 225.0, 318.0, 444.0, 607.0, 880.0, 1225.0, 1835.0, 2850.0, 4612.0, 8142.0, 15195.0, 30945.0, 67939.0, 159938.0, 321866.0, 236967.0, 100762.0, 44620.0, 20954.0, 10815.0, 5890.0, 3458.0, 2293.0, 1555.0, 1026.0, 743.0, 552.0, 361.0, 290.0, 174.0, 129.0, 98.0, 83.0, 49.0, 41.0, 23.0, 21.0, 14.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.833984375, -1.772308349609375, -1.71063232421875, -1.648956298828125, -1.5872802734375, -1.525604248046875, -1.46392822265625, -1.402252197265625, -1.340576171875, -1.278900146484375, -1.21722412109375, -1.155548095703125, -1.0938720703125, -1.032196044921875, -0.97052001953125, -0.908843994140625, -0.84716796875, -0.785491943359375, -0.72381591796875, -0.662139892578125, -0.6004638671875, -0.538787841796875, -0.47711181640625, -0.415435791015625, -0.353759765625, -0.292083740234375, -0.23040771484375, -0.168731689453125, -0.1070556640625, -0.045379638671875, 0.01629638671875, 0.077972412109375, 0.1396484375, 0.201324462890625, 0.26300048828125, 0.324676513671875, 0.3863525390625, 0.448028564453125, 0.50970458984375, 0.571380615234375, 0.633056640625, 0.694732666015625, 0.75640869140625, 0.818084716796875, 0.8797607421875, 0.941436767578125, 1.00311279296875, 1.064788818359375, 1.12646484375, 1.188140869140625, 1.24981689453125, 1.311492919921875, 1.3731689453125, 1.434844970703125, 1.49652099609375, 1.558197021484375, 1.619873046875, 1.681549072265625, 1.74322509765625, 1.804901123046875, 1.8665771484375, 1.928253173828125, 1.98992919921875, 2.051605224609375, 2.11328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 5.0, 8.0, 7.0, 9.0, 16.0, 12.0, 10.0, 19.0, 16.0, 23.0, 22.0, 21.0, 30.0, 34.0, 40.0, 46.0, 41.0, 43.0, 37.0, 28.0, 41.0, 1059.0, 35.0, 39.0, 44.0, 34.0, 34.0, 27.0, 40.0, 42.0, 19.0, 22.0, 21.0, 19.0, 15.0, 11.0, 12.0, 6.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1273193359375, -3.985107421875, -3.8428955078125, -3.70068359375, -3.5584716796875, -3.416259765625, -3.2740478515625, -3.1318359375, -2.9896240234375, -2.847412109375, -2.7052001953125, -2.56298828125, -2.4207763671875, -2.278564453125, -2.1363525390625, -1.994140625, -1.8519287109375, -1.709716796875, -1.5675048828125, -1.42529296875, -1.2830810546875, -1.140869140625, -0.9986572265625, -0.8564453125, -0.7142333984375, -0.572021484375, -0.4298095703125, -0.28759765625, -0.1453857421875, -0.003173828125, 0.1390380859375, 0.28125, 0.4234619140625, 0.565673828125, 0.7078857421875, 0.85009765625, 0.9923095703125, 1.134521484375, 1.2767333984375, 1.4189453125, 1.5611572265625, 1.703369140625, 1.8455810546875, 1.98779296875, 2.1300048828125, 2.272216796875, 2.4144287109375, 2.556640625, 2.6988525390625, 2.841064453125, 2.9832763671875, 3.12548828125, 3.2677001953125, 3.409912109375, 3.5521240234375, 3.6943359375, 3.8365478515625, 3.978759765625, 4.1209716796875, 4.26318359375, 4.4053955078125, 4.547607421875, 4.6898193359375, 4.83203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 8.0, 5.0, 12.0, 19.0, 37.0, 49.0, 86.0, 125.0, 193.0, 349.0, 615.0, 1201.0, 2642.0, 7182.0, 24811.0, 133630.0, 1518188.0, 341263.0, 47660.0, 11465.0, 3945.0, 1668.0, 797.0, 481.0, 273.0, 150.0, 87.0, 70.0, 44.0, 24.0, 18.0, 7.0, 5.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.400390625, -2.32470703125, -2.2490234375, -2.17333984375, -2.09765625, -2.02197265625, -1.9462890625, -1.87060546875, -1.794921875, -1.71923828125, -1.6435546875, -1.56787109375, -1.4921875, -1.41650390625, -1.3408203125, -1.26513671875, -1.189453125, -1.11376953125, -1.0380859375, -0.96240234375, -0.88671875, -0.81103515625, -0.7353515625, -0.65966796875, -0.583984375, -0.50830078125, -0.4326171875, -0.35693359375, -0.28125, -0.20556640625, -0.1298828125, -0.05419921875, 0.021484375, 0.09716796875, 0.1728515625, 0.24853515625, 0.32421875, 0.39990234375, 0.4755859375, 0.55126953125, 0.626953125, 0.70263671875, 0.7783203125, 0.85400390625, 0.9296875, 1.00537109375, 1.0810546875, 1.15673828125, 1.232421875, 1.30810546875, 1.3837890625, 1.45947265625, 1.53515625, 1.61083984375, 1.6865234375, 1.76220703125, 1.837890625, 1.91357421875, 1.9892578125, 2.06494140625, 2.140625, 2.21630859375, 2.2919921875, 2.36767578125, 2.443359375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 12.0, 11.0, 15.0, 17.0, 13.0, 17.0, 30.0, 24.0, 47.0, 45.0, 69.0, 89.0, 158.0, 91.0, 69.0, 39.0, 45.0, 37.0, 17.0, 24.0, 16.0, 16.0, 16.0, 16.0, 11.0, 6.0, 8.0, 2.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207275390625, -0.20026397705078125, -0.1932525634765625, -0.18624114990234375, -0.179229736328125, -0.17221832275390625, -0.1652069091796875, -0.15819549560546875, -0.15118408203125, -0.14417266845703125, -0.1371612548828125, -0.13014984130859375, -0.123138427734375, -0.11612701416015625, -0.1091156005859375, -0.10210418701171875, -0.0950927734375, -0.08808135986328125, -0.0810699462890625, -0.07405853271484375, -0.067047119140625, -0.06003570556640625, -0.0530242919921875, -0.04601287841796875, -0.03900146484375, -0.03199005126953125, -0.0249786376953125, -0.01796722412109375, -0.010955810546875, -0.00394439697265625, 0.0030670166015625, 0.01007843017578125, 0.01708984375, 0.02410125732421875, 0.0311126708984375, 0.03812408447265625, 0.045135498046875, 0.05214691162109375, 0.0591583251953125, 0.06616973876953125, 0.07318115234375, 0.08019256591796875, 0.0872039794921875, 0.09421539306640625, 0.101226806640625, 0.10823822021484375, 0.1152496337890625, 0.12226104736328125, 0.1292724609375, 0.13628387451171875, 0.1432952880859375, 0.15030670166015625, 0.157318115234375, 0.16432952880859375, 0.1713409423828125, 0.17835235595703125, 0.18536376953125, 0.19237518310546875, 0.1993865966796875, 0.20639801025390625, 0.213409423828125, 0.22042083740234375, 0.2274322509765625, 0.23444366455078125, 0.241455078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 14.0, 18.0, 21.0, 17.0, 33.0, 47.0, 62.0, 106.0, 217.0, 651.0, 3635.0, 72422.0, 955746.0, 13419.0, 1319.0, 340.0, 152.0, 90.0, 46.0, 28.0, 35.0, 16.0, 21.0, 15.0, 13.0, 8.0, 5.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.6875, -4.5506591796875, -4.413818359375, -4.2769775390625, -4.14013671875, -4.0032958984375, -3.866455078125, -3.7296142578125, -3.5927734375, -3.4559326171875, -3.319091796875, -3.1822509765625, -3.04541015625, -2.9085693359375, -2.771728515625, -2.6348876953125, -2.498046875, -2.3612060546875, -2.224365234375, -2.0875244140625, -1.95068359375, -1.8138427734375, -1.677001953125, -1.5401611328125, -1.4033203125, -1.2664794921875, -1.129638671875, -0.9927978515625, -0.85595703125, -0.7191162109375, -0.582275390625, -0.4454345703125, -0.30859375, -0.1717529296875, -0.034912109375, 0.1019287109375, 0.23876953125, 0.3756103515625, 0.512451171875, 0.6492919921875, 0.7861328125, 0.9229736328125, 1.059814453125, 1.1966552734375, 1.33349609375, 1.4703369140625, 1.607177734375, 1.7440185546875, 1.880859375, 2.0177001953125, 2.154541015625, 2.2913818359375, 2.42822265625, 2.5650634765625, 2.701904296875, 2.8387451171875, 2.9755859375, 3.1124267578125, 3.249267578125, 3.3861083984375, 3.52294921875, 3.6597900390625, 3.796630859375, 3.9334716796875, 4.0703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 13.0, 18.0, 35.0, 83.0, 125.0, 196.0, 216.0, 154.0, 85.0, 42.0, 16.0, 17.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5326188206672668, -0.5113019943237305, -0.4899851977825165, -0.4686684012413025, -0.4473515748977661, -0.42603474855422974, -0.40471795201301575, -0.38340115547180176, -0.3620843291282654, -0.340767502784729, -0.319450706243515, -0.298133909702301, -0.27681708335876465, -0.25550025701522827, -0.23418346047401428, -0.2128666490316391, -0.19154983758926392, -0.17023302614688873, -0.14891621470451355, -0.12759940326213837, -0.10628259181976318, -0.084965780377388, -0.06364896893501282, -0.042332157492637634, -0.02101534605026245, 0.00030146539211273193, 0.021618276834487915, 0.0429350882768631, 0.06425189971923828, 0.08556871116161346, 0.10688552260398865, 0.12820233404636383, 0.14951908588409424, 0.17083589732646942, 0.1921527087688446, 0.2134695202112198, 0.23478633165359497, 0.25610315799713135, 0.27741995453834534, 0.2987367510795593, 0.3200535774230957, 0.3413704037666321, 0.36268720030784607, 0.38400399684906006, 0.40532082319259644, 0.4266376495361328, 0.4479544460773468, 0.4692712426185608, 0.49058806896209717, 0.5119048953056335, 0.5332217216491699, 0.5545384883880615, 0.5758553147315979, 0.5971721410751343, 0.6184889078140259, 0.6398057341575623, 0.6611225605010986, 0.682439386844635, 0.7037562131881714, 0.725072979927063, 0.7463898062705994, 0.7677066326141357, 0.7890233993530273, 0.8103402256965637, 0.8316570520401001]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 6.0, 4.0, 3.0, 0.0, 7.0, 10.0, 6.0, 13.0, 11.0, 19.0, 22.0, 17.0, 26.0, 18.0, 14.0, 31.0, 36.0, 29.0, 29.0, 29.0, 40.0, 50.0, 46.0, 38.0, 45.0, 38.0, 38.0, 38.0, 27.0, 29.0, 35.0, 31.0, 29.0, 34.0, 29.0, 20.0, 18.0, 15.0, 11.0, 9.0, 7.0, 11.0, 9.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.17120659351348877, -0.16573093831539154, -0.1602552831172943, -0.15477962791919708, -0.14930397272109985, -0.14382831752300262, -0.1383526623249054, -0.13287700712680817, -0.12740135192871094, -0.12192569673061371, -0.11645004153251648, -0.11097438633441925, -0.10549873113632202, -0.10002307593822479, -0.09454742074012756, -0.08907176554203033, -0.0835961103439331, -0.07812045514583588, -0.07264479994773865, -0.06716914474964142, -0.06169348955154419, -0.05621783435344696, -0.05074217915534973, -0.0452665239572525, -0.03979086875915527, -0.034315213561058044, -0.028839558362960815, -0.023363903164863586, -0.017888247966766357, -0.012412592768669128, -0.006936937570571899, -0.0014612823724746704, 0.004014372825622559, 0.009490028023719788, 0.014965683221817017, 0.020441338419914246, 0.025916993618011475, 0.031392648816108704, 0.03686830401420593, 0.04234395921230316, 0.04781961441040039, 0.05329526960849762, 0.05877092480659485, 0.06424658000469208, 0.0697222352027893, 0.07519789040088654, 0.08067354559898376, 0.086149200797081, 0.09162485599517822, 0.09710051119327545, 0.10257616639137268, 0.10805182158946991, 0.11352747678756714, 0.11900313198566437, 0.1244787871837616, 0.12995444238185883, 0.13543009757995605, 0.14090575277805328, 0.1463814079761505, 0.15185706317424774, 0.15733271837234497, 0.1628083735704422, 0.16828402876853943, 0.17375968396663666, 0.1792353391647339]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 5.0, 12.0, 10.0, 10.0, 14.0, 17.0, 30.0, 18.0, 23.0, 34.0, 22.0, 28.0, 28.0, 34.0, 35.0, 44.0, 40.0, 37.0, 53.0, 40.0, 34.0, 33.0, 55.0, 37.0, 23.0, 27.0, 38.0, 23.0, 14.0, 21.0, 20.0, 23.0, 12.0, 14.0, 16.0, 11.0, 7.0, 8.0, 7.0, 3.0, 8.0, 5.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.51171875, -5.321533203125, -5.13134765625, -4.941162109375, -4.7509765625, -4.560791015625, -4.37060546875, -4.180419921875, -3.990234375, -3.800048828125, -3.60986328125, -3.419677734375, -3.2294921875, -3.039306640625, -2.84912109375, -2.658935546875, -2.46875, -2.278564453125, -2.08837890625, -1.898193359375, -1.7080078125, -1.517822265625, -1.32763671875, -1.137451171875, -0.947265625, -0.757080078125, -0.56689453125, -0.376708984375, -0.1865234375, 0.003662109375, 0.19384765625, 0.384033203125, 0.57421875, 0.764404296875, 0.95458984375, 1.144775390625, 1.3349609375, 1.525146484375, 1.71533203125, 1.905517578125, 2.095703125, 2.285888671875, 2.47607421875, 2.666259765625, 2.8564453125, 3.046630859375, 3.23681640625, 3.427001953125, 3.6171875, 3.807373046875, 3.99755859375, 4.187744140625, 4.3779296875, 4.568115234375, 4.75830078125, 4.948486328125, 5.138671875, 5.328857421875, 5.51904296875, 5.709228515625, 5.8994140625, 6.089599609375, 6.27978515625, 6.469970703125, 6.66015625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 10.0, 14.0, 29.0, 31.0, 51.0, 56.0, 83.0, 100.0, 166.0, 220.0, 309.0, 427.0, 659.0, 1016.0, 1504.0, 2607.0, 4419.0, 8618.0, 17800.0, 43814.0, 152642.0, 537420.0, 185058.0, 49800.0, 19739.0, 9342.0, 4749.0, 2750.0, 1698.0, 1011.0, 706.0, 482.0, 318.0, 246.0, 162.0, 131.0, 89.0, 64.0, 57.0, 33.0, 29.0, 25.0, 18.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-12.75, -12.381103515625, -12.01220703125, -11.643310546875, -11.2744140625, -10.905517578125, -10.53662109375, -10.167724609375, -9.798828125, -9.429931640625, -9.06103515625, -8.692138671875, -8.3232421875, -7.954345703125, -7.58544921875, -7.216552734375, -6.84765625, -6.478759765625, -6.10986328125, -5.740966796875, -5.3720703125, -5.003173828125, -4.63427734375, -4.265380859375, -3.896484375, -3.527587890625, -3.15869140625, -2.789794921875, -2.4208984375, -2.052001953125, -1.68310546875, -1.314208984375, -0.9453125, -0.576416015625, -0.20751953125, 0.161376953125, 0.5302734375, 0.899169921875, 1.26806640625, 1.636962890625, 2.005859375, 2.374755859375, 2.74365234375, 3.112548828125, 3.4814453125, 3.850341796875, 4.21923828125, 4.588134765625, 4.95703125, 5.325927734375, 5.69482421875, 6.063720703125, 6.4326171875, 6.801513671875, 7.17041015625, 7.539306640625, 7.908203125, 8.277099609375, 8.64599609375, 9.014892578125, 9.3837890625, 9.752685546875, 10.12158203125, 10.490478515625, 10.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 15.0, 16.0, 15.0, 16.0, 22.0, 22.0, 23.0, 27.0, 34.0, 34.0, 49.0, 75.0, 92.0, 147.0, 343.0, 1397.0, 150.0, 68.0, 64.0, 67.0, 50.0, 38.0, 34.0, 28.0, 33.0, 21.0, 17.0, 14.0, 13.0, 19.0, 16.0, 7.0, 6.0, 6.0, 1.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-19.84375, -19.18310546875, -18.5224609375, -17.86181640625, -17.201171875, -16.54052734375, -15.8798828125, -15.21923828125, -14.55859375, -13.89794921875, -13.2373046875, -12.57666015625, -11.916015625, -11.25537109375, -10.5947265625, -9.93408203125, -9.2734375, -8.61279296875, -7.9521484375, -7.29150390625, -6.630859375, -5.97021484375, -5.3095703125, -4.64892578125, -3.98828125, -3.32763671875, -2.6669921875, -2.00634765625, -1.345703125, -0.68505859375, -0.0244140625, 0.63623046875, 1.296875, 1.95751953125, 2.6181640625, 3.27880859375, 3.939453125, 4.60009765625, 5.2607421875, 5.92138671875, 6.58203125, 7.24267578125, 7.9033203125, 8.56396484375, 9.224609375, 9.88525390625, 10.5458984375, 11.20654296875, 11.8671875, 12.52783203125, 13.1884765625, 13.84912109375, 14.509765625, 15.17041015625, 15.8310546875, 16.49169921875, 17.15234375, 17.81298828125, 18.4736328125, 19.13427734375, 19.794921875, 20.45556640625, 21.1162109375, 21.77685546875, 22.4375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 5.0, 7.0, 5.0, 11.0, 12.0, 20.0, 24.0, 46.0, 46.0, 70.0, 124.0, 154.0, 356.0, 1071.0, 9077.0, 2892130.0, 236953.0, 4115.0, 718.0, 268.0, 152.0, 89.0, 57.0, 41.0, 31.0, 21.0, 14.0, 8.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-79.1875, -76.3447265625, -73.501953125, -70.6591796875, -67.81640625, -64.9736328125, -62.130859375, -59.2880859375, -56.4453125, -53.6025390625, -50.759765625, -47.9169921875, -45.07421875, -42.2314453125, -39.388671875, -36.5458984375, -33.703125, -30.8603515625, -28.017578125, -25.1748046875, -22.33203125, -19.4892578125, -16.646484375, -13.8037109375, -10.9609375, -8.1181640625, -5.275390625, -2.4326171875, 0.41015625, 3.2529296875, 6.095703125, 8.9384765625, 11.78125, 14.6240234375, 17.466796875, 20.3095703125, 23.15234375, 25.9951171875, 28.837890625, 31.6806640625, 34.5234375, 37.3662109375, 40.208984375, 43.0517578125, 45.89453125, 48.7373046875, 51.580078125, 54.4228515625, 57.265625, 60.1083984375, 62.951171875, 65.7939453125, 68.63671875, 71.4794921875, 74.322265625, 77.1650390625, 80.0078125, 82.8505859375, 85.693359375, 88.5361328125, 91.37890625, 94.2216796875, 97.064453125, 99.9072265625, 102.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 30.0, 683.0, 296.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8226432800293, -48.93228530883789, -36.04193115234375, -23.151573181152344, -10.261215209960938, 2.629138946533203, 15.51949691772461, 28.409854888916016, 41.30021286010742, 54.19057083129883, 67.08092498779297, 79.97128295898438, 92.86164093017578, 105.75199890136719, 118.64234924316406, 131.53271484375, 144.42306518554688, 157.31341552734375, 170.2037811279297, 183.09413146972656, 195.9844970703125, 208.87484741210938, 221.76519775390625, 234.6555633544922, 247.54592895507812, 260.436279296875, 273.3266296386719, 286.2170104980469, 299.10736083984375, 311.9977111816406, 324.8880615234375, 337.7784423828125, 350.6687927246094, 363.55914306640625, 376.4494934082031, 389.3398742675781, 402.230224609375, 415.1205749511719, 428.01092529296875, 440.90130615234375, 453.7916564941406, 466.6820068359375, 479.5723571777344, 492.4627380371094, 505.35308837890625, 518.243408203125, 531.1337890625, 544.024169921875, 556.9144897460938, 569.8048706054688, 582.6951904296875, 595.5855712890625, 608.4758911132812, 621.3662719726562, 634.2566528320312, 647.14697265625, 660.037353515625, 672.927734375, 685.8180541992188, 698.7084350585938, 711.5987548828125, 724.4891357421875, 737.3795166015625, 750.2698364257812, 763.1602172851562]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 8.0, 4.0, 12.0, 10.0, 10.0, 16.0, 23.0, 21.0, 28.0, 31.0, 31.0, 26.0, 30.0, 32.0, 37.0, 36.0, 30.0, 37.0, 28.0, 36.0, 45.0, 38.0, 44.0, 41.0, 41.0, 42.0, 22.0, 33.0, 34.0, 29.0, 24.0, 25.0, 18.0, 9.0, 14.0, 12.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.8868293762207, -57.15303421020508, -55.41923522949219, -53.68544006347656, -51.95164489746094, -50.21784591674805, -48.48405075073242, -46.75025177001953, -45.016456604003906, -43.28266143798828, -41.54886245727539, -39.815067291259766, -38.081268310546875, -36.34747314453125, -34.613677978515625, -32.8798828125, -31.14608383178711, -29.41228675842285, -27.678489685058594, -25.94469451904297, -24.21089744567871, -22.477100372314453, -20.743305206298828, -19.00950813293457, -17.275711059570312, -15.541913986206055, -13.808117866516113, -12.074321746826172, -10.340524673461914, -8.606727600097656, -6.872931480407715, -5.139135360717773, -3.4053421020507812, -1.6715455055236816, 0.06225109100341797, 1.7960476875305176, 3.529844284057617, 5.263641357421875, 6.997437477111816, 8.731233596801758, 10.465030670166016, 12.198827743530273, 13.932623863220215, 15.666419982910156, 17.400217056274414, 19.134014129638672, 20.867809295654297, 22.601606369018555, 24.335403442382812, 26.06920051574707, 27.802997589111328, 29.536792755126953, 31.27058982849121, 33.00438690185547, 34.738182067871094, 36.47197723388672, 38.20577621459961, 39.939571380615234, 41.673370361328125, 43.40716552734375, 45.140960693359375, 46.874759674072266, 48.60855484008789, 50.34235382080078, 52.076148986816406]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 6.0, 11.0, 9.0, 10.0, 23.0, 22.0, 24.0, 21.0, 29.0, 20.0, 39.0, 27.0, 28.0, 38.0, 36.0, 45.0, 41.0, 41.0, 46.0, 36.0, 43.0, 37.0, 38.0, 28.0, 32.0, 27.0, 25.0, 26.0, 20.0, 17.0, 23.0, 20.0, 13.0, 12.0, 13.0, 7.0, 9.0, 6.0, 8.0, 4.0, 7.0, 2.0, 2.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.68359375, -6.4713134765625, -6.259033203125, -6.0467529296875, -5.83447265625, -5.6221923828125, -5.409912109375, -5.1976318359375, -4.9853515625, -4.7730712890625, -4.560791015625, -4.3485107421875, -4.13623046875, -3.9239501953125, -3.711669921875, -3.4993896484375, -3.287109375, -3.0748291015625, -2.862548828125, -2.6502685546875, -2.43798828125, -2.2257080078125, -2.013427734375, -1.8011474609375, -1.5888671875, -1.3765869140625, -1.164306640625, -0.9520263671875, -0.73974609375, -0.5274658203125, -0.315185546875, -0.1029052734375, 0.109375, 0.3216552734375, 0.533935546875, 0.7462158203125, 0.95849609375, 1.1707763671875, 1.383056640625, 1.5953369140625, 1.8076171875, 2.0198974609375, 2.232177734375, 2.4444580078125, 2.65673828125, 2.8690185546875, 3.081298828125, 3.2935791015625, 3.505859375, 3.7181396484375, 3.930419921875, 4.1427001953125, 4.35498046875, 4.5672607421875, 4.779541015625, 4.9918212890625, 5.2041015625, 5.4163818359375, 5.628662109375, 5.8409423828125, 6.05322265625, 6.2655029296875, 6.477783203125, 6.6900634765625, 6.90234375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 3.0, 7.0, 16.0, 10.0, 26.0, 22.0, 24.0, 51.0, 72.0, 114.0, 158.0, 189.0, 347.0, 528.0, 804.0, 1533.0, 2891.0, 5617.0, 12681.0, 33905.0, 153323.0, 1199662.0, 2321215.0, 365407.0, 59087.0, 19364.0, 8119.0, 3957.0, 2087.0, 1097.0, 633.0, 434.0, 305.0, 176.0, 118.0, 87.0, 52.0, 39.0, 25.0, 19.0, 17.0, 11.0, 9.0, 11.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-15.296875, -14.862548828125, -14.42822265625, -13.993896484375, -13.5595703125, -13.125244140625, -12.69091796875, -12.256591796875, -11.822265625, -11.387939453125, -10.95361328125, -10.519287109375, -10.0849609375, -9.650634765625, -9.21630859375, -8.781982421875, -8.34765625, -7.913330078125, -7.47900390625, -7.044677734375, -6.6103515625, -6.176025390625, -5.74169921875, -5.307373046875, -4.873046875, -4.438720703125, -4.00439453125, -3.570068359375, -3.1357421875, -2.701416015625, -2.26708984375, -1.832763671875, -1.3984375, -0.964111328125, -0.52978515625, -0.095458984375, 0.3388671875, 0.773193359375, 1.20751953125, 1.641845703125, 2.076171875, 2.510498046875, 2.94482421875, 3.379150390625, 3.8134765625, 4.247802734375, 4.68212890625, 5.116455078125, 5.55078125, 5.985107421875, 6.41943359375, 6.853759765625, 7.2880859375, 7.722412109375, 8.15673828125, 8.591064453125, 9.025390625, 9.459716796875, 9.89404296875, 10.328369140625, 10.7626953125, 11.197021484375, 11.63134765625, 12.065673828125, 12.5]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 4.0, 8.0, 3.0, 9.0, 11.0, 18.0, 21.0, 21.0, 24.0, 45.0, 53.0, 71.0, 110.0, 191.0, 300.0, 518.0, 698.0, 679.0, 456.0, 285.0, 164.0, 111.0, 64.0, 46.0, 34.0, 25.0, 19.0, 20.0, 18.0, 7.0, 5.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.78125, -15.285888671875, -14.79052734375, -14.295166015625, -13.7998046875, -13.304443359375, -12.80908203125, -12.313720703125, -11.818359375, -11.322998046875, -10.82763671875, -10.332275390625, -9.8369140625, -9.341552734375, -8.84619140625, -8.350830078125, -7.85546875, -7.360107421875, -6.86474609375, -6.369384765625, -5.8740234375, -5.378662109375, -4.88330078125, -4.387939453125, -3.892578125, -3.397216796875, -2.90185546875, -2.406494140625, -1.9111328125, -1.415771484375, -0.92041015625, -0.425048828125, 0.0703125, 0.565673828125, 1.06103515625, 1.556396484375, 2.0517578125, 2.547119140625, 3.04248046875, 3.537841796875, 4.033203125, 4.528564453125, 5.02392578125, 5.519287109375, 6.0146484375, 6.510009765625, 7.00537109375, 7.500732421875, 7.99609375, 8.491455078125, 8.98681640625, 9.482177734375, 9.9775390625, 10.472900390625, 10.96826171875, 11.463623046875, 11.958984375, 12.454345703125, 12.94970703125, 13.445068359375, 13.9404296875, 14.435791015625, 14.93115234375, 15.426513671875, 15.921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 10.0, 18.0, 21.0, 22.0, 42.0, 67.0, 122.0, 235.0, 586.0, 1776.0, 7050.0, 42522.0, 1320546.0, 2745444.0, 63223.0, 9019.0, 2209.0, 729.0, 273.0, 111.0, 73.0, 42.0, 29.0, 17.0, 17.0, 11.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.06396484375, -33.8154296875, -32.56689453125, -31.318359375, -30.06982421875, -28.8212890625, -27.57275390625, -26.32421875, -25.07568359375, -23.8271484375, -22.57861328125, -21.330078125, -20.08154296875, -18.8330078125, -17.58447265625, -16.3359375, -15.08740234375, -13.8388671875, -12.59033203125, -11.341796875, -10.09326171875, -8.8447265625, -7.59619140625, -6.34765625, -5.09912109375, -3.8505859375, -2.60205078125, -1.353515625, -0.10498046875, 1.1435546875, 2.39208984375, 3.640625, 4.88916015625, 6.1376953125, 7.38623046875, 8.634765625, 9.88330078125, 11.1318359375, 12.38037109375, 13.62890625, 14.87744140625, 16.1259765625, 17.37451171875, 18.623046875, 19.87158203125, 21.1201171875, 22.36865234375, 23.6171875, 24.86572265625, 26.1142578125, 27.36279296875, 28.611328125, 29.85986328125, 31.1083984375, 32.35693359375, 33.60546875, 34.85400390625, 36.1025390625, 37.35107421875, 38.599609375, 39.84814453125, 41.0966796875, 42.34521484375, 43.59375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 13.0, 54.0, 67.0, 189.0, 238.0, 228.0, 123.0, 59.0, 26.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-204.87384033203125, -200.57501220703125, -196.2761688232422, -191.97732543945312, -187.67849731445312, -183.37966918945312, -179.08082580566406, -174.781982421875, -170.483154296875, -166.184326171875, -161.88548278808594, -157.58663940429688, -153.28781127929688, -148.98898315429688, -144.6901397705078, -140.39129638671875, -136.09246826171875, -131.79364013671875, -127.49479675292969, -123.19596099853516, -118.89712524414062, -114.5982894897461, -110.29945373535156, -106.00061798095703, -101.7017822265625, -97.40294647216797, -93.10411071777344, -88.8052749633789, -84.50643920898438, -80.20760345458984, -75.90876770019531, -71.60993194580078, -67.31109619140625, -63.01226043701172, -58.71342468261719, -54.414588928222656, -50.115753173828125, -45.816917419433594, -41.51808166503906, -37.21924591064453, -32.92041015625, -28.62157440185547, -24.322738647460938, -20.023902893066406, -15.725067138671875, -11.426231384277344, -7.1273956298828125, -2.8285598754882812, 1.47027587890625, 5.769111633300781, 10.067947387695312, 14.366783142089844, 18.665618896484375, 22.964454650878906, 27.263290405273438, 31.56212615966797, 35.8609619140625, 40.15979766845703, 44.45863342285156, 48.757469177246094, 53.056304931640625, 57.355140686035156, 61.65397644042969, 65.95281219482422, 70.25164794921875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 7.0, 7.0, 17.0, 22.0, 20.0, 20.0, 24.0, 28.0, 26.0, 28.0, 37.0, 26.0, 34.0, 42.0, 38.0, 47.0, 44.0, 50.0, 34.0, 44.0, 39.0, 30.0, 32.0, 38.0, 35.0, 31.0, 32.0, 29.0, 21.0, 20.0, 16.0, 16.0, 14.0, 8.0, 7.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-47.331844329833984, -45.90064239501953, -44.469444274902344, -43.03824234008789, -41.60704040527344, -40.17584228515625, -38.7446403503418, -37.313438415527344, -35.882240295410156, -34.4510383605957, -33.019840240478516, -31.588638305664062, -30.15743637084961, -28.72623634338379, -27.29503631591797, -25.863834381103516, -24.432632446289062, -23.001432418823242, -21.57023048400879, -20.13903045654297, -18.707828521728516, -17.276628494262695, -15.845428466796875, -14.414227485656738, -12.983026504516602, -11.551825523376465, -10.120624542236328, -8.689424514770508, -7.258223533630371, -5.827022552490234, -4.395822525024414, -2.9646215438842773, -1.5334205627441406, -0.10221982002258301, 1.3289809226989746, 2.760181427001953, 4.19138240814209, 5.622583389282227, 7.053783416748047, 8.484984397888184, 9.91618537902832, 11.347386360168457, 12.778587341308594, 14.209787368774414, 15.64098834991455, 17.072189331054688, 18.503389358520508, 19.934589385986328, 21.36579132080078, 22.7969913482666, 24.228193283081055, 25.659393310546875, 27.090595245361328, 28.52179527282715, 29.95299530029297, 31.384197235107422, 32.815399169921875, 34.24660110473633, 35.677799224853516, 37.10900115966797, 38.54020309448242, 39.971405029296875, 41.40260314941406, 42.833805084228516, 44.2650032043457]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 10.0, 11.0, 15.0, 19.0, 12.0, 25.0, 29.0, 23.0, 29.0, 30.0, 44.0, 34.0, 44.0, 29.0, 51.0, 38.0, 37.0, 53.0, 44.0, 43.0, 46.0, 47.0, 33.0, 33.0, 20.0, 24.0, 16.0, 24.0, 24.0, 12.0, 8.0, 17.0, 11.0, 9.0, 3.0, 9.0, 8.0, 7.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.94586181640625, -5.7315673828125, -5.51727294921875, -5.302978515625, -5.08868408203125, -4.8743896484375, -4.66009521484375, -4.44580078125, -4.23150634765625, -4.0172119140625, -3.80291748046875, -3.588623046875, -3.37432861328125, -3.1600341796875, -2.94573974609375, -2.7314453125, -2.51715087890625, -2.3028564453125, -2.08856201171875, -1.874267578125, -1.65997314453125, -1.4456787109375, -1.23138427734375, -1.01708984375, -0.80279541015625, -0.5885009765625, -0.37420654296875, -0.159912109375, 0.05438232421875, 0.2686767578125, 0.48297119140625, 0.697265625, 0.91156005859375, 1.1258544921875, 1.34014892578125, 1.554443359375, 1.76873779296875, 1.9830322265625, 2.19732666015625, 2.41162109375, 2.62591552734375, 2.8402099609375, 3.05450439453125, 3.268798828125, 3.48309326171875, 3.6973876953125, 3.91168212890625, 4.1259765625, 4.34027099609375, 4.5545654296875, 4.76885986328125, 4.983154296875, 5.19744873046875, 5.4117431640625, 5.62603759765625, 5.84033203125, 6.05462646484375, 6.2689208984375, 6.48321533203125, 6.697509765625, 6.91180419921875, 7.1260986328125, 7.34039306640625, 7.5546875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 10.0, 17.0, 24.0, 33.0, 56.0, 77.0, 134.0, 173.0, 287.0, 412.0, 597.0, 1046.0, 1639.0, 2806.0, 5106.0, 9686.0, 20031.0, 49262.0, 143822.0, 412992.0, 259237.0, 80918.0, 30315.0, 13569.0, 6745.0, 3802.0, 2101.0, 1295.0, 745.0, 517.0, 344.0, 211.0, 164.0, 99.0, 67.0, 42.0, 34.0, 20.0, 21.0, 20.0, 6.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.384765625, -3.27813720703125, -3.1715087890625, -3.06488037109375, -2.958251953125, -2.85162353515625, -2.7449951171875, -2.63836669921875, -2.53173828125, -2.42510986328125, -2.3184814453125, -2.21185302734375, -2.105224609375, -1.99859619140625, -1.8919677734375, -1.78533935546875, -1.6787109375, -1.57208251953125, -1.4654541015625, -1.35882568359375, -1.252197265625, -1.14556884765625, -1.0389404296875, -0.93231201171875, -0.82568359375, -0.71905517578125, -0.6124267578125, -0.50579833984375, -0.399169921875, -0.29254150390625, -0.1859130859375, -0.07928466796875, 0.02734375, 0.13397216796875, 0.2406005859375, 0.34722900390625, 0.453857421875, 0.56048583984375, 0.6671142578125, 0.77374267578125, 0.88037109375, 0.98699951171875, 1.0936279296875, 1.20025634765625, 1.306884765625, 1.41351318359375, 1.5201416015625, 1.62677001953125, 1.7333984375, 1.84002685546875, 1.9466552734375, 2.05328369140625, 2.159912109375, 2.26654052734375, 2.3731689453125, 2.47979736328125, 2.58642578125, 2.69305419921875, 2.7996826171875, 2.90631103515625, 3.012939453125, 3.11956787109375, 3.2261962890625, 3.33282470703125, 3.439453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 9.0, 13.0, 15.0, 20.0, 13.0, 22.0, 21.0, 28.0, 21.0, 29.0, 25.0, 39.0, 45.0, 33.0, 50.0, 49.0, 1077.0, 48.0, 49.0, 63.0, 43.0, 36.0, 37.0, 29.0, 35.0, 25.0, 25.0, 19.0, 25.0, 16.0, 13.0, 13.0, 9.0, 12.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.55078125, -5.3868408203125, -5.222900390625, -5.0589599609375, -4.89501953125, -4.7310791015625, -4.567138671875, -4.4031982421875, -4.2392578125, -4.0753173828125, -3.911376953125, -3.7474365234375, -3.58349609375, -3.4195556640625, -3.255615234375, -3.0916748046875, -2.927734375, -2.7637939453125, -2.599853515625, -2.4359130859375, -2.27197265625, -2.1080322265625, -1.944091796875, -1.7801513671875, -1.6162109375, -1.4522705078125, -1.288330078125, -1.1243896484375, -0.96044921875, -0.7965087890625, -0.632568359375, -0.4686279296875, -0.3046875, -0.1407470703125, 0.023193359375, 0.1871337890625, 0.35107421875, 0.5150146484375, 0.678955078125, 0.8428955078125, 1.0068359375, 1.1707763671875, 1.334716796875, 1.4986572265625, 1.66259765625, 1.8265380859375, 1.990478515625, 2.1544189453125, 2.318359375, 2.4822998046875, 2.646240234375, 2.8101806640625, 2.97412109375, 3.1380615234375, 3.302001953125, 3.4659423828125, 3.6298828125, 3.7938232421875, 3.957763671875, 4.1217041015625, 4.28564453125, 4.4495849609375, 4.613525390625, 4.7774658203125, 4.94140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 3.0, 8.0, 27.0, 23.0, 26.0, 52.0, 66.0, 87.0, 133.0, 258.0, 327.0, 598.0, 994.0, 1868.0, 3787.0, 9042.0, 30211.0, 189440.0, 1622658.0, 189820.0, 30631.0, 9000.0, 3709.0, 1802.0, 983.0, 604.0, 335.0, 203.0, 145.0, 93.0, 66.0, 37.0, 29.0, 17.0, 22.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.55889892578125, -3.4459228515625, -3.33294677734375, -3.219970703125, -3.10699462890625, -2.9940185546875, -2.88104248046875, -2.76806640625, -2.65509033203125, -2.5421142578125, -2.42913818359375, -2.316162109375, -2.20318603515625, -2.0902099609375, -1.97723388671875, -1.8642578125, -1.75128173828125, -1.6383056640625, -1.52532958984375, -1.412353515625, -1.29937744140625, -1.1864013671875, -1.07342529296875, -0.96044921875, -0.84747314453125, -0.7344970703125, -0.62152099609375, -0.508544921875, -0.39556884765625, -0.2825927734375, -0.16961669921875, -0.056640625, 0.05633544921875, 0.1693115234375, 0.28228759765625, 0.395263671875, 0.50823974609375, 0.6212158203125, 0.73419189453125, 0.84716796875, 0.96014404296875, 1.0731201171875, 1.18609619140625, 1.299072265625, 1.41204833984375, 1.5250244140625, 1.63800048828125, 1.7509765625, 1.86395263671875, 1.9769287109375, 2.08990478515625, 2.202880859375, 2.31585693359375, 2.4288330078125, 2.54180908203125, 2.65478515625, 2.76776123046875, 2.8807373046875, 2.99371337890625, 3.106689453125, 3.21966552734375, 3.3326416015625, 3.44561767578125, 3.55859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 6.0, 14.0, 18.0, 48.0, 65.0, 101.0, 184.0, 205.0, 125.0, 78.0, 50.0, 29.0, 21.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9663848876953125, -0.939605712890625, -0.9128265380859375, -0.88604736328125, -0.8592681884765625, -0.832489013671875, -0.8057098388671875, -0.7789306640625, -0.7521514892578125, -0.725372314453125, -0.6985931396484375, -0.67181396484375, -0.6450347900390625, -0.618255615234375, -0.5914764404296875, -0.564697265625, -0.5379180908203125, -0.511138916015625, -0.4843597412109375, -0.45758056640625, -0.4308013916015625, -0.404022216796875, -0.3772430419921875, -0.3504638671875, -0.3236846923828125, -0.296905517578125, -0.2701263427734375, -0.24334716796875, -0.2165679931640625, -0.189788818359375, -0.1630096435546875, -0.13623046875, -0.1094512939453125, -0.082672119140625, -0.0558929443359375, -0.02911376953125, -0.0023345947265625, 0.024444580078125, 0.0512237548828125, 0.0780029296875, 0.1047821044921875, 0.131561279296875, 0.1583404541015625, 0.18511962890625, 0.2118988037109375, 0.238677978515625, 0.2654571533203125, 0.292236328125, 0.3190155029296875, 0.345794677734375, 0.3725738525390625, 0.39935302734375, 0.4261322021484375, 0.452911376953125, 0.4796905517578125, 0.5064697265625, 0.5332489013671875, 0.560028076171875, 0.5868072509765625, 0.61358642578125, 0.6403656005859375, 0.667144775390625, 0.6939239501953125, 0.720703125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 13.0, 14.0, 17.0, 15.0, 36.0, 60.0, 91.0, 199.0, 841.0, 8261.0, 1001189.0, 35374.0, 1729.0, 319.0, 133.0, 74.0, 28.0, 29.0, 16.0, 16.0, 10.0, 7.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.7996826171875, -11.388427734375, -10.9771728515625, -10.56591796875, -10.1546630859375, -9.743408203125, -9.3321533203125, -8.9208984375, -8.5096435546875, -8.098388671875, -7.6871337890625, -7.27587890625, -6.8646240234375, -6.453369140625, -6.0421142578125, -5.630859375, -5.2196044921875, -4.808349609375, -4.3970947265625, -3.98583984375, -3.5745849609375, -3.163330078125, -2.7520751953125, -2.3408203125, -1.9295654296875, -1.518310546875, -1.1070556640625, -0.69580078125, -0.2845458984375, 0.126708984375, 0.5379638671875, 0.94921875, 1.3604736328125, 1.771728515625, 2.1829833984375, 2.59423828125, 3.0054931640625, 3.416748046875, 3.8280029296875, 4.2392578125, 4.6505126953125, 5.061767578125, 5.4730224609375, 5.88427734375, 6.2955322265625, 6.706787109375, 7.1180419921875, 7.529296875, 7.9405517578125, 8.351806640625, 8.7630615234375, 9.17431640625, 9.5855712890625, 9.996826171875, 10.4080810546875, 10.8193359375, 11.2305908203125, 11.641845703125, 12.0531005859375, 12.46435546875, 12.8756103515625, 13.286865234375, 13.6981201171875, 14.109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 18.0, 121.0, 453.0, 335.0, 72.0, 10.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4320948123931885, -3.308811902999878, -3.1855287551879883, -3.0622458457946777, -2.938962697982788, -2.8156797885894775, -2.692396640777588, -2.5691137313842773, -2.445830821990967, -2.3225479125976562, -2.1992647647857666, -2.075981855392456, -1.9526987075805664, -1.8294157981872559, -1.7061327695846558, -1.5828497409820557, -1.459566593170166, -1.336283564567566, -1.2130005359649658, -1.0897176265716553, -0.9664345383644104, -0.8431515097618103, -0.719868540763855, -0.5965855121612549, -0.4733024835586548, -0.3500194549560547, -0.22673645615577698, -0.10345345735549927, 0.01982957124710083, 0.14311259984970093, 0.26639556884765625, 0.38967859745025635, 0.5129618644714355, 0.6362448930740356, 0.7595279216766357, 0.8828108906745911, 1.006093978881836, 1.1293768882751465, 1.2526599168777466, 1.3759429454803467, 1.4992259740829468, 1.6225090026855469, 1.745792031288147, 1.869075059890747, 1.9923579692840576, 2.1156411170959473, 2.238924026489258, 2.3622069358825684, 2.485490083694458, 2.6087729930877686, 2.732056140899658, 2.8553390502929688, 2.9786221981048584, 3.101905107498169, 3.2251882553100586, 3.348471164703369, 3.4717540740966797, 3.5950369834899902, 3.71832013130188, 3.8416030406951904, 3.96488618850708, 4.088169097900391, 4.211452007293701, 4.334734916687012, 4.4580183029174805]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 11.0, 17.0, 13.0, 11.0, 15.0, 18.0, 15.0, 19.0, 30.0, 35.0, 33.0, 39.0, 29.0, 53.0, 37.0, 42.0, 34.0, 39.0, 38.0, 38.0, 45.0, 32.0, 38.0, 41.0, 29.0, 31.0, 40.0, 35.0, 14.0, 18.0, 14.0, 12.0, 10.0, 12.0, 9.0, 7.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5835478901863098, -0.5644182562828064, -0.5452886819839478, -0.5261590480804443, -0.5070294737815857, -0.48789986968040466, -0.46877026557922363, -0.4496406316757202, -0.4305110573768616, -0.41138145327568054, -0.3922518491744995, -0.3731222450733185, -0.35399264097213745, -0.3348630368709564, -0.3157334327697754, -0.296603798866272, -0.27747419476509094, -0.2583445906639099, -0.23921498656272888, -0.22008538246154785, -0.20095577836036682, -0.1818261742591858, -0.16269655525684357, -0.14356695115566254, -0.1244373470544815, -0.10530774295330048, -0.08617813885211945, -0.06704852730035782, -0.04791892319917679, -0.028789319097995758, -0.00965970754623413, 0.0094698965549469, 0.02859950065612793, 0.04772910475730896, 0.06685870885848999, 0.08598832041025162, 0.10511792451143265, 0.12424752861261368, 0.1433771401643753, 0.16250674426555634, 0.18163634836673737, 0.2007659524679184, 0.21989555656909943, 0.23902517557144165, 0.2581547796726227, 0.2772843837738037, 0.29641398787498474, 0.31554359197616577, 0.3346731960773468, 0.35380280017852783, 0.37293240427970886, 0.3920620083808899, 0.4111916124820709, 0.43032121658325195, 0.44945085048675537, 0.468580424785614, 0.48771005868911743, 0.5068396925926208, 0.5259692668914795, 0.5450989007949829, 0.5642284750938416, 0.583358108997345, 0.6024876832962036, 0.621617317199707, 0.6407468914985657]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 12.0, 18.0, 12.0, 17.0, 11.0, 17.0, 20.0, 31.0, 26.0, 24.0, 24.0, 34.0, 49.0, 43.0, 35.0, 42.0, 44.0, 47.0, 37.0, 39.0, 38.0, 51.0, 40.0, 37.0, 21.0, 16.0, 30.0, 24.0, 20.0, 18.0, 14.0, 17.0, 18.0, 13.0, 10.0, 12.0, 10.0, 2.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.92462158203125, -5.7125244140625, -5.50042724609375, -5.288330078125, -5.07623291015625, -4.8641357421875, -4.65203857421875, -4.43994140625, -4.22784423828125, -4.0157470703125, -3.80364990234375, -3.591552734375, -3.37945556640625, -3.1673583984375, -2.95526123046875, -2.7431640625, -2.53106689453125, -2.3189697265625, -2.10687255859375, -1.894775390625, -1.68267822265625, -1.4705810546875, -1.25848388671875, -1.04638671875, -0.83428955078125, -0.6221923828125, -0.41009521484375, -0.197998046875, 0.01409912109375, 0.2261962890625, 0.43829345703125, 0.650390625, 0.86248779296875, 1.0745849609375, 1.28668212890625, 1.498779296875, 1.71087646484375, 1.9229736328125, 2.13507080078125, 2.34716796875, 2.55926513671875, 2.7713623046875, 2.98345947265625, 3.195556640625, 3.40765380859375, 3.6197509765625, 3.83184814453125, 4.0439453125, 4.25604248046875, 4.4681396484375, 4.68023681640625, 4.892333984375, 5.10443115234375, 5.3165283203125, 5.52862548828125, 5.74072265625, 5.95281982421875, 6.1649169921875, 6.37701416015625, 6.589111328125, 6.80120849609375, 7.0133056640625, 7.22540283203125, 7.4375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 9.0, 5.0, 8.0, 17.0, 37.0, 30.0, 57.0, 83.0, 95.0, 165.0, 203.0, 307.0, 465.0, 718.0, 1036.0, 1624.0, 2693.0, 4331.0, 7510.0, 13491.0, 26725.0, 59337.0, 155511.0, 454401.0, 185552.0, 68358.0, 30032.0, 14859.0, 8234.0, 4739.0, 2777.0, 1625.0, 1127.0, 747.0, 487.0, 315.0, 261.0, 161.0, 111.0, 90.0, 60.0, 43.0, 28.0, 27.0, 17.0, 12.0, 11.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0078125, -7.737060546875, -7.46630859375, -7.195556640625, -6.9248046875, -6.654052734375, -6.38330078125, -6.112548828125, -5.841796875, -5.571044921875, -5.30029296875, -5.029541015625, -4.7587890625, -4.488037109375, -4.21728515625, -3.946533203125, -3.67578125, -3.405029296875, -3.13427734375, -2.863525390625, -2.5927734375, -2.322021484375, -2.05126953125, -1.780517578125, -1.509765625, -1.239013671875, -0.96826171875, -0.697509765625, -0.4267578125, -0.156005859375, 0.11474609375, 0.385498046875, 0.65625, 0.927001953125, 1.19775390625, 1.468505859375, 1.7392578125, 2.010009765625, 2.28076171875, 2.551513671875, 2.822265625, 3.093017578125, 3.36376953125, 3.634521484375, 3.9052734375, 4.176025390625, 4.44677734375, 4.717529296875, 4.98828125, 5.259033203125, 5.52978515625, 5.800537109375, 6.0712890625, 6.342041015625, 6.61279296875, 6.883544921875, 7.154296875, 7.425048828125, 7.69580078125, 7.966552734375, 8.2373046875, 8.508056640625, 8.77880859375, 9.049560546875, 9.3203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 11.0, 11.0, 8.0, 15.0, 19.0, 22.0, 35.0, 31.0, 37.0, 49.0, 52.0, 53.0, 79.0, 135.0, 242.0, 1477.0, 249.0, 103.0, 64.0, 48.0, 41.0, 49.0, 33.0, 31.0, 19.0, 22.0, 18.0, 19.0, 11.0, 14.0, 13.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.324951171875, -21.47802734375, -20.631103515625, -19.7841796875, -18.937255859375, -18.09033203125, -17.243408203125, -16.396484375, -15.549560546875, -14.70263671875, -13.855712890625, -13.0087890625, -12.161865234375, -11.31494140625, -10.468017578125, -9.62109375, -8.774169921875, -7.92724609375, -7.080322265625, -6.2333984375, -5.386474609375, -4.53955078125, -3.692626953125, -2.845703125, -1.998779296875, -1.15185546875, -0.304931640625, 0.5419921875, 1.388916015625, 2.23583984375, 3.082763671875, 3.9296875, 4.776611328125, 5.62353515625, 6.470458984375, 7.3173828125, 8.164306640625, 9.01123046875, 9.858154296875, 10.705078125, 11.552001953125, 12.39892578125, 13.245849609375, 14.0927734375, 14.939697265625, 15.78662109375, 16.633544921875, 17.48046875, 18.327392578125, 19.17431640625, 20.021240234375, 20.8681640625, 21.715087890625, 22.56201171875, 23.408935546875, 24.255859375, 25.102783203125, 25.94970703125, 26.796630859375, 27.6435546875, 28.490478515625, 29.33740234375, 30.184326171875, 31.03125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 12.0, 18.0, 30.0, 37.0, 81.0, 129.0, 236.0, 532.0, 1525.0, 18593.0, 3107898.0, 14141.0, 1391.0, 503.0, 234.0, 122.0, 78.0, 36.0, 23.0, 21.0, 18.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-116.8125, -113.21484375, -109.6171875, -106.01953125, -102.421875, -98.82421875, -95.2265625, -91.62890625, -88.03125, -84.43359375, -80.8359375, -77.23828125, -73.640625, -70.04296875, -66.4453125, -62.84765625, -59.25, -55.65234375, -52.0546875, -48.45703125, -44.859375, -41.26171875, -37.6640625, -34.06640625, -30.46875, -26.87109375, -23.2734375, -19.67578125, -16.078125, -12.48046875, -8.8828125, -5.28515625, -1.6875, 1.91015625, 5.5078125, 9.10546875, 12.703125, 16.30078125, 19.8984375, 23.49609375, 27.09375, 30.69140625, 34.2890625, 37.88671875, 41.484375, 45.08203125, 48.6796875, 52.27734375, 55.875, 59.47265625, 63.0703125, 66.66796875, 70.265625, 73.86328125, 77.4609375, 81.05859375, 84.65625, 88.25390625, 91.8515625, 95.44921875, 99.046875, 102.64453125, 106.2421875, 109.83984375, 113.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 5.0, 267.0, 688.0, 55.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.845659255981445, -22.082050323486328, -12.318439483642578, -2.554830551147461, 7.208780288696289, 16.97239112854004, 26.735998153686523, 36.499610900878906, 46.263221740722656, 56.026832580566406, 65.79044342041016, 75.55404663085938, 85.31765747070312, 95.08126831054688, 104.84487915039062, 114.60848999023438, 124.37210083007812, 134.13571166992188, 143.89932250976562, 153.66293334960938, 163.42654418945312, 173.19015502929688, 182.95376586914062, 192.71737670898438, 202.48097229003906, 212.2445831298828, 222.00819396972656, 231.7718048095703, 241.53541564941406, 251.2990264892578, 261.0626220703125, 270.82623291015625, 280.5898742675781, 290.3534851074219, 300.1170959472656, 309.8807067871094, 319.6443176269531, 329.4079284667969, 339.1715393066406, 348.9351501464844, 358.6987609863281, 368.4623718261719, 378.2259826660156, 387.9895935058594, 397.7532043457031, 407.5168151855469, 417.2804260253906, 427.0440368652344, 436.8076171875, 446.57122802734375, 456.3348388671875, 466.09844970703125, 475.862060546875, 485.62567138671875, 495.3892822265625, 505.15289306640625, 514.91650390625, 524.6801147460938, 534.4437255859375, 544.2073364257812, 553.970947265625, 563.7345581054688, 573.4981689453125, 583.2617797851562, 593.025390625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 13.0, 10.0, 13.0, 12.0, 13.0, 15.0, 20.0, 14.0, 18.0, 19.0, 20.0, 15.0, 27.0, 21.0, 38.0, 33.0, 38.0, 41.0, 35.0, 39.0, 38.0, 50.0, 30.0, 42.0, 41.0, 39.0, 27.0, 27.0, 19.0, 24.0, 20.0, 27.0, 17.0, 19.0, 15.0, 16.0, 18.0, 10.0, 11.0, 15.0, 12.0, 3.0, 6.0, 6.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-52.3376579284668, -50.684295654296875, -49.03093719482422, -47.3775749206543, -45.72421646118164, -44.07085418701172, -42.41749572753906, -40.76413345336914, -39.11077117919922, -37.4574089050293, -35.80405044555664, -34.15068817138672, -32.49732971191406, -30.84396743774414, -29.19060707092285, -27.537246704101562, -25.883886337280273, -24.230525970458984, -22.577165603637695, -20.923805236816406, -19.270442962646484, -17.617082595825195, -15.963722229003906, -14.3103609085083, -12.657000541687012, -11.003640174865723, -9.350278854370117, -7.696918487548828, -6.043557643890381, -4.390196800231934, -2.7368364334106445, -1.083475112915039, 0.56988525390625, 2.2232460975646973, 3.8766067028045654, 5.529967308044434, 7.183328151702881, 8.836688995361328, 10.490049362182617, 12.143410682678223, 13.796771049499512, 15.4501314163208, 17.103492736816406, 18.756853103637695, 20.410213470458984, 22.063575744628906, 23.716934204101562, 25.370296478271484, 27.023656845092773, 28.677017211914062, 30.33037757873535, 31.98373794555664, 33.63710021972656, 35.29045867919922, 36.94382095336914, 38.59718322753906, 40.25054168701172, 41.90390396118164, 43.5572624206543, 45.21062469482422, 46.863983154296875, 48.5173454284668, 50.17070770263672, 51.824066162109375, 53.4774284362793]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 7.0, 7.0, 11.0, 10.0, 14.0, 15.0, 17.0, 17.0, 21.0, 21.0, 18.0, 30.0, 30.0, 31.0, 34.0, 37.0, 37.0, 36.0, 33.0, 45.0, 41.0, 41.0, 35.0, 35.0, 42.0, 36.0, 30.0, 27.0, 26.0, 31.0, 20.0, 19.0, 29.0, 13.0, 17.0, 11.0, 13.0, 13.0, 5.0, 14.0, 5.0, 3.0, 4.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.58203125, -6.3740234375, -6.166015625, -5.9580078125, -5.75, -5.5419921875, -5.333984375, -5.1259765625, -4.91796875, -4.7099609375, -4.501953125, -4.2939453125, -4.0859375, -3.8779296875, -3.669921875, -3.4619140625, -3.25390625, -3.0458984375, -2.837890625, -2.6298828125, -2.421875, -2.2138671875, -2.005859375, -1.7978515625, -1.58984375, -1.3818359375, -1.173828125, -0.9658203125, -0.7578125, -0.5498046875, -0.341796875, -0.1337890625, 0.07421875, 0.2822265625, 0.490234375, 0.6982421875, 0.90625, 1.1142578125, 1.322265625, 1.5302734375, 1.73828125, 1.9462890625, 2.154296875, 2.3623046875, 2.5703125, 2.7783203125, 2.986328125, 3.1943359375, 3.40234375, 3.6103515625, 3.818359375, 4.0263671875, 4.234375, 4.4423828125, 4.650390625, 4.8583984375, 5.06640625, 5.2744140625, 5.482421875, 5.6904296875, 5.8984375, 6.1064453125, 6.314453125, 6.5224609375, 6.73046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 11.0, 12.0, 23.0, 40.0, 39.0, 63.0, 83.0, 138.0, 194.0, 309.0, 455.0, 684.0, 1179.0, 1804.0, 3045.0, 5493.0, 10450.0, 23529.0, 71818.0, 387312.0, 1901670.0, 1445027.0, 248396.0, 52538.0, 19220.0, 8860.0, 4821.0, 2708.0, 1565.0, 1021.0, 619.0, 402.0, 236.0, 145.0, 105.0, 81.0, 52.0, 38.0, 28.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 0.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-12.3046875, -11.9415283203125, -11.578369140625, -11.2152099609375, -10.85205078125, -10.4888916015625, -10.125732421875, -9.7625732421875, -9.3994140625, -9.0362548828125, -8.673095703125, -8.3099365234375, -7.94677734375, -7.5836181640625, -7.220458984375, -6.8572998046875, -6.494140625, -6.1309814453125, -5.767822265625, -5.4046630859375, -5.04150390625, -4.6783447265625, -4.315185546875, -3.9520263671875, -3.5888671875, -3.2257080078125, -2.862548828125, -2.4993896484375, -2.13623046875, -1.7730712890625, -1.409912109375, -1.0467529296875, -0.68359375, -0.3204345703125, 0.042724609375, 0.4058837890625, 0.76904296875, 1.1322021484375, 1.495361328125, 1.8585205078125, 2.2216796875, 2.5848388671875, 2.947998046875, 3.3111572265625, 3.67431640625, 4.0374755859375, 4.400634765625, 4.7637939453125, 5.126953125, 5.4901123046875, 5.853271484375, 6.2164306640625, 6.57958984375, 6.9427490234375, 7.305908203125, 7.6690673828125, 8.0322265625, 8.3953857421875, 8.758544921875, 9.1217041015625, 9.48486328125, 9.8480224609375, 10.211181640625, 10.5743408203125, 10.9375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 9.0, 14.0, 17.0, 10.0, 13.0, 27.0, 28.0, 50.0, 57.0, 69.0, 84.0, 142.0, 211.0, 293.0, 487.0, 549.0, 565.0, 431.0, 302.0, 187.0, 125.0, 93.0, 91.0, 47.0, 31.0, 27.0, 15.0, 15.0, 12.0, 7.0, 10.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1171875, -12.7183837890625, -12.319580078125, -11.9207763671875, -11.52197265625, -11.1231689453125, -10.724365234375, -10.3255615234375, -9.9267578125, -9.5279541015625, -9.129150390625, -8.7303466796875, -8.33154296875, -7.9327392578125, -7.533935546875, -7.1351318359375, -6.736328125, -6.3375244140625, -5.938720703125, -5.5399169921875, -5.14111328125, -4.7423095703125, -4.343505859375, -3.9447021484375, -3.5458984375, -3.1470947265625, -2.748291015625, -2.3494873046875, -1.95068359375, -1.5518798828125, -1.153076171875, -0.7542724609375, -0.35546875, 0.0433349609375, 0.442138671875, 0.8409423828125, 1.23974609375, 1.6385498046875, 2.037353515625, 2.4361572265625, 2.8349609375, 3.2337646484375, 3.632568359375, 4.0313720703125, 4.43017578125, 4.8289794921875, 5.227783203125, 5.6265869140625, 6.025390625, 6.4241943359375, 6.822998046875, 7.2218017578125, 7.62060546875, 8.0194091796875, 8.418212890625, 8.8170166015625, 9.2158203125, 9.6146240234375, 10.013427734375, 10.4122314453125, 10.81103515625, 11.2098388671875, 11.608642578125, 12.0074462890625, 12.40625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 11.0, 14.0, 16.0, 13.0, 24.0, 35.0, 39.0, 77.0, 94.0, 157.0, 295.0, 889.0, 3739.0, 26556.0, 804861.0, 3283328.0, 65086.0, 6659.0, 1352.0, 428.0, 180.0, 101.0, 58.0, 54.0, 46.0, 32.0, 24.0, 10.0, 13.0, 14.0, 13.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.03125, -39.71484375, -38.3984375, -37.08203125, -35.765625, -34.44921875, -33.1328125, -31.81640625, -30.5, -29.18359375, -27.8671875, -26.55078125, -25.234375, -23.91796875, -22.6015625, -21.28515625, -19.96875, -18.65234375, -17.3359375, -16.01953125, -14.703125, -13.38671875, -12.0703125, -10.75390625, -9.4375, -8.12109375, -6.8046875, -5.48828125, -4.171875, -2.85546875, -1.5390625, -0.22265625, 1.09375, 2.41015625, 3.7265625, 5.04296875, 6.359375, 7.67578125, 8.9921875, 10.30859375, 11.625, 12.94140625, 14.2578125, 15.57421875, 16.890625, 18.20703125, 19.5234375, 20.83984375, 22.15625, 23.47265625, 24.7890625, 26.10546875, 27.421875, 28.73828125, 30.0546875, 31.37109375, 32.6875, 34.00390625, 35.3203125, 36.63671875, 37.953125, 39.26953125, 40.5859375, 41.90234375, 43.21875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 15.0, 49.0, 70.0, 153.0, 230.0, 188.0, 150.0, 70.0, 41.0, 22.0, 10.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-186.3714599609375, -182.85475158691406, -179.33802795410156, -175.82131958007812, -172.30459594726562, -168.7878875732422, -165.27117919921875, -161.75445556640625, -158.2377471923828, -154.72103881835938, -151.20431518554688, -147.68760681152344, -144.17088317871094, -140.6541748046875, -137.137451171875, -133.62074279785156, -130.10403442382812, -126.58731842041016, -123.07060241699219, -119.55389404296875, -116.03717803955078, -112.52046203613281, -109.00374603271484, -105.48703002929688, -101.97030639648438, -98.4535903930664, -94.93687438964844, -91.420166015625, -87.90345001220703, -84.38673400878906, -80.8700180053711, -77.35330200195312, -73.83660125732422, -70.31988525390625, -66.80316925048828, -63.28645706176758, -59.769744873046875, -56.253028869628906, -52.73631286621094, -49.21959686279297, -45.702884674072266, -42.1861686706543, -38.669456481933594, -35.152740478515625, -31.63602638244629, -28.119312286376953, -24.602596282958984, -21.08588218688965, -17.569168090820312, -14.052453994750977, -10.535738945007324, -7.019023895263672, -3.502309799194336, 0.014404296875, 3.5311203002929688, 7.047834396362305, 10.56454849243164, 14.081262588500977, 17.597976684570312, 21.11469268798828, 24.631406784057617, 28.148120880126953, 31.664836883544922, 35.181549072265625, 38.698265075683594]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 7.0, 6.0, 11.0, 8.0, 16.0, 20.0, 27.0, 21.0, 14.0, 22.0, 29.0, 26.0, 37.0, 33.0, 42.0, 43.0, 40.0, 49.0, 28.0, 42.0, 39.0, 28.0, 39.0, 29.0, 37.0, 25.0, 33.0, 27.0, 31.0, 28.0, 30.0, 24.0, 21.0, 21.0, 16.0, 6.0, 4.0, 6.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-43.047080993652344, -41.76441955566406, -40.481754302978516, -39.199092864990234, -37.91642761230469, -36.633766174316406, -35.35110092163086, -34.06843948364258, -32.78577423095703, -31.503110885620117, -30.220447540283203, -28.93778419494629, -27.655120849609375, -26.372459411621094, -25.08979606628418, -23.807132720947266, -22.524471282958984, -21.24180793762207, -19.959144592285156, -18.676481246948242, -17.393817901611328, -16.111156463623047, -14.828493118286133, -13.545829772949219, -12.263166427612305, -10.98050308227539, -9.697839736938477, -8.415177345275879, -7.132513999938965, -5.849850654602051, -4.567187786102295, -3.284524917602539, -2.0018653869628906, -0.7192022800445557, 0.5634608268737793, 1.8461239337921143, 3.128787040710449, 4.411450386047363, 5.694113254547119, 6.976776123046875, 8.259439468383789, 9.542102813720703, 10.824766159057617, 12.107428550720215, 13.390091896057129, 14.672755241394043, 15.95541763305664, 17.238080978393555, 18.52074432373047, 19.803407669067383, 21.086071014404297, 22.36873435974121, 23.651397705078125, 24.934059143066406, 26.21672248840332, 27.499385833740234, 28.78204917907715, 30.064712524414062, 31.347375869750977, 32.63003921508789, 33.91270065307617, 35.19536590576172, 36.47802734375, 37.76068878173828, 39.04335403442383]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 20.0, 20.0, 16.0, 18.0, 26.0, 30.0, 39.0, 40.0, 35.0, 44.0, 42.0, 44.0, 36.0, 58.0, 37.0, 42.0, 45.0, 42.0, 33.0, 29.0, 31.0, 23.0, 32.0, 22.0, 10.0, 21.0, 20.0, 18.0, 16.0, 11.0, 13.0, 9.0, 8.0, 2.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-7.27734375, -7.06268310546875, -6.8480224609375, -6.63336181640625, -6.418701171875, -6.20404052734375, -5.9893798828125, -5.77471923828125, -5.56005859375, -5.34539794921875, -5.1307373046875, -4.91607666015625, -4.701416015625, -4.48675537109375, -4.2720947265625, -4.05743408203125, -3.8427734375, -3.62811279296875, -3.4134521484375, -3.19879150390625, -2.984130859375, -2.76947021484375, -2.5548095703125, -2.34014892578125, -2.12548828125, -1.91082763671875, -1.6961669921875, -1.48150634765625, -1.266845703125, -1.05218505859375, -0.8375244140625, -0.62286376953125, -0.408203125, -0.19354248046875, 0.0211181640625, 0.23577880859375, 0.450439453125, 0.66510009765625, 0.8797607421875, 1.09442138671875, 1.30908203125, 1.52374267578125, 1.7384033203125, 1.95306396484375, 2.167724609375, 2.38238525390625, 2.5970458984375, 2.81170654296875, 3.0263671875, 3.24102783203125, 3.4556884765625, 3.67034912109375, 3.885009765625, 4.09967041015625, 4.3143310546875, 4.52899169921875, 4.74365234375, 4.95831298828125, 5.1729736328125, 5.38763427734375, 5.602294921875, 5.81695556640625, 6.0316162109375, 6.24627685546875, 6.4609375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 22.0, 15.0, 42.0, 55.0, 65.0, 88.0, 129.0, 184.0, 241.0, 395.0, 545.0, 797.0, 1168.0, 1886.0, 3054.0, 5290.0, 10251.0, 22556.0, 57961.0, 179578.0, 418661.0, 221286.0, 70482.0, 26373.0, 11801.0, 5933.0, 3386.0, 2046.0, 1358.0, 850.0, 580.0, 400.0, 253.0, 210.0, 153.0, 110.0, 79.0, 60.0, 40.0, 35.0, 26.0, 18.0, 14.0, 12.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0], "bins": [-3.091796875, -2.999755859375, -2.90771484375, -2.815673828125, -2.7236328125, -2.631591796875, -2.53955078125, -2.447509765625, -2.35546875, -2.263427734375, -2.17138671875, -2.079345703125, -1.9873046875, -1.895263671875, -1.80322265625, -1.711181640625, -1.619140625, -1.527099609375, -1.43505859375, -1.343017578125, -1.2509765625, -1.158935546875, -1.06689453125, -0.974853515625, -0.8828125, -0.790771484375, -0.69873046875, -0.606689453125, -0.5146484375, -0.422607421875, -0.33056640625, -0.238525390625, -0.146484375, -0.054443359375, 0.03759765625, 0.129638671875, 0.2216796875, 0.313720703125, 0.40576171875, 0.497802734375, 0.58984375, 0.681884765625, 0.77392578125, 0.865966796875, 0.9580078125, 1.050048828125, 1.14208984375, 1.234130859375, 1.326171875, 1.418212890625, 1.51025390625, 1.602294921875, 1.6943359375, 1.786376953125, 1.87841796875, 1.970458984375, 2.0625, 2.154541015625, 2.24658203125, 2.338623046875, 2.4306640625, 2.522705078125, 2.61474609375, 2.706787109375, 2.798828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 6.0, 8.0, 7.0, 14.0, 20.0, 10.0, 11.0, 15.0, 19.0, 21.0, 20.0, 21.0, 28.0, 29.0, 23.0, 38.0, 42.0, 38.0, 38.0, 39.0, 37.0, 1058.0, 48.0, 46.0, 35.0, 29.0, 40.0, 34.0, 31.0, 24.0, 27.0, 25.0, 27.0, 19.0, 19.0, 18.0, 11.0, 10.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0], "bins": [-5.09765625, -4.94952392578125, -4.8013916015625, -4.65325927734375, -4.505126953125, -4.35699462890625, -4.2088623046875, -4.06072998046875, -3.91259765625, -3.76446533203125, -3.6163330078125, -3.46820068359375, -3.320068359375, -3.17193603515625, -3.0238037109375, -2.87567138671875, -2.7275390625, -2.57940673828125, -2.4312744140625, -2.28314208984375, -2.135009765625, -1.98687744140625, -1.8387451171875, -1.69061279296875, -1.54248046875, -1.39434814453125, -1.2462158203125, -1.09808349609375, -0.949951171875, -0.80181884765625, -0.6536865234375, -0.50555419921875, -0.357421875, -0.20928955078125, -0.0611572265625, 0.08697509765625, 0.235107421875, 0.38323974609375, 0.5313720703125, 0.67950439453125, 0.82763671875, 0.97576904296875, 1.1239013671875, 1.27203369140625, 1.420166015625, 1.56829833984375, 1.7164306640625, 1.86456298828125, 2.0126953125, 2.16082763671875, 2.3089599609375, 2.45709228515625, 2.605224609375, 2.75335693359375, 2.9014892578125, 3.04962158203125, 3.19775390625, 3.34588623046875, 3.4940185546875, 3.64215087890625, 3.790283203125, 3.93841552734375, 4.0865478515625, 4.23468017578125, 4.3828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 7.0, 2.0, 9.0, 14.0, 19.0, 26.0, 40.0, 54.0, 81.0, 105.0, 146.0, 229.0, 371.0, 634.0, 1041.0, 1901.0, 3298.0, 6499.0, 14090.0, 39289.0, 172693.0, 1419835.0, 336915.0, 62006.0, 19574.0, 8470.0, 4152.0, 2274.0, 1251.0, 759.0, 443.0, 280.0, 197.0, 113.0, 88.0, 55.0, 50.0, 29.0, 20.0, 17.0, 13.0, 10.0, 17.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.841796875, -2.75482177734375, -2.6678466796875, -2.58087158203125, -2.493896484375, -2.40692138671875, -2.3199462890625, -2.23297119140625, -2.14599609375, -2.05902099609375, -1.9720458984375, -1.88507080078125, -1.798095703125, -1.71112060546875, -1.6241455078125, -1.53717041015625, -1.4501953125, -1.36322021484375, -1.2762451171875, -1.18927001953125, -1.102294921875, -1.01531982421875, -0.9283447265625, -0.84136962890625, -0.75439453125, -0.66741943359375, -0.5804443359375, -0.49346923828125, -0.406494140625, -0.31951904296875, -0.2325439453125, -0.14556884765625, -0.05859375, 0.02838134765625, 0.1153564453125, 0.20233154296875, 0.289306640625, 0.37628173828125, 0.4632568359375, 0.55023193359375, 0.63720703125, 0.72418212890625, 0.8111572265625, 0.89813232421875, 0.985107421875, 1.07208251953125, 1.1590576171875, 1.24603271484375, 1.3330078125, 1.41998291015625, 1.5069580078125, 1.59393310546875, 1.680908203125, 1.76788330078125, 1.8548583984375, 1.94183349609375, 2.02880859375, 2.11578369140625, 2.2027587890625, 2.28973388671875, 2.376708984375, 2.46368408203125, 2.5506591796875, 2.63763427734375, 2.724609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 9.0, 6.0, 9.0, 6.0, 10.0, 18.0, 23.0, 66.0, 74.0, 144.0, 252.0, 129.0, 74.0, 54.0, 27.0, 22.0, 9.0, 7.0, 9.0, 6.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.927734375, -0.897125244140625, -0.86651611328125, -0.835906982421875, -0.8052978515625, -0.774688720703125, -0.74407958984375, -0.713470458984375, -0.682861328125, -0.652252197265625, -0.62164306640625, -0.591033935546875, -0.5604248046875, -0.529815673828125, -0.49920654296875, -0.468597412109375, -0.43798828125, -0.407379150390625, -0.37677001953125, -0.346160888671875, -0.3155517578125, -0.284942626953125, -0.25433349609375, -0.223724365234375, -0.193115234375, -0.162506103515625, -0.13189697265625, -0.101287841796875, -0.0706787109375, -0.040069580078125, -0.00946044921875, 0.021148681640625, 0.0517578125, 0.082366943359375, 0.11297607421875, 0.143585205078125, 0.1741943359375, 0.204803466796875, 0.23541259765625, 0.266021728515625, 0.296630859375, 0.327239990234375, 0.35784912109375, 0.388458251953125, 0.4190673828125, 0.449676513671875, 0.48028564453125, 0.510894775390625, 0.54150390625, 0.572113037109375, 0.60272216796875, 0.633331298828125, 0.6639404296875, 0.694549560546875, 0.72515869140625, 0.755767822265625, 0.786376953125, 0.816986083984375, 0.84759521484375, 0.878204345703125, 0.9088134765625, 0.939422607421875, 0.97003173828125, 1.000640869140625, 1.03125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 4.0, 13.0, 10.0, 21.0, 20.0, 24.0, 37.0, 40.0, 74.0, 89.0, 148.0, 372.0, 2973.0, 65509.0, 968625.0, 9176.0, 773.0, 196.0, 130.0, 43.0, 53.0, 40.0, 27.0, 25.0, 15.0, 15.0, 12.0, 12.0, 11.0, 5.0, 3.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.8828125, -14.44775390625, -14.0126953125, -13.57763671875, -13.142578125, -12.70751953125, -12.2724609375, -11.83740234375, -11.40234375, -10.96728515625, -10.5322265625, -10.09716796875, -9.662109375, -9.22705078125, -8.7919921875, -8.35693359375, -7.921875, -7.48681640625, -7.0517578125, -6.61669921875, -6.181640625, -5.74658203125, -5.3115234375, -4.87646484375, -4.44140625, -4.00634765625, -3.5712890625, -3.13623046875, -2.701171875, -2.26611328125, -1.8310546875, -1.39599609375, -0.9609375, -0.52587890625, -0.0908203125, 0.34423828125, 0.779296875, 1.21435546875, 1.6494140625, 2.08447265625, 2.51953125, 2.95458984375, 3.3896484375, 3.82470703125, 4.259765625, 4.69482421875, 5.1298828125, 5.56494140625, 6.0, 6.43505859375, 6.8701171875, 7.30517578125, 7.740234375, 8.17529296875, 8.6103515625, 9.04541015625, 9.48046875, 9.91552734375, 10.3505859375, 10.78564453125, 11.220703125, 11.65576171875, 12.0908203125, 12.52587890625, 12.9609375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 18.0, 97.0, 467.0, 362.0, 58.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.233728408813477, -4.069983005523682, -3.9062376022338867, -3.742492198944092, -3.578746795654297, -3.415001392364502, -3.251255989074707, -3.087510585784912, -2.923765182495117, -2.7600197792053223, -2.5962743759155273, -2.4325289726257324, -2.2687835693359375, -2.1050381660461426, -1.941292643547058, -1.7775472402572632, -1.6138017177581787, -1.4500563144683838, -1.2863109111785889, -1.122565507888794, -0.9588200449943542, -0.7950746417045593, -0.6313291788101196, -0.4675837755203247, -0.3038383722305298, -0.14009295403957367, 0.023652464151382446, 0.18739789724349976, 0.3511433005332947, 0.5148887038230896, 0.6786341667175293, 0.8423795700073242, 1.0061249732971191, 1.169870376586914, 1.333615779876709, 1.497361183166504, 1.6611065864562988, 1.8248519897460938, 1.9885975122451782, 2.1523427963256836, 2.3160881996154785, 2.4798336029052734, 2.6435790061950684, 2.8073244094848633, 2.971069812774658, 3.134815216064453, 3.298560619354248, 3.462306022644043, 3.626051664352417, 3.789797067642212, 3.953542470932007, 4.117288112640381, 4.281033515930176, 4.444778919219971, 4.608524322509766, 4.7722697257995605, 4.9360151290893555, 5.09976053237915, 5.263505935668945, 5.42725133895874, 5.590996742248535, 5.75474214553833, 5.918487548828125, 6.08223295211792, 6.245978355407715]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 17.0, 18.0, 20.0, 31.0, 22.0, 29.0, 23.0, 34.0, 29.0, 30.0, 46.0, 39.0, 41.0, 50.0, 44.0, 49.0, 37.0, 45.0, 36.0, 34.0, 43.0, 40.0, 38.0, 34.0, 22.0, 25.0, 21.0, 11.0, 6.0, 6.0, 6.0, 4.0, 2.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.9355704188346863, -0.9113280177116394, -0.8870856165885925, -0.8628432154655457, -0.8386008143424988, -0.8143584132194519, -0.7901160717010498, -0.7658736705780029, -0.741631269454956, -0.7173888683319092, -0.6931464672088623, -0.6689040660858154, -0.6446616649627686, -0.6204192638397217, -0.5961768627166748, -0.5719344615936279, -0.547692060470581, -0.5234496593475342, -0.4992072582244873, -0.47496485710144043, -0.45072245597839355, -0.4264800548553467, -0.4022376835346222, -0.3779952824115753, -0.35375288128852844, -0.32951048016548157, -0.3052680790424347, -0.2810257077217102, -0.25678330659866333, -0.23254089057445526, -0.20829850435256958, -0.1840561032295227, -0.15981364250183105, -0.13557124137878418, -0.1113288477063179, -0.08708645403385162, -0.06284405291080475, -0.038601651787757874, -0.014359265565872192, 0.009883135557174683, 0.03412553668022156, 0.058367934077978134, 0.08261033147573471, 0.10685272514820099, 0.13109512627124786, 0.15533752739429474, 0.17957991361618042, 0.2038223147392273, 0.22806471586227417, 0.25230711698532104, 0.2765495181083679, 0.3007919192314148, 0.32503432035446167, 0.34927672147750854, 0.37351909279823303, 0.3977614939212799, 0.4220038950443268, 0.44624629616737366, 0.47048869729042053, 0.494731068611145, 0.5189734697341919, 0.5432158708572388, 0.5674582719802856, 0.5917006731033325, 0.6159430742263794]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 14.0, 6.0, 15.0, 15.0, 21.0, 13.0, 23.0, 21.0, 30.0, 24.0, 35.0, 42.0, 31.0, 43.0, 45.0, 39.0, 41.0, 41.0, 45.0, 37.0, 36.0, 41.0, 34.0, 36.0, 29.0, 26.0, 19.0, 19.0, 18.0, 24.0, 16.0, 12.0, 24.0, 19.0, 17.0, 8.0, 3.0, 8.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.89453125, -6.6868896484375, -6.479248046875, -6.2716064453125, -6.06396484375, -5.8563232421875, -5.648681640625, -5.4410400390625, -5.2333984375, -5.0257568359375, -4.818115234375, -4.6104736328125, -4.40283203125, -4.1951904296875, -3.987548828125, -3.7799072265625, -3.572265625, -3.3646240234375, -3.156982421875, -2.9493408203125, -2.74169921875, -2.5340576171875, -2.326416015625, -2.1187744140625, -1.9111328125, -1.7034912109375, -1.495849609375, -1.2882080078125, -1.08056640625, -0.8729248046875, -0.665283203125, -0.4576416015625, -0.25, -0.0423583984375, 0.165283203125, 0.3729248046875, 0.58056640625, 0.7882080078125, 0.995849609375, 1.2034912109375, 1.4111328125, 1.6187744140625, 1.826416015625, 2.0340576171875, 2.24169921875, 2.4493408203125, 2.656982421875, 2.8646240234375, 3.072265625, 3.2799072265625, 3.487548828125, 3.6951904296875, 3.90283203125, 4.1104736328125, 4.318115234375, 4.5257568359375, 4.7333984375, 4.9410400390625, 5.148681640625, 5.3563232421875, 5.56396484375, 5.7716064453125, 5.979248046875, 6.1868896484375, 6.39453125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 8.0, 14.0, 21.0, 32.0, 38.0, 45.0, 65.0, 93.0, 135.0, 198.0, 230.0, 335.0, 450.0, 657.0, 1002.0, 1506.0, 2346.0, 3994.0, 7110.0, 13138.0, 26401.0, 59939.0, 184718.0, 480147.0, 158206.0, 54143.0, 24192.0, 12171.0, 6532.0, 3788.0, 2331.0, 1431.0, 878.0, 642.0, 436.0, 330.0, 215.0, 153.0, 122.0, 100.0, 60.0, 64.0, 37.0, 30.0, 13.0, 18.0, 16.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.9609375, -10.6331787109375, -10.305419921875, -9.9776611328125, -9.64990234375, -9.3221435546875, -8.994384765625, -8.6666259765625, -8.3388671875, -8.0111083984375, -7.683349609375, -7.3555908203125, -7.02783203125, -6.7000732421875, -6.372314453125, -6.0445556640625, -5.716796875, -5.3890380859375, -5.061279296875, -4.7335205078125, -4.40576171875, -4.0780029296875, -3.750244140625, -3.4224853515625, -3.0947265625, -2.7669677734375, -2.439208984375, -2.1114501953125, -1.78369140625, -1.4559326171875, -1.128173828125, -0.8004150390625, -0.47265625, -0.1448974609375, 0.182861328125, 0.5106201171875, 0.83837890625, 1.1661376953125, 1.493896484375, 1.8216552734375, 2.1494140625, 2.4771728515625, 2.804931640625, 3.1326904296875, 3.46044921875, 3.7882080078125, 4.115966796875, 4.4437255859375, 4.771484375, 5.0992431640625, 5.427001953125, 5.7547607421875, 6.08251953125, 6.4102783203125, 6.738037109375, 7.0657958984375, 7.3935546875, 7.7213134765625, 8.049072265625, 8.3768310546875, 8.70458984375, 9.0323486328125, 9.360107421875, 9.6878662109375, 10.015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 3.0, 8.0, 12.0, 16.0, 17.0, 18.0, 29.0, 27.0, 20.0, 44.0, 36.0, 47.0, 43.0, 51.0, 55.0, 86.0, 164.0, 336.0, 1370.0, 171.0, 82.0, 51.0, 35.0, 39.0, 37.0, 33.0, 34.0, 27.0, 21.0, 18.0, 14.0, 15.0, 14.0, 7.0, 8.0, 19.0, 6.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.96875, -22.273193359375, -21.57763671875, -20.882080078125, -20.1865234375, -19.490966796875, -18.79541015625, -18.099853515625, -17.404296875, -16.708740234375, -16.01318359375, -15.317626953125, -14.6220703125, -13.926513671875, -13.23095703125, -12.535400390625, -11.83984375, -11.144287109375, -10.44873046875, -9.753173828125, -9.0576171875, -8.362060546875, -7.66650390625, -6.970947265625, -6.275390625, -5.579833984375, -4.88427734375, -4.188720703125, -3.4931640625, -2.797607421875, -2.10205078125, -1.406494140625, -0.7109375, -0.015380859375, 0.68017578125, 1.375732421875, 2.0712890625, 2.766845703125, 3.46240234375, 4.157958984375, 4.853515625, 5.549072265625, 6.24462890625, 6.940185546875, 7.6357421875, 8.331298828125, 9.02685546875, 9.722412109375, 10.41796875, 11.113525390625, 11.80908203125, 12.504638671875, 13.2001953125, 13.895751953125, 14.59130859375, 15.286865234375, 15.982421875, 16.677978515625, 17.37353515625, 18.069091796875, 18.7646484375, 19.460205078125, 20.15576171875, 20.851318359375, 21.546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 13.0, 6.0, 14.0, 16.0, 20.0, 25.0, 23.0, 30.0, 45.0, 40.0, 66.0, 89.0, 113.0, 149.0, 234.0, 499.0, 1711.0, 10670.0, 239140.0, 2844217.0, 41985.0, 4476.0, 915.0, 342.0, 202.0, 154.0, 108.0, 75.0, 64.0, 33.0, 42.0, 41.0, 30.0, 18.0, 19.0, 11.0, 10.0, 11.0, 7.0, 2.0, 5.0, 6.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-52.65625, -51.07373046875, -49.4912109375, -47.90869140625, -46.326171875, -44.74365234375, -43.1611328125, -41.57861328125, -39.99609375, -38.41357421875, -36.8310546875, -35.24853515625, -33.666015625, -32.08349609375, -30.5009765625, -28.91845703125, -27.3359375, -25.75341796875, -24.1708984375, -22.58837890625, -21.005859375, -19.42333984375, -17.8408203125, -16.25830078125, -14.67578125, -13.09326171875, -11.5107421875, -9.92822265625, -8.345703125, -6.76318359375, -5.1806640625, -3.59814453125, -2.015625, -0.43310546875, 1.1494140625, 2.73193359375, 4.314453125, 5.89697265625, 7.4794921875, 9.06201171875, 10.64453125, 12.22705078125, 13.8095703125, 15.39208984375, 16.974609375, 18.55712890625, 20.1396484375, 21.72216796875, 23.3046875, 24.88720703125, 26.4697265625, 28.05224609375, 29.634765625, 31.21728515625, 32.7998046875, 34.38232421875, 35.96484375, 37.54736328125, 39.1298828125, 40.71240234375, 42.294921875, 43.87744140625, 45.4599609375, 47.04248046875, 48.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 60.0, 277.0, 474.0, 164.0, 30.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.5859432220459, -25.71642303466797, -20.846904754638672, -15.977384567260742, -11.107864379882812, -6.238344192504883, -1.368825912475586, 3.5006961822509766, 8.370214462280273, 13.239734649658203, 18.1092529296875, 22.97877311706543, 27.84829330444336, 32.717811584472656, 37.58733367919922, 42.45685577392578, 47.32637023925781, 52.19588851928711, 57.06541061401367, 61.93492889404297, 66.80445098876953, 71.67396545410156, 76.54348754882812, 81.41300964355469, 86.28253173828125, 91.15205383300781, 96.02156829833984, 100.8910903930664, 105.76061248779297, 110.630126953125, 115.49964904785156, 120.36917114257812, 125.23869323730469, 130.10821533203125, 134.9777374267578, 139.84725952148438, 144.71676635742188, 149.58628845214844, 154.455810546875, 159.32533264160156, 164.19485473632812, 169.0643768310547, 173.93389892578125, 178.80340576171875, 183.6729278564453, 188.54244995117188, 193.41197204589844, 198.281494140625, 203.1510009765625, 208.02052307128906, 212.89004516601562, 217.75955200195312, 222.6290740966797, 227.49859619140625, 232.3681182861328, 237.23764038085938, 242.10716247558594, 246.9766845703125, 251.84620666503906, 256.7157287597656, 261.5852355957031, 266.45477294921875, 271.32427978515625, 276.19378662109375, 281.0633239746094]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 18.0, 11.0, 12.0, 18.0, 17.0, 22.0, 24.0, 26.0, 27.0, 20.0, 30.0, 35.0, 36.0, 36.0, 39.0, 47.0, 48.0, 43.0, 46.0, 33.0, 55.0, 28.0, 31.0, 29.0, 26.0, 24.0, 32.0, 22.0, 19.0, 18.0, 18.0, 17.0, 11.0, 6.0, 12.0, 13.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-55.228755950927734, -53.60174560546875, -51.974735260009766, -50.34772491455078, -48.72071838378906, -47.09370422363281, -45.466697692871094, -43.83968734741211, -42.212677001953125, -40.58566665649414, -38.958656311035156, -37.33164596557617, -35.70463562011719, -34.07762908935547, -32.450618743896484, -30.8236083984375, -29.196598052978516, -27.56958770751953, -25.942577362060547, -24.315568923950195, -22.68855857849121, -21.061548233032227, -19.434539794921875, -17.80752944946289, -16.180519104003906, -14.553508758544922, -12.926499366760254, -11.299489974975586, -9.672479629516602, -8.045469284057617, -6.418459892272949, -4.791450500488281, -3.164440155029297, -1.5374302864074707, 0.08957958221435547, 1.7165894508361816, 3.343599319458008, 4.970609664916992, 6.59761905670166, 8.224628448486328, 9.851638793945312, 11.478649139404297, 13.105658531188965, 14.732667922973633, 16.359678268432617, 17.9866886138916, 19.613697052001953, 21.240707397460938, 22.867717742919922, 24.494728088378906, 26.12173843383789, 27.748746871948242, 29.375757217407227, 31.00276756286621, 32.62977600097656, 34.25678634643555, 35.88379669189453, 37.510807037353516, 39.1378173828125, 40.764827728271484, 42.39183807373047, 44.01884460449219, 45.64585494995117, 47.272865295410156, 48.89987564086914]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 11.0, 16.0, 19.0, 16.0, 21.0, 16.0, 19.0, 28.0, 29.0, 36.0, 40.0, 37.0, 34.0, 28.0, 39.0, 45.0, 45.0, 34.0, 43.0, 25.0, 38.0, 46.0, 19.0, 26.0, 17.0, 32.0, 27.0, 27.0, 24.0, 15.0, 12.0, 18.0, 12.0, 13.0, 10.0, 9.0, 7.0, 7.0, 8.0, 4.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.51953125, -6.31005859375, -6.1005859375, -5.89111328125, -5.681640625, -5.47216796875, -5.2626953125, -5.05322265625, -4.84375, -4.63427734375, -4.4248046875, -4.21533203125, -4.005859375, -3.79638671875, -3.5869140625, -3.37744140625, -3.16796875, -2.95849609375, -2.7490234375, -2.53955078125, -2.330078125, -2.12060546875, -1.9111328125, -1.70166015625, -1.4921875, -1.28271484375, -1.0732421875, -0.86376953125, -0.654296875, -0.44482421875, -0.2353515625, -0.02587890625, 0.18359375, 0.39306640625, 0.6025390625, 0.81201171875, 1.021484375, 1.23095703125, 1.4404296875, 1.64990234375, 1.859375, 2.06884765625, 2.2783203125, 2.48779296875, 2.697265625, 2.90673828125, 3.1162109375, 3.32568359375, 3.53515625, 3.74462890625, 3.9541015625, 4.16357421875, 4.373046875, 4.58251953125, 4.7919921875, 5.00146484375, 5.2109375, 5.42041015625, 5.6298828125, 5.83935546875, 6.048828125, 6.25830078125, 6.4677734375, 6.67724609375, 6.88671875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 14.0, 11.0, 17.0, 24.0, 36.0, 43.0, 85.0, 92.0, 142.0, 219.0, 308.0, 517.0, 845.0, 1417.0, 2508.0, 4948.0, 11349.0, 35090.0, 229704.0, 2059667.0, 1638267.0, 157631.0, 29423.0, 10803.0, 4804.0, 2500.0, 1404.0, 821.0, 502.0, 349.0, 226.0, 145.0, 90.0, 75.0, 60.0, 42.0, 22.0, 27.0, 14.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-17.828125, -17.3319091796875, -16.835693359375, -16.3394775390625, -15.84326171875, -15.3470458984375, -14.850830078125, -14.3546142578125, -13.8583984375, -13.3621826171875, -12.865966796875, -12.3697509765625, -11.87353515625, -11.3773193359375, -10.881103515625, -10.3848876953125, -9.888671875, -9.3924560546875, -8.896240234375, -8.4000244140625, -7.90380859375, -7.4075927734375, -6.911376953125, -6.4151611328125, -5.9189453125, -5.4227294921875, -4.926513671875, -4.4302978515625, -3.93408203125, -3.4378662109375, -2.941650390625, -2.4454345703125, -1.94921875, -1.4530029296875, -0.956787109375, -0.4605712890625, 0.03564453125, 0.5318603515625, 1.028076171875, 1.5242919921875, 2.0205078125, 2.5167236328125, 3.012939453125, 3.5091552734375, 4.00537109375, 4.5015869140625, 4.997802734375, 5.4940185546875, 5.990234375, 6.4864501953125, 6.982666015625, 7.4788818359375, 7.97509765625, 8.4713134765625, 8.967529296875, 9.4637451171875, 9.9599609375, 10.4561767578125, 10.952392578125, 11.4486083984375, 11.94482421875, 12.4410400390625, 12.937255859375, 13.4334716796875, 13.9296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 4.0, 7.0, 7.0, 15.0, 19.0, 15.0, 30.0, 30.0, 46.0, 53.0, 68.0, 96.0, 120.0, 176.0, 279.0, 381.0, 585.0, 607.0, 480.0, 303.0, 217.0, 138.0, 93.0, 59.0, 60.0, 34.0, 29.0, 23.0, 18.0, 7.0, 9.0, 16.0, 8.0, 3.0, 8.0, 2.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.0546875, -13.654052734375, -13.25341796875, -12.852783203125, -12.4521484375, -12.051513671875, -11.65087890625, -11.250244140625, -10.849609375, -10.448974609375, -10.04833984375, -9.647705078125, -9.2470703125, -8.846435546875, -8.44580078125, -8.045166015625, -7.64453125, -7.243896484375, -6.84326171875, -6.442626953125, -6.0419921875, -5.641357421875, -5.24072265625, -4.840087890625, -4.439453125, -4.038818359375, -3.63818359375, -3.237548828125, -2.8369140625, -2.436279296875, -2.03564453125, -1.635009765625, -1.234375, -0.833740234375, -0.43310546875, -0.032470703125, 0.3681640625, 0.768798828125, 1.16943359375, 1.570068359375, 1.970703125, 2.371337890625, 2.77197265625, 3.172607421875, 3.5732421875, 3.973876953125, 4.37451171875, 4.775146484375, 5.17578125, 5.576416015625, 5.97705078125, 6.377685546875, 6.7783203125, 7.178955078125, 7.57958984375, 7.980224609375, 8.380859375, 8.781494140625, 9.18212890625, 9.582763671875, 9.9833984375, 10.384033203125, 10.78466796875, 11.185302734375, 11.5859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 8.0, 13.0, 18.0, 20.0, 29.0, 39.0, 66.0, 70.0, 124.0, 216.0, 494.0, 2219.0, 22078.0, 1008329.0, 3113031.0, 42587.0, 3484.0, 660.0, 266.0, 133.0, 92.0, 60.0, 60.0, 36.0, 31.0, 28.0, 12.0, 10.0, 10.0, 5.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.625, -37.14599609375, -35.6669921875, -34.18798828125, -32.708984375, -31.22998046875, -29.7509765625, -28.27197265625, -26.79296875, -25.31396484375, -23.8349609375, -22.35595703125, -20.876953125, -19.39794921875, -17.9189453125, -16.43994140625, -14.9609375, -13.48193359375, -12.0029296875, -10.52392578125, -9.044921875, -7.56591796875, -6.0869140625, -4.60791015625, -3.12890625, -1.64990234375, -0.1708984375, 1.30810546875, 2.787109375, 4.26611328125, 5.7451171875, 7.22412109375, 8.703125, 10.18212890625, 11.6611328125, 13.14013671875, 14.619140625, 16.09814453125, 17.5771484375, 19.05615234375, 20.53515625, 22.01416015625, 23.4931640625, 24.97216796875, 26.451171875, 27.93017578125, 29.4091796875, 30.88818359375, 32.3671875, 33.84619140625, 35.3251953125, 36.80419921875, 38.283203125, 39.76220703125, 41.2412109375, 42.72021484375, 44.19921875, 45.67822265625, 47.1572265625, 48.63623046875, 50.115234375, 51.59423828125, 53.0732421875, 54.55224609375, 56.03125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 51.0, 196.0, 364.0, 255.0, 97.0, 23.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.5663146972656, -262.0649108886719, -256.56353759765625, -251.0621337890625, -245.56072998046875, -240.05934143066406, -234.55795288085938, -229.05654907226562, -223.55516052246094, -218.05377197265625, -212.5523681640625, -207.0509796142578, -201.54957580566406, -196.04818725585938, -190.54678344726562, -185.04539489746094, -179.54400634765625, -174.04261779785156, -168.5412139892578, -163.03982543945312, -157.53842163085938, -152.0370330810547, -146.53564453125, -141.03424072265625, -135.5328369140625, -130.0314483642578, -124.53004455566406, -119.02865600585938, -113.52725982666016, -108.02586364746094, -102.52446746826172, -97.0230712890625, -91.52169036865234, -86.02029418945312, -80.5188980102539, -75.01750183105469, -69.51611328125, -64.01471710205078, -58.51332092285156, -53.01192855834961, -47.51053237915039, -42.00913619995117, -36.50774383544922, -31.00634765625, -25.504953384399414, -20.003559112548828, -14.50216293334961, -9.000770568847656, -3.4993743896484375, 2.0020203590393066, 7.503415107727051, 13.004810333251953, 18.50620460510254, 24.007598876953125, 29.508995056152344, 35.0103874206543, 40.511783599853516, 46.013179779052734, 51.51457214355469, 57.015968322753906, 62.517364501953125, 68.01875305175781, 73.52015686035156, 79.02154541015625, 84.52294158935547]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 14.0, 10.0, 30.0, 27.0, 25.0, 25.0, 28.0, 22.0, 25.0, 48.0, 46.0, 43.0, 44.0, 46.0, 55.0, 55.0, 48.0, 42.0, 38.0, 38.0, 32.0, 37.0, 35.0, 24.0, 29.0, 25.0, 13.0, 12.0, 15.0, 9.0, 7.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.775054931640625, -46.30236053466797, -44.82966613769531, -43.356971740722656, -41.88427734375, -40.411582946777344, -38.93888854980469, -37.46619415283203, -35.993499755859375, -34.52080535888672, -33.04811096191406, -31.575416564941406, -30.10272216796875, -28.630027770996094, -27.157331466674805, -25.68463706970215, -24.21194076538086, -22.739246368408203, -21.266551971435547, -19.79385757446289, -18.321163177490234, -16.848468780517578, -15.375772476196289, -13.903078079223633, -12.430383682250977, -10.95768928527832, -9.484994888305664, -8.012299537658691, -6.539605140686035, -5.066910743713379, -3.5942153930664062, -2.12152099609375, -0.6488304138183594, 0.823864221572876, 2.2965588569641113, 3.769253730773926, 5.241948127746582, 6.714642524719238, 8.187337875366211, 9.660032272338867, 11.132726669311523, 12.60542106628418, 14.078115463256836, 15.550810813903809, 17.02350616455078, 18.496200561523438, 19.968894958496094, 21.44158935546875, 22.914283752441406, 24.386978149414062, 25.85967254638672, 27.332366943359375, 28.80506134033203, 30.277755737304688, 31.750452041625977, 33.22314453125, 34.695838928222656, 36.16853332519531, 37.64122772216797, 39.113922119140625, 40.58661651611328, 42.05931091308594, 43.532005310058594, 45.00469970703125, 46.47739791870117]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 7.0, 8.0, 2.0, 13.0, 7.0, 15.0, 24.0, 13.0, 15.0, 21.0, 28.0, 25.0, 33.0, 36.0, 47.0, 33.0, 37.0, 29.0, 35.0, 41.0, 47.0, 40.0, 39.0, 43.0, 39.0, 30.0, 29.0, 23.0, 26.0, 31.0, 16.0, 26.0, 29.0, 17.0, 12.0, 17.0, 15.0, 5.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.4140625, -6.21038818359375, -6.0067138671875, -5.80303955078125, -5.599365234375, -5.39569091796875, -5.1920166015625, -4.98834228515625, -4.78466796875, -4.58099365234375, -4.3773193359375, -4.17364501953125, -3.969970703125, -3.76629638671875, -3.5626220703125, -3.35894775390625, -3.1552734375, -2.95159912109375, -2.7479248046875, -2.54425048828125, -2.340576171875, -2.13690185546875, -1.9332275390625, -1.72955322265625, -1.52587890625, -1.32220458984375, -1.1185302734375, -0.91485595703125, -0.711181640625, -0.50750732421875, -0.3038330078125, -0.10015869140625, 0.103515625, 0.30718994140625, 0.5108642578125, 0.71453857421875, 0.918212890625, 1.12188720703125, 1.3255615234375, 1.52923583984375, 1.73291015625, 1.93658447265625, 2.1402587890625, 2.34393310546875, 2.547607421875, 2.75128173828125, 2.9549560546875, 3.15863037109375, 3.3623046875, 3.56597900390625, 3.7696533203125, 3.97332763671875, 4.177001953125, 4.38067626953125, 4.5843505859375, 4.78802490234375, 4.99169921875, 5.19537353515625, 5.3990478515625, 5.60272216796875, 5.806396484375, 6.01007080078125, 6.2137451171875, 6.41741943359375, 6.62109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 6.0, 16.0, 32.0, 32.0, 43.0, 102.0, 142.0, 208.0, 317.0, 470.0, 696.0, 1137.0, 1678.0, 2644.0, 4201.0, 6693.0, 10897.0, 17992.0, 30775.0, 53420.0, 97926.0, 179495.0, 248217.0, 171706.0, 93223.0, 51447.0, 29146.0, 17448.0, 10643.0, 6458.0, 4060.0, 2537.0, 1609.0, 1084.0, 717.0, 448.0, 316.0, 200.0, 130.0, 81.0, 53.0, 30.0, 31.0, 16.0, 9.0, 10.0, 9.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.047454833984375, -1.01190185546875, -0.976348876953125, -0.9407958984375, -0.905242919921875, -0.86968994140625, -0.834136962890625, -0.798583984375, -0.763031005859375, -0.72747802734375, -0.691925048828125, -0.6563720703125, -0.620819091796875, -0.58526611328125, -0.549713134765625, -0.51416015625, -0.478607177734375, -0.44305419921875, -0.407501220703125, -0.3719482421875, -0.336395263671875, -0.30084228515625, -0.265289306640625, -0.229736328125, -0.194183349609375, -0.15863037109375, -0.123077392578125, -0.0875244140625, -0.051971435546875, -0.01641845703125, 0.019134521484375, 0.0546875, 0.090240478515625, 0.12579345703125, 0.161346435546875, 0.1968994140625, 0.232452392578125, 0.26800537109375, 0.303558349609375, 0.339111328125, 0.374664306640625, 0.41021728515625, 0.445770263671875, 0.4813232421875, 0.516876220703125, 0.55242919921875, 0.587982177734375, 0.62353515625, 0.659088134765625, 0.69464111328125, 0.730194091796875, 0.7657470703125, 0.801300048828125, 0.83685302734375, 0.872406005859375, 0.907958984375, 0.943511962890625, 0.97906494140625, 1.014617919921875, 1.0501708984375, 1.085723876953125, 1.12127685546875, 1.156829833984375, 1.1923828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 14.0, 13.0, 13.0, 16.0, 12.0, 24.0, 19.0, 19.0, 18.0, 39.0, 34.0, 36.0, 40.0, 51.0, 40.0, 37.0, 1070.0, 42.0, 42.0, 39.0, 31.0, 37.0, 32.0, 33.0, 43.0, 23.0, 22.0, 28.0, 19.0, 17.0, 15.0, 12.0, 12.0, 15.0, 10.0, 7.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.07867431640625, -3.9307861328125, -3.78289794921875, -3.635009765625, -3.48712158203125, -3.3392333984375, -3.19134521484375, -3.04345703125, -2.89556884765625, -2.7476806640625, -2.59979248046875, -2.451904296875, -2.30401611328125, -2.1561279296875, -2.00823974609375, -1.8603515625, -1.71246337890625, -1.5645751953125, -1.41668701171875, -1.268798828125, -1.12091064453125, -0.9730224609375, -0.82513427734375, -0.67724609375, -0.52935791015625, -0.3814697265625, -0.23358154296875, -0.085693359375, 0.06219482421875, 0.2100830078125, 0.35797119140625, 0.505859375, 0.65374755859375, 0.8016357421875, 0.94952392578125, 1.097412109375, 1.24530029296875, 1.3931884765625, 1.54107666015625, 1.68896484375, 1.83685302734375, 1.9847412109375, 2.13262939453125, 2.280517578125, 2.42840576171875, 2.5762939453125, 2.72418212890625, 2.8720703125, 3.01995849609375, 3.1678466796875, 3.31573486328125, 3.463623046875, 3.61151123046875, 3.7593994140625, 3.90728759765625, 4.05517578125, 4.20306396484375, 4.3509521484375, 4.49884033203125, 4.646728515625, 4.79461669921875, 4.9425048828125, 5.09039306640625, 5.23828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 14.0, 10.0, 27.0, 20.0, 37.0, 59.0, 103.0, 142.0, 243.0, 435.0, 750.0, 1384.0, 2513.0, 5232.0, 11046.0, 25182.0, 60419.0, 165341.0, 1118515.0, 501342.0, 120652.0, 46224.0, 19638.0, 8737.0, 4261.0, 2134.0, 1110.0, 651.0, 337.0, 222.0, 110.0, 75.0, 58.0, 39.0, 29.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3505859375, -1.314910888671875, -1.27923583984375, -1.243560791015625, -1.2078857421875, -1.172210693359375, -1.13653564453125, -1.100860595703125, -1.065185546875, -1.029510498046875, -0.99383544921875, -0.958160400390625, -0.9224853515625, -0.886810302734375, -0.85113525390625, -0.815460205078125, -0.77978515625, -0.744110107421875, -0.70843505859375, -0.672760009765625, -0.6370849609375, -0.601409912109375, -0.56573486328125, -0.530059814453125, -0.494384765625, -0.458709716796875, -0.42303466796875, -0.387359619140625, -0.3516845703125, -0.316009521484375, -0.28033447265625, -0.244659423828125, -0.208984375, -0.173309326171875, -0.13763427734375, -0.101959228515625, -0.0662841796875, -0.030609130859375, 0.00506591796875, 0.040740966796875, 0.076416015625, 0.112091064453125, 0.14776611328125, 0.183441162109375, 0.2191162109375, 0.254791259765625, 0.29046630859375, 0.326141357421875, 0.36181640625, 0.397491455078125, 0.43316650390625, 0.468841552734375, 0.5045166015625, 0.540191650390625, 0.57586669921875, 0.611541748046875, 0.647216796875, 0.682891845703125, 0.71856689453125, 0.754241943359375, 0.7899169921875, 0.825592041015625, 0.86126708984375, 0.896942138671875, 0.9326171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 12.0, 4.0, 7.0, 11.0, 10.0, 10.0, 15.0, 15.0, 18.0, 25.0, 23.0, 40.0, 42.0, 52.0, 83.0, 109.0, 97.0, 84.0, 59.0, 39.0, 38.0, 26.0, 26.0, 21.0, 17.0, 22.0, 9.0, 12.0, 9.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11834716796875, -0.11428356170654297, -0.11021995544433594, -0.1061563491821289, -0.10209274291992188, -0.09802913665771484, -0.09396553039550781, -0.08990192413330078, -0.08583831787109375, -0.08177471160888672, -0.07771110534667969, -0.07364749908447266, -0.06958389282226562, -0.0655202865600586, -0.06145668029785156, -0.05739307403564453, -0.0533294677734375, -0.04926586151123047, -0.04520225524902344, -0.041138648986816406, -0.037075042724609375, -0.033011436462402344, -0.028947830200195312, -0.02488422393798828, -0.02082061767578125, -0.01675701141357422, -0.012693405151367188, -0.008629798889160156, -0.004566192626953125, -0.0005025863647460938, 0.0035610198974609375, 0.007624626159667969, 0.011688232421875, 0.01575183868408203, 0.019815444946289062, 0.023879051208496094, 0.027942657470703125, 0.032006263732910156, 0.03606986999511719, 0.04013347625732422, 0.04419708251953125, 0.04826068878173828, 0.05232429504394531, 0.056387901306152344, 0.060451507568359375, 0.0645151138305664, 0.06857872009277344, 0.07264232635498047, 0.0767059326171875, 0.08076953887939453, 0.08483314514160156, 0.0888967514038086, 0.09296035766601562, 0.09702396392822266, 0.10108757019042969, 0.10515117645263672, 0.10921478271484375, 0.11327838897705078, 0.11734199523925781, 0.12140560150146484, 0.12546920776367188, 0.1295328140258789, 0.13359642028808594, 0.13766002655029297, 0.1417236328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 10.0, 9.0, 23.0, 29.0, 24.0, 33.0, 38.0, 53.0, 71.0, 87.0, 117.0, 302.0, 1031.0, 10777.0, 760002.0, 266981.0, 7237.0, 876.0, 261.0, 128.0, 88.0, 74.0, 50.0, 41.0, 29.0, 20.0, 25.0, 11.0, 11.0, 10.0, 6.0, 12.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.509765625, -2.437896728515625, -2.36602783203125, -2.294158935546875, -2.2222900390625, -2.150421142578125, -2.07855224609375, -2.006683349609375, -1.934814453125, -1.862945556640625, -1.79107666015625, -1.719207763671875, -1.6473388671875, -1.575469970703125, -1.50360107421875, -1.431732177734375, -1.35986328125, -1.287994384765625, -1.21612548828125, -1.144256591796875, -1.0723876953125, -1.000518798828125, -0.92864990234375, -0.856781005859375, -0.784912109375, -0.713043212890625, -0.64117431640625, -0.569305419921875, -0.4974365234375, -0.425567626953125, -0.35369873046875, -0.281829833984375, -0.2099609375, -0.138092041015625, -0.06622314453125, 0.005645751953125, 0.0775146484375, 0.149383544921875, 0.22125244140625, 0.293121337890625, 0.364990234375, 0.436859130859375, 0.50872802734375, 0.580596923828125, 0.6524658203125, 0.724334716796875, 0.79620361328125, 0.868072509765625, 0.93994140625, 1.011810302734375, 1.08367919921875, 1.155548095703125, 1.2274169921875, 1.299285888671875, 1.37115478515625, 1.443023681640625, 1.514892578125, 1.586761474609375, 1.65863037109375, 1.730499267578125, 1.8023681640625, 1.874237060546875, 1.94610595703125, 2.017974853515625, 2.08984375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 18.0, 68.0, 190.0, 395.0, 238.0, 76.0, 17.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3928728103637695, -1.3641382455825806, -1.3354036808013916, -1.306668996810913, -1.2779344320297241, -1.2491998672485352, -1.2204653024673462, -1.1917306184768677, -1.1629960536956787, -1.1342614889144897, -1.1055269241333008, -1.0767922401428223, -1.0480576753616333, -1.0193231105804443, -0.9905884861946106, -0.9618539214134216, -0.9331192970275879, -0.9043847322463989, -0.8756501078605652, -0.8469155430793762, -0.8181809186935425, -0.7894463539123535, -0.7607117295265198, -0.7319771647453308, -0.7032425999641418, -0.6745080351829529, -0.6457734107971191, -0.6170388460159302, -0.5883042216300964, -0.5595696568489075, -0.5308350324630737, -0.5021004676818848, -0.473365843296051, -0.4446312487125397, -0.4158966541290283, -0.38716205954551697, -0.3584274649620056, -0.32969290018081665, -0.3009582757949829, -0.27222371101379395, -0.2434891015291214, -0.21475450694561005, -0.1860199123620987, -0.15728533267974854, -0.12855073809623718, -0.09981614351272583, -0.07108154892921448, -0.042346954345703125, -0.013612359762191772, 0.01512223295867443, 0.043856825679540634, 0.07259141653776169, 0.10132601112127304, 0.1300605982542038, 0.15879519283771515, 0.1875297874212265, 0.21626438200473785, 0.2449989765882492, 0.27373355627059937, 0.3024681508541107, 0.33120274543762207, 0.3599373400211334, 0.3886719346046448, 0.41740652918815613, 0.4461411237716675]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 8.0, 15.0, 8.0, 12.0, 19.0, 20.0, 27.0, 31.0, 35.0, 21.0, 25.0, 18.0, 44.0, 39.0, 41.0, 40.0, 37.0, 42.0, 25.0, 48.0, 41.0, 31.0, 38.0, 29.0, 33.0, 33.0, 26.0, 20.0, 23.0, 27.0, 14.0, 25.0, 14.0, 11.0, 9.0, 6.0, 6.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.17373013496398926, -0.16876357793807983, -0.16379700601100922, -0.1588304489850998, -0.15386389195919037, -0.14889732003211975, -0.14393076300621033, -0.1389642059803009, -0.13399764895439148, -0.12903109192848206, -0.12406452745199203, -0.11909796297550201, -0.11413140594959259, -0.10916484147310257, -0.10419827699661255, -0.09923171997070312, -0.09426514804363251, -0.08929858356714249, -0.08433202654123306, -0.07936546206474304, -0.07439890503883362, -0.0694323405623436, -0.06446577608585358, -0.059499215334653854, -0.05453265458345413, -0.04956609383225441, -0.04459953308105469, -0.03963296860456467, -0.034666407853364944, -0.029699847102165222, -0.02473328448832035, -0.01976672187447548, -0.014800161123275757, -0.00983359944075346, -0.004867037758231163, 9.952392429113388e-05, 0.005066085606813431, 0.010032646358013153, 0.014999208971858025, 0.019965771585702896, 0.02493233233690262, 0.02989889308810234, 0.03486545383930206, 0.039832018315792084, 0.044798579066991806, 0.04976513981819153, 0.05473170429468155, 0.05969826504588127, 0.064664825797081, 0.06963139027357101, 0.07459794729948044, 0.07956451177597046, 0.08453106880187988, 0.0894976332783699, 0.09446419775485992, 0.09943075478076935, 0.10439731925725937, 0.10936388373374939, 0.11433044075965881, 0.11929700523614883, 0.12426356971263885, 0.12923012673854828, 0.1341966837644577, 0.13916325569152832, 0.14412981271743774]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 8.0, 11.0, 9.0, 9.0, 8.0, 13.0, 15.0, 22.0, 24.0, 21.0, 18.0, 23.0, 31.0, 38.0, 31.0, 42.0, 37.0, 41.0, 39.0, 44.0, 41.0, 26.0, 39.0, 39.0, 36.0, 35.0, 33.0, 20.0, 24.0, 30.0, 25.0, 22.0, 19.0, 20.0, 14.0, 17.0, 10.0, 11.0, 7.0, 4.0, 7.0, 6.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0], "bins": [-6.3515625, -6.1546630859375, -5.957763671875, -5.7608642578125, -5.56396484375, -5.3670654296875, -5.170166015625, -4.9732666015625, -4.7763671875, -4.5794677734375, -4.382568359375, -4.1856689453125, -3.98876953125, -3.7918701171875, -3.594970703125, -3.3980712890625, -3.201171875, -3.0042724609375, -2.807373046875, -2.6104736328125, -2.41357421875, -2.2166748046875, -2.019775390625, -1.8228759765625, -1.6259765625, -1.4290771484375, -1.232177734375, -1.0352783203125, -0.83837890625, -0.6414794921875, -0.444580078125, -0.2476806640625, -0.05078125, 0.1461181640625, 0.343017578125, 0.5399169921875, 0.73681640625, 0.9337158203125, 1.130615234375, 1.3275146484375, 1.5244140625, 1.7213134765625, 1.918212890625, 2.1151123046875, 2.31201171875, 2.5089111328125, 2.705810546875, 2.9027099609375, 3.099609375, 3.2965087890625, 3.493408203125, 3.6903076171875, 3.88720703125, 4.0841064453125, 4.281005859375, 4.4779052734375, 4.6748046875, 4.8717041015625, 5.068603515625, 5.2655029296875, 5.46240234375, 5.6593017578125, 5.856201171875, 6.0531005859375, 6.25]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 5.0, 12.0, 21.0, 22.0, 25.0, 35.0, 50.0, 69.0, 118.0, 168.0, 249.0, 356.0, 480.0, 711.0, 1127.0, 1721.0, 2807.0, 4602.0, 7906.0, 14189.0, 27260.0, 55221.0, 120055.0, 319446.0, 275359.0, 108112.0, 50789.0, 25301.0, 13048.0, 7390.0, 4267.0, 2657.0, 1704.0, 1001.0, 702.0, 477.0, 314.0, 219.0, 163.0, 109.0, 86.0, 58.0, 38.0, 26.0, 22.0, 13.0, 8.0, 9.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.34375, -8.0650634765625, -7.786376953125, -7.5076904296875, -7.22900390625, -6.9503173828125, -6.671630859375, -6.3929443359375, -6.1142578125, -5.8355712890625, -5.556884765625, -5.2781982421875, -4.99951171875, -4.7208251953125, -4.442138671875, -4.1634521484375, -3.884765625, -3.6060791015625, -3.327392578125, -3.0487060546875, -2.77001953125, -2.4913330078125, -2.212646484375, -1.9339599609375, -1.6552734375, -1.3765869140625, -1.097900390625, -0.8192138671875, -0.54052734375, -0.2618408203125, 0.016845703125, 0.2955322265625, 0.57421875, 0.8529052734375, 1.131591796875, 1.4102783203125, 1.68896484375, 1.9676513671875, 2.246337890625, 2.5250244140625, 2.8037109375, 3.0823974609375, 3.361083984375, 3.6397705078125, 3.91845703125, 4.1971435546875, 4.475830078125, 4.7545166015625, 5.033203125, 5.3118896484375, 5.590576171875, 5.8692626953125, 6.14794921875, 6.4266357421875, 6.705322265625, 6.9840087890625, 7.2626953125, 7.5413818359375, 7.820068359375, 8.0987548828125, 8.37744140625, 8.6561279296875, 8.934814453125, 9.2135009765625, 9.4921875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 10.0, 7.0, 18.0, 12.0, 11.0, 24.0, 15.0, 33.0, 31.0, 36.0, 31.0, 38.0, 43.0, 68.0, 82.0, 174.0, 1359.0, 370.0, 153.0, 99.0, 50.0, 46.0, 31.0, 33.0, 40.0, 27.0, 26.0, 22.0, 14.0, 17.0, 15.0, 13.0, 16.0, 11.0, 7.0, 5.0, 7.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.19775390625, -16.5830078125, -15.96826171875, -15.353515625, -14.73876953125, -14.1240234375, -13.50927734375, -12.89453125, -12.27978515625, -11.6650390625, -11.05029296875, -10.435546875, -9.82080078125, -9.2060546875, -8.59130859375, -7.9765625, -7.36181640625, -6.7470703125, -6.13232421875, -5.517578125, -4.90283203125, -4.2880859375, -3.67333984375, -3.05859375, -2.44384765625, -1.8291015625, -1.21435546875, -0.599609375, 0.01513671875, 0.6298828125, 1.24462890625, 1.859375, 2.47412109375, 3.0888671875, 3.70361328125, 4.318359375, 4.93310546875, 5.5478515625, 6.16259765625, 6.77734375, 7.39208984375, 8.0068359375, 8.62158203125, 9.236328125, 9.85107421875, 10.4658203125, 11.08056640625, 11.6953125, 12.31005859375, 12.9248046875, 13.53955078125, 14.154296875, 14.76904296875, 15.3837890625, 15.99853515625, 16.61328125, 17.22802734375, 17.8427734375, 18.45751953125, 19.072265625, 19.68701171875, 20.3017578125, 20.91650390625, 21.53125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 6.0, 6.0, 4.0, 8.0, 6.0, 12.0, 18.0, 23.0, 24.0, 27.0, 28.0, 49.0, 55.0, 79.0, 82.0, 126.0, 179.0, 255.0, 459.0, 1804.0, 28150.0, 3016125.0, 93433.0, 3077.0, 587.0, 282.0, 174.0, 136.0, 100.0, 80.0, 69.0, 42.0, 47.0, 26.0, 29.0, 20.0, 20.0, 7.0, 11.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.875, -60.822265625, -58.76953125, -56.716796875, -54.6640625, -52.611328125, -50.55859375, -48.505859375, -46.453125, -44.400390625, -42.34765625, -40.294921875, -38.2421875, -36.189453125, -34.13671875, -32.083984375, -30.03125, -27.978515625, -25.92578125, -23.873046875, -21.8203125, -19.767578125, -17.71484375, -15.662109375, -13.609375, -11.556640625, -9.50390625, -7.451171875, -5.3984375, -3.345703125, -1.29296875, 0.759765625, 2.8125, 4.865234375, 6.91796875, 8.970703125, 11.0234375, 13.076171875, 15.12890625, 17.181640625, 19.234375, 21.287109375, 23.33984375, 25.392578125, 27.4453125, 29.498046875, 31.55078125, 33.603515625, 35.65625, 37.708984375, 39.76171875, 41.814453125, 43.8671875, 45.919921875, 47.97265625, 50.025390625, 52.078125, 54.130859375, 56.18359375, 58.236328125, 60.2890625, 62.341796875, 64.39453125, 66.447265625, 68.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 22.0, 65.0, 157.0, 243.0, 250.0, 168.0, 70.0, 23.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.608661651611328, -17.197418212890625, -14.786172866821289, -12.37492847442627, -9.96368408203125, -7.5524396896362305, -5.141195297241211, -2.729949951171875, -0.3187065124511719, 2.0925378799438477, 4.503782272338867, 6.915026664733887, 9.326271057128906, 11.737515449523926, 14.148759841918945, 16.56000518798828, 18.971248626708984, 21.382492065429688, 23.793737411499023, 26.20498275756836, 28.616226196289062, 31.027469635009766, 33.43871307373047, 35.84996032714844, 38.26120376586914, 40.672447204589844, 43.08369445800781, 45.494937896728516, 47.90618133544922, 50.31742477416992, 52.728668212890625, 55.139915466308594, 57.55116271972656, 59.962406158447266, 62.37364959716797, 64.78489685058594, 67.19613647460938, 69.60738372802734, 72.01863098144531, 74.42987060546875, 76.84111785888672, 79.25236511230469, 81.66360473632812, 84.0748519897461, 86.48609924316406, 88.8973388671875, 91.30858612060547, 93.71983337402344, 96.13107299804688, 98.54232025146484, 100.95355987548828, 103.36480712890625, 105.77604675292969, 108.18729400634766, 110.59854125976562, 113.00978088378906, 115.42102813720703, 117.832275390625, 120.24351501464844, 122.6547622680664, 125.06600952148438, 127.47724914550781, 129.88848876953125, 132.29974365234375, 134.7109832763672]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 16.0, 9.0, 22.0, 14.0, 23.0, 27.0, 19.0, 35.0, 33.0, 37.0, 35.0, 40.0, 35.0, 53.0, 32.0, 41.0, 36.0, 30.0, 51.0, 44.0, 43.0, 43.0, 33.0, 34.0, 19.0, 29.0, 24.0, 27.0, 15.0, 11.0, 9.0, 8.0, 5.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.92280960083008, -43.230770111083984, -41.538726806640625, -39.84668731689453, -38.15464401245117, -36.46260452270508, -34.77056121826172, -33.078521728515625, -31.3864803314209, -29.694438934326172, -28.002397537231445, -26.31035614013672, -24.618316650390625, -22.926273345947266, -21.234233856201172, -19.542192459106445, -17.85015106201172, -16.158109664916992, -14.466068267822266, -12.774027824401855, -11.081986427307129, -9.389945030212402, -7.697904586791992, -6.005863189697266, -4.313821792602539, -2.6217806339263916, -0.9297394752502441, 0.7623014450073242, 2.454342842102051, 4.146384239196777, 5.8384246826171875, 7.530466079711914, 9.222511291503906, 10.914552688598633, 12.60659408569336, 14.29863452911377, 15.990675926208496, 17.682716369628906, 19.374757766723633, 21.06679916381836, 22.758840560913086, 24.450881958007812, 26.14292335510254, 27.834964752197266, 29.52700424194336, 31.21904754638672, 32.91108703613281, 34.603126525878906, 36.295169830322266, 37.98720932006836, 39.67925262451172, 41.37129211425781, 43.06333541870117, 44.755374908447266, 46.447418212890625, 48.13945770263672, 49.83149719238281, 51.523536682128906, 53.215579986572266, 54.90761947631836, 56.59966278076172, 58.29170227050781, 59.983741760253906, 61.675785064697266, 63.367828369140625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 12.0, 10.0, 11.0, 6.0, 14.0, 8.0, 17.0, 20.0, 13.0, 18.0, 34.0, 25.0, 29.0, 31.0, 36.0, 40.0, 53.0, 35.0, 46.0, 42.0, 44.0, 44.0, 31.0, 32.0, 35.0, 33.0, 32.0, 38.0, 29.0, 20.0, 22.0, 17.0, 28.0, 16.0, 14.0, 19.0, 4.0, 7.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.31640625, -6.09478759765625, -5.8731689453125, -5.65155029296875, -5.429931640625, -5.20831298828125, -4.9866943359375, -4.76507568359375, -4.54345703125, -4.32183837890625, -4.1002197265625, -3.87860107421875, -3.656982421875, -3.43536376953125, -3.2137451171875, -2.99212646484375, -2.7705078125, -2.54888916015625, -2.3272705078125, -2.10565185546875, -1.884033203125, -1.66241455078125, -1.4407958984375, -1.21917724609375, -0.99755859375, -0.77593994140625, -0.5543212890625, -0.33270263671875, -0.111083984375, 0.11053466796875, 0.3321533203125, 0.55377197265625, 0.775390625, 0.99700927734375, 1.2186279296875, 1.44024658203125, 1.661865234375, 1.88348388671875, 2.1051025390625, 2.32672119140625, 2.54833984375, 2.76995849609375, 2.9915771484375, 3.21319580078125, 3.434814453125, 3.65643310546875, 3.8780517578125, 4.09967041015625, 4.3212890625, 4.54290771484375, 4.7645263671875, 4.98614501953125, 5.207763671875, 5.42938232421875, 5.6510009765625, 5.87261962890625, 6.09423828125, 6.31585693359375, 6.5374755859375, 6.75909423828125, 6.980712890625, 7.20233154296875, 7.4239501953125, 7.64556884765625, 7.8671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 10.0, 13.0, 19.0, 23.0, 34.0, 49.0, 50.0, 76.0, 120.0, 159.0, 299.0, 443.0, 784.0, 1385.0, 2858.0, 6332.0, 18046.0, 75055.0, 554764.0, 2545647.0, 845471.0, 103810.0, 23456.0, 7880.0, 3477.0, 1574.0, 877.0, 536.0, 329.0, 219.0, 132.0, 114.0, 53.0, 35.0, 49.0, 19.0, 13.0, 18.0, 9.0, 3.0, 5.0, 3.0, 7.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-14.359375, -13.9320068359375, -13.504638671875, -13.0772705078125, -12.64990234375, -12.2225341796875, -11.795166015625, -11.3677978515625, -10.9404296875, -10.5130615234375, -10.085693359375, -9.6583251953125, -9.23095703125, -8.8035888671875, -8.376220703125, -7.9488525390625, -7.521484375, -7.0941162109375, -6.666748046875, -6.2393798828125, -5.81201171875, -5.3846435546875, -4.957275390625, -4.5299072265625, -4.1025390625, -3.6751708984375, -3.247802734375, -2.8204345703125, -2.39306640625, -1.9656982421875, -1.538330078125, -1.1109619140625, -0.68359375, -0.2562255859375, 0.171142578125, 0.5985107421875, 1.02587890625, 1.4532470703125, 1.880615234375, 2.3079833984375, 2.7353515625, 3.1627197265625, 3.590087890625, 4.0174560546875, 4.44482421875, 4.8721923828125, 5.299560546875, 5.7269287109375, 6.154296875, 6.5816650390625, 7.009033203125, 7.4364013671875, 7.86376953125, 8.2911376953125, 8.718505859375, 9.1458740234375, 9.5732421875, 10.0006103515625, 10.427978515625, 10.8553466796875, 11.28271484375, 11.7100830078125, 12.137451171875, 12.5648193359375, 12.9921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 2.0, 5.0, 4.0, 8.0, 7.0, 17.0, 22.0, 18.0, 26.0, 42.0, 46.0, 54.0, 75.0, 104.0, 156.0, 237.0, 389.0, 592.0, 646.0, 555.0, 347.0, 224.0, 142.0, 93.0, 56.0, 44.0, 34.0, 17.0, 19.0, 23.0, 13.0, 11.0, 12.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.140625, -11.740478515625, -11.34033203125, -10.940185546875, -10.5400390625, -10.139892578125, -9.73974609375, -9.339599609375, -8.939453125, -8.539306640625, -8.13916015625, -7.739013671875, -7.3388671875, -6.938720703125, -6.53857421875, -6.138427734375, -5.73828125, -5.338134765625, -4.93798828125, -4.537841796875, -4.1376953125, -3.737548828125, -3.33740234375, -2.937255859375, -2.537109375, -2.136962890625, -1.73681640625, -1.336669921875, -0.9365234375, -0.536376953125, -0.13623046875, 0.263916015625, 0.6640625, 1.064208984375, 1.46435546875, 1.864501953125, 2.2646484375, 2.664794921875, 3.06494140625, 3.465087890625, 3.865234375, 4.265380859375, 4.66552734375, 5.065673828125, 5.4658203125, 5.865966796875, 6.26611328125, 6.666259765625, 7.06640625, 7.466552734375, 7.86669921875, 8.266845703125, 8.6669921875, 9.067138671875, 9.46728515625, 9.867431640625, 10.267578125, 10.667724609375, 11.06787109375, 11.468017578125, 11.8681640625, 12.268310546875, 12.66845703125, 13.068603515625, 13.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 15.0, 12.0, 16.0, 21.0, 17.0, 33.0, 31.0, 71.0, 99.0, 142.0, 332.0, 1119.0, 12389.0, 2200428.0, 1965949.0, 11631.0, 1108.0, 304.0, 157.0, 105.0, 72.0, 60.0, 29.0, 29.0, 20.0, 21.0, 11.0, 11.0, 7.0, 9.0, 3.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.375, -61.4541015625, -59.533203125, -57.6123046875, -55.69140625, -53.7705078125, -51.849609375, -49.9287109375, -48.0078125, -46.0869140625, -44.166015625, -42.2451171875, -40.32421875, -38.4033203125, -36.482421875, -34.5615234375, -32.640625, -30.7197265625, -28.798828125, -26.8779296875, -24.95703125, -23.0361328125, -21.115234375, -19.1943359375, -17.2734375, -15.3525390625, -13.431640625, -11.5107421875, -9.58984375, -7.6689453125, -5.748046875, -3.8271484375, -1.90625, 0.0146484375, 1.935546875, 3.8564453125, 5.77734375, 7.6982421875, 9.619140625, 11.5400390625, 13.4609375, 15.3818359375, 17.302734375, 19.2236328125, 21.14453125, 23.0654296875, 24.986328125, 26.9072265625, 28.828125, 30.7490234375, 32.669921875, 34.5908203125, 36.51171875, 38.4326171875, 40.353515625, 42.2744140625, 44.1953125, 46.1162109375, 48.037109375, 49.9580078125, 51.87890625, 53.7998046875, 55.720703125, 57.6416015625, 59.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 17.0, 47.0, 71.0, 90.0, 132.0, 146.0, 157.0, 140.0, 91.0, 46.0, 20.0, 16.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.80999755859375, -102.61931610107422, -100.42863464355469, -98.23796081542969, -96.04727935791016, -93.85659790039062, -91.6659164428711, -89.47523498535156, -87.28456115722656, -85.09387969970703, -82.9031982421875, -80.7125244140625, -78.52184295654297, -76.33116149902344, -74.1404800415039, -71.94979858398438, -69.75911712646484, -67.56843566894531, -65.37775421142578, -63.187076568603516, -60.99639892578125, -58.80571746826172, -56.61503601074219, -54.424354553222656, -52.23367691040039, -50.04299545288086, -47.852317810058594, -45.66163635253906, -43.47095489501953, -41.280277252197266, -39.089595794677734, -36.89891815185547, -34.708229064941406, -32.517547607421875, -30.32686996459961, -28.136188507080078, -25.94550895690918, -23.75482940673828, -21.56414794921875, -19.37346839904785, -17.182788848876953, -14.992109298706055, -12.80142879486084, -10.610748291015625, -8.420068740844727, -6.229389190673828, -4.038708686828613, -1.8480281829833984, 0.3426513671875, 2.5333313941955566, 4.724011421203613, 6.91469144821167, 9.105371475219727, 11.296051025390625, 13.48673152923584, 15.677412033081055, 17.868091583251953, 20.05877113342285, 22.24945068359375, 24.44013214111328, 26.63081169128418, 28.821491241455078, 31.01217269897461, 33.202850341796875, 35.393531799316406]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 9.0, 7.0, 7.0, 8.0, 5.0, 13.0, 10.0, 20.0, 26.0, 19.0, 25.0, 25.0, 24.0, 27.0, 27.0, 30.0, 29.0, 33.0, 33.0, 34.0, 45.0, 45.0, 40.0, 42.0, 46.0, 28.0, 29.0, 24.0, 43.0, 24.0, 28.0, 27.0, 23.0, 17.0, 19.0, 20.0, 19.0, 17.0, 11.0, 6.0, 7.0, 8.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-35.264747619628906, -34.132568359375, -33.00038528442383, -31.86820411682129, -30.73602294921875, -29.60384178161621, -28.471660614013672, -27.339479446411133, -26.207298278808594, -25.075117111206055, -23.942935943603516, -22.810754776000977, -21.678573608398438, -20.5463924407959, -19.41421127319336, -18.28203010559082, -17.14984893798828, -16.017667770385742, -14.885486602783203, -13.753305435180664, -12.621124267578125, -11.488943099975586, -10.356761932373047, -9.224580764770508, -8.092399597167969, -6.96021842956543, -5.828037261962891, -4.695856094360352, -3.5636749267578125, -2.4314937591552734, -1.2993125915527344, -0.1671314239501953, 0.9650535583496094, 2.0972347259521484, 3.2294158935546875, 4.361597061157227, 5.493778228759766, 6.625959396362305, 7.758140563964844, 8.890321731567383, 10.022502899169922, 11.154684066772461, 12.286865234375, 13.419046401977539, 14.551227569580078, 15.683408737182617, 16.815589904785156, 17.947771072387695, 19.079952239990234, 20.212133407592773, 21.344314575195312, 22.47649574279785, 23.60867691040039, 24.74085807800293, 25.87303924560547, 27.005220413208008, 28.137401580810547, 29.269582748413086, 30.401763916015625, 31.533945083618164, 32.6661262512207, 33.798309326171875, 34.93048858642578, 36.06266784667969, 37.19485092163086]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 13.0, 5.0, 11.0, 13.0, 18.0, 18.0, 21.0, 30.0, 30.0, 32.0, 32.0, 29.0, 38.0, 68.0, 34.0, 47.0, 49.0, 44.0, 54.0, 35.0, 24.0, 30.0, 37.0, 17.0, 27.0, 35.0, 22.0, 24.0, 21.0, 17.0, 18.0, 21.0, 11.0, 11.0, 10.0, 8.0, 8.0, 4.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.5587158203125, -6.343994140625, -6.1292724609375, -5.91455078125, -5.6998291015625, -5.485107421875, -5.2703857421875, -5.0556640625, -4.8409423828125, -4.626220703125, -4.4114990234375, -4.19677734375, -3.9820556640625, -3.767333984375, -3.5526123046875, -3.337890625, -3.1231689453125, -2.908447265625, -2.6937255859375, -2.47900390625, -2.2642822265625, -2.049560546875, -1.8348388671875, -1.6201171875, -1.4053955078125, -1.190673828125, -0.9759521484375, -0.76123046875, -0.5465087890625, -0.331787109375, -0.1170654296875, 0.09765625, 0.3123779296875, 0.527099609375, 0.7418212890625, 0.95654296875, 1.1712646484375, 1.385986328125, 1.6007080078125, 1.8154296875, 2.0301513671875, 2.244873046875, 2.4595947265625, 2.67431640625, 2.8890380859375, 3.103759765625, 3.3184814453125, 3.533203125, 3.7479248046875, 3.962646484375, 4.1773681640625, 4.39208984375, 4.6068115234375, 4.821533203125, 5.0362548828125, 5.2509765625, 5.4656982421875, 5.680419921875, 5.8951416015625, 6.10986328125, 6.3245849609375, 6.539306640625, 6.7540283203125, 6.96875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 2.0, 10.0, 16.0, 22.0, 33.0, 43.0, 69.0, 129.0, 185.0, 332.0, 466.0, 750.0, 1303.0, 1991.0, 3126.0, 5143.0, 8570.0, 13885.0, 23595.0, 40429.0, 71441.0, 126487.0, 212521.0, 221769.0, 134398.0, 75844.0, 42891.0, 24774.0, 14689.0, 8854.0, 5519.0, 3479.0, 2154.0, 1349.0, 834.0, 583.0, 319.0, 208.0, 115.0, 92.0, 48.0, 36.0, 18.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0], "bins": [-1.375, -1.3388671875, -1.302734375, -1.2666015625, -1.23046875, -1.1943359375, -1.158203125, -1.1220703125, -1.0859375, -1.0498046875, -1.013671875, -0.9775390625, -0.94140625, -0.9052734375, -0.869140625, -0.8330078125, -0.796875, -0.7607421875, -0.724609375, -0.6884765625, -0.65234375, -0.6162109375, -0.580078125, -0.5439453125, -0.5078125, -0.4716796875, -0.435546875, -0.3994140625, -0.36328125, -0.3271484375, -0.291015625, -0.2548828125, -0.21875, -0.1826171875, -0.146484375, -0.1103515625, -0.07421875, -0.0380859375, -0.001953125, 0.0341796875, 0.0703125, 0.1064453125, 0.142578125, 0.1787109375, 0.21484375, 0.2509765625, 0.287109375, 0.3232421875, 0.359375, 0.3955078125, 0.431640625, 0.4677734375, 0.50390625, 0.5400390625, 0.576171875, 0.6123046875, 0.6484375, 0.6845703125, 0.720703125, 0.7568359375, 0.79296875, 0.8291015625, 0.865234375, 0.9013671875, 0.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 13.0, 2.0, 5.0, 3.0, 12.0, 9.0, 12.0, 14.0, 22.0, 16.0, 22.0, 30.0, 29.0, 27.0, 34.0, 29.0, 32.0, 34.0, 36.0, 37.0, 31.0, 1057.0, 43.0, 42.0, 39.0, 39.0, 38.0, 29.0, 35.0, 27.0, 28.0, 21.0, 31.0, 17.0, 25.0, 16.0, 21.0, 11.0, 11.0, 8.0, 7.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-4.90625, -4.76055908203125, -4.6148681640625, -4.46917724609375, -4.323486328125, -4.17779541015625, -4.0321044921875, -3.88641357421875, -3.74072265625, -3.59503173828125, -3.4493408203125, -3.30364990234375, -3.157958984375, -3.01226806640625, -2.8665771484375, -2.72088623046875, -2.5751953125, -2.42950439453125, -2.2838134765625, -2.13812255859375, -1.992431640625, -1.84674072265625, -1.7010498046875, -1.55535888671875, -1.40966796875, -1.26397705078125, -1.1182861328125, -0.97259521484375, -0.826904296875, -0.68121337890625, -0.5355224609375, -0.38983154296875, -0.244140625, -0.09844970703125, 0.0472412109375, 0.19293212890625, 0.338623046875, 0.48431396484375, 0.6300048828125, 0.77569580078125, 0.92138671875, 1.06707763671875, 1.2127685546875, 1.35845947265625, 1.504150390625, 1.64984130859375, 1.7955322265625, 1.94122314453125, 2.0869140625, 2.23260498046875, 2.3782958984375, 2.52398681640625, 2.669677734375, 2.81536865234375, 2.9610595703125, 3.10675048828125, 3.25244140625, 3.39813232421875, 3.5438232421875, 3.68951416015625, 3.835205078125, 3.98089599609375, 4.1265869140625, 4.27227783203125, 4.41796875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 17.0, 23.0, 27.0, 54.0, 110.0, 124.0, 229.0, 381.0, 601.0, 1074.0, 1968.0, 3380.0, 6718.0, 13093.0, 27732.0, 60361.0, 147133.0, 659656.0, 889223.0, 161252.0, 65028.0, 29345.0, 14157.0, 7131.0, 3610.0, 1987.0, 1100.0, 627.0, 393.0, 218.0, 135.0, 95.0, 40.0, 28.0, 17.0, 9.0, 9.0, 7.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.988433837890625, -0.95440673828125, -0.920379638671875, -0.8863525390625, -0.852325439453125, -0.81829833984375, -0.784271240234375, -0.750244140625, -0.716217041015625, -0.68218994140625, -0.648162841796875, -0.6141357421875, -0.580108642578125, -0.54608154296875, -0.512054443359375, -0.47802734375, -0.444000244140625, -0.40997314453125, -0.375946044921875, -0.3419189453125, -0.307891845703125, -0.27386474609375, -0.239837646484375, -0.205810546875, -0.171783447265625, -0.13775634765625, -0.103729248046875, -0.0697021484375, -0.035675048828125, -0.00164794921875, 0.032379150390625, 0.06640625, 0.100433349609375, 0.13446044921875, 0.168487548828125, 0.2025146484375, 0.236541748046875, 0.27056884765625, 0.304595947265625, 0.338623046875, 0.372650146484375, 0.40667724609375, 0.440704345703125, 0.4747314453125, 0.508758544921875, 0.54278564453125, 0.576812744140625, 0.61083984375, 0.644866943359375, 0.67889404296875, 0.712921142578125, 0.7469482421875, 0.780975341796875, 0.81500244140625, 0.849029541015625, 0.883056640625, 0.917083740234375, 0.95111083984375, 0.985137939453125, 1.0191650390625, 1.053192138671875, 1.08721923828125, 1.121246337890625, 1.1552734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 12.0, 9.0, 21.0, 24.0, 32.0, 50.0, 59.0, 84.0, 155.0, 170.0, 117.0, 68.0, 62.0, 38.0, 24.0, 19.0, 13.0, 15.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.400634765625, -0.39155006408691406, -0.3824653625488281, -0.3733806610107422, -0.36429595947265625, -0.3552112579345703, -0.3461265563964844, -0.33704185485839844, -0.3279571533203125, -0.31887245178222656, -0.3097877502441406, -0.3007030487060547, -0.29161834716796875, -0.2825336456298828, -0.2734489440917969, -0.26436424255371094, -0.255279541015625, -0.24619483947753906, -0.23711013793945312, -0.2280254364013672, -0.21894073486328125, -0.2098560333251953, -0.20077133178710938, -0.19168663024902344, -0.1826019287109375, -0.17351722717285156, -0.16443252563476562, -0.1553478240966797, -0.14626312255859375, -0.1371784210205078, -0.12809371948242188, -0.11900901794433594, -0.10992431640625, -0.10083961486816406, -0.09175491333007812, -0.08267021179199219, -0.07358551025390625, -0.06450080871582031, -0.055416107177734375, -0.04633140563964844, -0.0372467041015625, -0.028162002563476562, -0.019077301025390625, -0.009992599487304688, -0.00090789794921875, 0.008176803588867188, 0.017261505126953125, 0.026346206665039062, 0.035430908203125, 0.04451560974121094, 0.053600311279296875, 0.06268501281738281, 0.07176971435546875, 0.08085441589355469, 0.08993911743164062, 0.09902381896972656, 0.1081085205078125, 0.11719322204589844, 0.12627792358398438, 0.1353626251220703, 0.14444732666015625, 0.1535320281982422, 0.16261672973632812, 0.17170143127441406, 0.1807861328125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 16.0, 19.0, 32.0, 32.0, 69.0, 143.0, 423.0, 51783.0, 994863.0, 744.0, 179.0, 96.0, 41.0, 33.0, 22.0, 15.0, 10.0, 8.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.39892578125, -4.1806640625, -3.96240234375, -3.744140625, -3.52587890625, -3.3076171875, -3.08935546875, -2.87109375, -2.65283203125, -2.4345703125, -2.21630859375, -1.998046875, -1.77978515625, -1.5615234375, -1.34326171875, -1.125, -0.90673828125, -0.6884765625, -0.47021484375, -0.251953125, -0.03369140625, 0.1845703125, 0.40283203125, 0.62109375, 0.83935546875, 1.0576171875, 1.27587890625, 1.494140625, 1.71240234375, 1.9306640625, 2.14892578125, 2.3671875, 2.58544921875, 2.8037109375, 3.02197265625, 3.240234375, 3.45849609375, 3.6767578125, 3.89501953125, 4.11328125, 4.33154296875, 4.5498046875, 4.76806640625, 4.986328125, 5.20458984375, 5.4228515625, 5.64111328125, 5.859375, 6.07763671875, 6.2958984375, 6.51416015625, 6.732421875, 6.95068359375, 7.1689453125, 7.38720703125, 7.60546875, 7.82373046875, 8.0419921875, 8.26025390625, 8.478515625, 8.69677734375, 8.9150390625, 9.13330078125, 9.3515625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 45.0, 161.0, 339.0, 283.0, 122.0, 39.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14567077159881592, -0.12084317207336426, -0.0960155725479126, -0.07118797302246094, -0.04636037349700928, -0.021532773971557617, 0.003294825553894043, 0.028122425079345703, 0.05295002460479736, 0.07777762413024902, 0.10260522365570068, 0.12743282318115234, 0.152260422706604, 0.17708802223205566, 0.20191562175750732, 0.22674322128295898, 0.25157082080841064, 0.2763984203338623, 0.30122601985931396, 0.3260536193847656, 0.3508812189102173, 0.37570881843566895, 0.4005364179611206, 0.42536401748657227, 0.4501916170120239, 0.4750192165374756, 0.49984681606292725, 0.5246744155883789, 0.5495020151138306, 0.5743296146392822, 0.5991572141647339, 0.6239848136901855, 0.6488124132156372, 0.6736400127410889, 0.6984676122665405, 0.7232952117919922, 0.7481228113174438, 0.7729504108428955, 0.7977780103683472, 0.8226056098937988, 0.8474332094192505, 0.8722608089447021, 0.8970884084701538, 0.9219160079956055, 0.9467436075210571, 0.9715712070465088, 0.9963988065719604, 1.021226406097412, 1.0460540056228638, 1.0708816051483154, 1.095709204673767, 1.1205368041992188, 1.1453644037246704, 1.170192003250122, 1.1950196027755737, 1.2198472023010254, 1.244674801826477, 1.2695024013519287, 1.2943300008773804, 1.319157600402832, 1.3439851999282837, 1.3688127994537354, 1.393640398979187, 1.4184679985046387, 1.4432955980300903]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 5.0, 9.0, 11.0, 14.0, 12.0, 17.0, 14.0, 20.0, 24.0, 17.0, 22.0, 35.0, 39.0, 36.0, 30.0, 42.0, 39.0, 40.0, 32.0, 40.0, 40.0, 27.0, 38.0, 38.0, 34.0, 37.0, 38.0, 29.0, 26.0, 19.0, 20.0, 19.0, 19.0, 17.0, 19.0, 9.0, 11.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.16896575689315796, -0.16402976214885712, -0.15909375250339508, -0.15415775775909424, -0.1492217630147934, -0.14428576827049255, -0.13934975862503052, -0.13441376388072968, -0.12947776913642883, -0.1245417669415474, -0.11960577219724655, -0.11466977000236511, -0.10973377525806427, -0.10479777306318283, -0.09986177086830139, -0.09492577612400055, -0.08998976647853851, -0.08505376428365707, -0.08011776953935623, -0.07518176734447479, -0.07024577260017395, -0.06530977040529251, -0.06037376821041107, -0.05543776974081993, -0.05050177127122879, -0.04556577280163765, -0.04062977433204651, -0.03569377213716507, -0.03075777366757393, -0.025821775197982788, -0.020885774865746498, -0.015949774533510208, -0.011013776063919067, -0.006077776663005352, -0.0011417772620916367, 0.0037942221388220787, 0.008730221539735794, 0.013666220009326935, 0.018602220341563225, 0.023538220673799515, 0.028474219143390656, 0.033410217612981796, 0.03834621608257294, 0.043282218277454376, 0.04821821674704552, 0.05315421521663666, 0.0580902174115181, 0.06302621960639954, 0.06796221435070038, 0.07289821654558182, 0.07783421128988266, 0.0827702134847641, 0.08770620822906494, 0.09264221042394638, 0.09757821261882782, 0.10251420736312866, 0.1074502095580101, 0.11238621175289154, 0.11732220649719238, 0.12225820869207382, 0.12719421088695526, 0.1321302056312561, 0.13706620037555695, 0.14200221002101898, 0.14693820476531982]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 8.0, 5.0, 12.0, 9.0, 13.0, 10.0, 25.0, 28.0, 21.0, 21.0, 36.0, 32.0, 33.0, 36.0, 46.0, 38.0, 42.0, 45.0, 48.0, 40.0, 40.0, 43.0, 31.0, 39.0, 35.0, 24.0, 22.0, 22.0, 20.0, 25.0, 23.0, 16.0, 22.0, 9.0, 15.0, 17.0, 7.0, 10.0, 5.0, 13.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3909912109375, -6.180419921875, -5.9698486328125, -5.75927734375, -5.5487060546875, -5.338134765625, -5.1275634765625, -4.9169921875, -4.7064208984375, -4.495849609375, -4.2852783203125, -4.07470703125, -3.8641357421875, -3.653564453125, -3.4429931640625, -3.232421875, -3.0218505859375, -2.811279296875, -2.6007080078125, -2.39013671875, -2.1795654296875, -1.968994140625, -1.7584228515625, -1.5478515625, -1.3372802734375, -1.126708984375, -0.9161376953125, -0.70556640625, -0.4949951171875, -0.284423828125, -0.0738525390625, 0.13671875, 0.3472900390625, 0.557861328125, 0.7684326171875, 0.97900390625, 1.1895751953125, 1.400146484375, 1.6107177734375, 1.8212890625, 2.0318603515625, 2.242431640625, 2.4530029296875, 2.66357421875, 2.8741455078125, 3.084716796875, 3.2952880859375, 3.505859375, 3.7164306640625, 3.927001953125, 4.1375732421875, 4.34814453125, 4.5587158203125, 4.769287109375, 4.9798583984375, 5.1904296875, 5.4010009765625, 5.611572265625, 5.8221435546875, 6.03271484375, 6.2432861328125, 6.453857421875, 6.6644287109375, 6.875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 8.0, 20.0, 27.0, 34.0, 33.0, 69.0, 103.0, 168.0, 221.0, 338.0, 521.0, 780.0, 1159.0, 1799.0, 2979.0, 4530.0, 7985.0, 13938.0, 26211.0, 53360.0, 127995.0, 405659.0, 235267.0, 81468.0, 37599.0, 19291.0, 10542.0, 6042.0, 3662.0, 2287.0, 1453.0, 1038.0, 647.0, 423.0, 283.0, 178.0, 119.0, 81.0, 79.0, 46.0, 27.0, 30.0, 18.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.98828125, -7.73675537109375, -7.4852294921875, -7.23370361328125, -6.982177734375, -6.73065185546875, -6.4791259765625, -6.22760009765625, -5.97607421875, -5.72454833984375, -5.4730224609375, -5.22149658203125, -4.969970703125, -4.71844482421875, -4.4669189453125, -4.21539306640625, -3.9638671875, -3.71234130859375, -3.4608154296875, -3.20928955078125, -2.957763671875, -2.70623779296875, -2.4547119140625, -2.20318603515625, -1.95166015625, -1.70013427734375, -1.4486083984375, -1.19708251953125, -0.945556640625, -0.69403076171875, -0.4425048828125, -0.19097900390625, 0.060546875, 0.31207275390625, 0.5635986328125, 0.81512451171875, 1.066650390625, 1.31817626953125, 1.5697021484375, 1.82122802734375, 2.07275390625, 2.32427978515625, 2.5758056640625, 2.82733154296875, 3.078857421875, 3.33038330078125, 3.5819091796875, 3.83343505859375, 4.0849609375, 4.33648681640625, 4.5880126953125, 4.83953857421875, 5.091064453125, 5.34259033203125, 5.5941162109375, 5.84564208984375, 6.09716796875, 6.34869384765625, 6.6002197265625, 6.85174560546875, 7.103271484375, 7.35479736328125, 7.6063232421875, 7.85784912109375, 8.109375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 2.0, 6.0, 14.0, 13.0, 8.0, 19.0, 10.0, 20.0, 32.0, 22.0, 30.0, 27.0, 42.0, 33.0, 48.0, 57.0, 106.0, 168.0, 1466.0, 357.0, 133.0, 79.0, 52.0, 38.0, 31.0, 27.0, 29.0, 33.0, 21.0, 23.0, 16.0, 16.0, 11.0, 13.0, 9.0, 9.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.78125, -21.09619140625, -20.4111328125, -19.72607421875, -19.041015625, -18.35595703125, -17.6708984375, -16.98583984375, -16.30078125, -15.61572265625, -14.9306640625, -14.24560546875, -13.560546875, -12.87548828125, -12.1904296875, -11.50537109375, -10.8203125, -10.13525390625, -9.4501953125, -8.76513671875, -8.080078125, -7.39501953125, -6.7099609375, -6.02490234375, -5.33984375, -4.65478515625, -3.9697265625, -3.28466796875, -2.599609375, -1.91455078125, -1.2294921875, -0.54443359375, 0.140625, 0.82568359375, 1.5107421875, 2.19580078125, 2.880859375, 3.56591796875, 4.2509765625, 4.93603515625, 5.62109375, 6.30615234375, 6.9912109375, 7.67626953125, 8.361328125, 9.04638671875, 9.7314453125, 10.41650390625, 11.1015625, 11.78662109375, 12.4716796875, 13.15673828125, 13.841796875, 14.52685546875, 15.2119140625, 15.89697265625, 16.58203125, 17.26708984375, 17.9521484375, 18.63720703125, 19.322265625, 20.00732421875, 20.6923828125, 21.37744140625, 22.0625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 9.0, 5.0, 7.0, 15.0, 14.0, 27.0, 23.0, 25.0, 33.0, 38.0, 36.0, 65.0, 84.0, 96.0, 143.0, 217.0, 378.0, 862.0, 4949.0, 145166.0, 2942986.0, 45871.0, 2875.0, 692.0, 326.0, 184.0, 129.0, 82.0, 82.0, 54.0, 45.0, 38.0, 28.0, 40.0, 17.0, 16.0, 17.0, 9.0, 4.0, 6.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.875, -42.43017578125, -40.9853515625, -39.54052734375, -38.095703125, -36.65087890625, -35.2060546875, -33.76123046875, -32.31640625, -30.87158203125, -29.4267578125, -27.98193359375, -26.537109375, -25.09228515625, -23.6474609375, -22.20263671875, -20.7578125, -19.31298828125, -17.8681640625, -16.42333984375, -14.978515625, -13.53369140625, -12.0888671875, -10.64404296875, -9.19921875, -7.75439453125, -6.3095703125, -4.86474609375, -3.419921875, -1.97509765625, -0.5302734375, 0.91455078125, 2.359375, 3.80419921875, 5.2490234375, 6.69384765625, 8.138671875, 9.58349609375, 11.0283203125, 12.47314453125, 13.91796875, 15.36279296875, 16.8076171875, 18.25244140625, 19.697265625, 21.14208984375, 22.5869140625, 24.03173828125, 25.4765625, 26.92138671875, 28.3662109375, 29.81103515625, 31.255859375, 32.70068359375, 34.1455078125, 35.59033203125, 37.03515625, 38.47998046875, 39.9248046875, 41.36962890625, 42.814453125, 44.25927734375, 45.7041015625, 47.14892578125, 48.59375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [306.0, 705.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9082670211792, -1.7639751434326172, 9.380316734313965, 20.524608612060547, 31.668899536132812, 42.81319046020508, 53.95748519897461, 65.10177612304688, 76.2460708618164, 87.39036560058594, 98.53465270996094, 109.67894744873047, 120.8232421875, 131.967529296875, 143.11181640625, 154.256103515625, 165.40040588378906, 176.54469299316406, 187.68899536132812, 198.83328247070312, 209.97756958007812, 221.12185668945312, 232.2661590576172, 243.4104461669922, 254.5547332763672, 265.69903564453125, 276.84332275390625, 287.98760986328125, 299.13189697265625, 310.27618408203125, 321.42047119140625, 332.56475830078125, 343.7090759277344, 354.8533630371094, 365.9976501464844, 377.1419677734375, 388.2862548828125, 399.4305419921875, 410.5748291015625, 421.7191162109375, 432.8634033203125, 444.0076904296875, 455.1519775390625, 466.2962646484375, 477.4405822753906, 488.5848693847656, 499.7291564941406, 510.8734436035156, 522.0177612304688, 533.1620483398438, 544.3063354492188, 555.4506225585938, 566.5949096679688, 577.7391967773438, 588.883544921875, 600.02783203125, 611.1720581054688, 622.3163452148438, 633.4606323242188, 644.6049194335938, 655.7492065429688, 666.8934936523438, 678.037841796875, 689.18212890625, 700.326416015625]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 13.0, 11.0, 10.0, 9.0, 12.0, 18.0, 15.0, 22.0, 18.0, 26.0, 19.0, 23.0, 29.0, 27.0, 32.0, 46.0, 34.0, 38.0, 34.0, 35.0, 39.0, 41.0, 39.0, 38.0, 36.0, 27.0, 31.0, 35.0, 30.0, 28.0, 20.0, 20.0, 17.0, 18.0, 17.0, 18.0, 10.0, 8.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-52.930999755859375, -51.380340576171875, -49.82968521118164, -48.27902603149414, -46.72836685180664, -45.177711486816406, -43.627052307128906, -42.076393127441406, -40.52573776245117, -38.97507858276367, -37.42442321777344, -35.87376403808594, -34.32310485839844, -32.7724494934082, -31.221790313720703, -29.671133041381836, -28.120473861694336, -26.56981658935547, -25.01915740966797, -23.4685001373291, -21.917842864990234, -20.367183685302734, -18.816526412963867, -17.265869140625, -15.715210914611816, -14.164552688598633, -12.613895416259766, -11.063237190246582, -9.512578964233398, -7.961921691894531, -6.411263465881348, -4.8606061935424805, -3.309947967529297, -1.759290099143982, -0.208632230758667, 1.3420257568359375, 2.892683506011963, 4.443341255187988, 5.993999481201172, 7.544656753540039, 9.095314979553223, 10.645973205566406, 12.196630477905273, 13.747288703918457, 15.29794692993164, 16.848604202270508, 18.399261474609375, 19.949920654296875, 21.500577926635742, 23.05123519897461, 24.60189437866211, 26.152551651000977, 27.703208923339844, 29.253868103027344, 30.80452537536621, 32.35518264770508, 33.90584182739258, 35.45650100708008, 37.00715637207031, 38.55781555175781, 40.10847473144531, 41.65913009643555, 43.20978927612305, 44.76044464111328, 46.31110382080078]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 5.0, 10.0, 15.0, 12.0, 21.0, 19.0, 30.0, 27.0, 27.0, 23.0, 40.0, 34.0, 38.0, 34.0, 39.0, 47.0, 31.0, 56.0, 38.0, 32.0, 44.0, 35.0, 30.0, 36.0, 27.0, 19.0, 20.0, 15.0, 26.0, 22.0, 19.0, 16.0, 13.0, 16.0, 14.0, 12.0, 12.0, 5.0, 7.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7421875, -6.52301025390625, -6.3038330078125, -6.08465576171875, -5.865478515625, -5.64630126953125, -5.4271240234375, -5.20794677734375, -4.98876953125, -4.76959228515625, -4.5504150390625, -4.33123779296875, -4.112060546875, -3.89288330078125, -3.6737060546875, -3.45452880859375, -3.2353515625, -3.01617431640625, -2.7969970703125, -2.57781982421875, -2.358642578125, -2.13946533203125, -1.9202880859375, -1.70111083984375, -1.48193359375, -1.26275634765625, -1.0435791015625, -0.82440185546875, -0.605224609375, -0.38604736328125, -0.1668701171875, 0.05230712890625, 0.271484375, 0.49066162109375, 0.7098388671875, 0.92901611328125, 1.148193359375, 1.36737060546875, 1.5865478515625, 1.80572509765625, 2.02490234375, 2.24407958984375, 2.4632568359375, 2.68243408203125, 2.901611328125, 3.12078857421875, 3.3399658203125, 3.55914306640625, 3.7783203125, 3.99749755859375, 4.2166748046875, 4.43585205078125, 4.655029296875, 4.87420654296875, 5.0933837890625, 5.31256103515625, 5.53173828125, 5.75091552734375, 5.9700927734375, 6.18927001953125, 6.408447265625, 6.62762451171875, 6.8468017578125, 7.06597900390625, 7.28515625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 14.0, 12.0, 14.0, 26.0, 39.0, 49.0, 74.0, 100.0, 185.0, 324.0, 527.0, 929.0, 1743.0, 3404.0, 7214.0, 18244.0, 59608.0, 297585.0, 1389025.0, 1833406.0, 452578.0, 86221.0, 24285.0, 9547.0, 4228.0, 2120.0, 1155.0, 607.0, 377.0, 216.0, 147.0, 90.0, 59.0, 40.0, 33.0, 20.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.149658203125, -10.79150390625, -10.433349609375, -10.0751953125, -9.717041015625, -9.35888671875, -9.000732421875, -8.642578125, -8.284423828125, -7.92626953125, -7.568115234375, -7.2099609375, -6.851806640625, -6.49365234375, -6.135498046875, -5.77734375, -5.419189453125, -5.06103515625, -4.702880859375, -4.3447265625, -3.986572265625, -3.62841796875, -3.270263671875, -2.912109375, -2.553955078125, -2.19580078125, -1.837646484375, -1.4794921875, -1.121337890625, -0.76318359375, -0.405029296875, -0.046875, 0.311279296875, 0.66943359375, 1.027587890625, 1.3857421875, 1.743896484375, 2.10205078125, 2.460205078125, 2.818359375, 3.176513671875, 3.53466796875, 3.892822265625, 4.2509765625, 4.609130859375, 4.96728515625, 5.325439453125, 5.68359375, 6.041748046875, 6.39990234375, 6.758056640625, 7.1162109375, 7.474365234375, 7.83251953125, 8.190673828125, 8.548828125, 8.906982421875, 9.26513671875, 9.623291015625, 9.9814453125, 10.339599609375, 10.69775390625, 11.055908203125, 11.4140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 8.0, 7.0, 14.0, 15.0, 16.0, 24.0, 23.0, 49.0, 48.0, 70.0, 73.0, 116.0, 177.0, 259.0, 386.0, 539.0, 578.0, 517.0, 317.0, 206.0, 170.0, 97.0, 71.0, 64.0, 48.0, 37.0, 33.0, 25.0, 21.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.40234375, -11.0, -10.59765625, -10.1953125, -9.79296875, -9.390625, -8.98828125, -8.5859375, -8.18359375, -7.78125, -7.37890625, -6.9765625, -6.57421875, -6.171875, -5.76953125, -5.3671875, -4.96484375, -4.5625, -4.16015625, -3.7578125, -3.35546875, -2.953125, -2.55078125, -2.1484375, -1.74609375, -1.34375, -0.94140625, -0.5390625, -0.13671875, 0.265625, 0.66796875, 1.0703125, 1.47265625, 1.875, 2.27734375, 2.6796875, 3.08203125, 3.484375, 3.88671875, 4.2890625, 4.69140625, 5.09375, 5.49609375, 5.8984375, 6.30078125, 6.703125, 7.10546875, 7.5078125, 7.91015625, 8.3125, 8.71484375, 9.1171875, 9.51953125, 9.921875, 10.32421875, 10.7265625, 11.12890625, 11.53125, 11.93359375, 12.3359375, 12.73828125, 13.140625, 13.54296875, 13.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 8.0, 6.0, 8.0, 11.0, 22.0, 19.0, 29.0, 47.0, 59.0, 77.0, 117.0, 141.0, 144.0, 268.0, 469.0, 1134.0, 5622.0, 125586.0, 3874023.0, 177015.0, 6818.0, 1189.0, 492.0, 266.0, 174.0, 133.0, 99.0, 86.0, 60.0, 47.0, 24.0, 26.0, 23.0, 17.0, 3.0, 5.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.0, -46.56884765625, -45.1376953125, -43.70654296875, -42.275390625, -40.84423828125, -39.4130859375, -37.98193359375, -36.55078125, -35.11962890625, -33.6884765625, -32.25732421875, -30.826171875, -29.39501953125, -27.9638671875, -26.53271484375, -25.1015625, -23.67041015625, -22.2392578125, -20.80810546875, -19.376953125, -17.94580078125, -16.5146484375, -15.08349609375, -13.65234375, -12.22119140625, -10.7900390625, -9.35888671875, -7.927734375, -6.49658203125, -5.0654296875, -3.63427734375, -2.203125, -0.77197265625, 0.6591796875, 2.09033203125, 3.521484375, 4.95263671875, 6.3837890625, 7.81494140625, 9.24609375, 10.67724609375, 12.1083984375, 13.53955078125, 14.970703125, 16.40185546875, 17.8330078125, 19.26416015625, 20.6953125, 22.12646484375, 23.5576171875, 24.98876953125, 26.419921875, 27.85107421875, 29.2822265625, 30.71337890625, 32.14453125, 33.57568359375, 35.0068359375, 36.43798828125, 37.869140625, 39.30029296875, 40.7314453125, 42.16259765625, 43.59375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 23.0, 69.0, 247.0, 411.0, 198.0, 56.0, 12.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.3002700805664, -82.17893981933594, -76.0576171875, -69.93628692626953, -63.814964294433594, -57.693634033203125, -51.57230758666992, -45.45098114013672, -39.329654693603516, -33.20832824707031, -27.08700180053711, -20.965673446655273, -14.84434700012207, -8.723020553588867, -2.6016921997070312, 3.519634246826172, 9.640960693359375, 15.762287139892578, 21.88361358642578, 28.004941940307617, 34.12626647949219, 40.247596740722656, 46.36892318725586, 52.49024963378906, 58.611576080322266, 64.73290252685547, 70.85423278808594, 76.97555541992188, 83.09688568115234, 89.21820831298828, 95.33953857421875, 101.46086120605469, 107.58219909667969, 113.70352935791016, 119.8248519897461, 125.94618225097656, 132.0675048828125, 138.18882751464844, 144.31016540527344, 150.43148803710938, 156.5528106689453, 162.67413330078125, 168.79547119140625, 174.9167938232422, 181.03811645507812, 187.15943908691406, 193.28077697753906, 199.402099609375, 205.5234375, 211.64476013183594, 217.76609802246094, 223.88742065429688, 230.0087432861328, 236.13006591796875, 242.25140380859375, 248.3727264404297, 254.49404907226562, 260.6153869628906, 266.7366943359375, 272.8580322265625, 278.9793701171875, 285.1006774902344, 291.2220153808594, 297.34332275390625, 303.46466064453125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 3.0, 15.0, 6.0, 10.0, 16.0, 14.0, 16.0, 17.0, 26.0, 27.0, 36.0, 36.0, 48.0, 41.0, 39.0, 41.0, 29.0, 41.0, 38.0, 44.0, 38.0, 37.0, 46.0, 38.0, 31.0, 30.0, 29.0, 28.0, 38.0, 18.0, 11.0, 17.0, 9.0, 9.0, 13.0, 15.0, 9.0, 5.0, 10.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-44.059242248535156, -42.73255920410156, -41.405879974365234, -40.07919692993164, -38.75251770019531, -37.42583465576172, -36.099151611328125, -34.7724723815918, -33.4457893371582, -32.11910629272461, -30.79242706298828, -29.465744018554688, -28.139062881469727, -26.812381744384766, -25.485700607299805, -24.159019470214844, -22.832338333129883, -21.505657196044922, -20.17897605895996, -18.852294921875, -17.525611877441406, -16.198930740356445, -14.872249603271484, -13.545567512512207, -12.218886375427246, -10.892205238342285, -9.565523147583008, -8.238842010498047, -6.912160396575928, -5.585478782653809, -4.258797645568848, -2.9321155548095703, -1.6054344177246094, -0.2787529230117798, 1.0479285717010498, 2.37460994720459, 3.701291561126709, 5.027973175048828, 6.354654312133789, 7.681336402893066, 9.008017539978027, 10.334698677062988, 11.661380767822266, 12.988061904907227, 14.314743041992188, 15.641425132751465, 16.96810531616211, 18.294788360595703, 19.621469497680664, 20.948150634765625, 22.274831771850586, 23.601512908935547, 24.92819595336914, 26.2548770904541, 27.581558227539062, 28.908241271972656, 30.234920501708984, 31.561601638793945, 32.888282775878906, 34.2149658203125, 35.54164505004883, 36.86832809448242, 38.19500732421875, 39.521690368652344, 40.84837341308594]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 6.0, 9.0, 11.0, 11.0, 22.0, 19.0, 18.0, 27.0, 36.0, 35.0, 32.0, 35.0, 33.0, 42.0, 36.0, 48.0, 42.0, 37.0, 37.0, 33.0, 40.0, 39.0, 32.0, 33.0, 29.0, 22.0, 33.0, 22.0, 17.0, 23.0, 18.0, 19.0, 12.0, 14.0, 9.0, 12.0, 10.0, 7.0, 6.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.29742431640625, -6.0870361328125, -5.87664794921875, -5.666259765625, -5.45587158203125, -5.2454833984375, -5.03509521484375, -4.82470703125, -4.61431884765625, -4.4039306640625, -4.19354248046875, -3.983154296875, -3.77276611328125, -3.5623779296875, -3.35198974609375, -3.1416015625, -2.93121337890625, -2.7208251953125, -2.51043701171875, -2.300048828125, -2.08966064453125, -1.8792724609375, -1.66888427734375, -1.45849609375, -1.24810791015625, -1.0377197265625, -0.82733154296875, -0.616943359375, -0.40655517578125, -0.1961669921875, 0.01422119140625, 0.224609375, 0.43499755859375, 0.6453857421875, 0.85577392578125, 1.066162109375, 1.27655029296875, 1.4869384765625, 1.69732666015625, 1.90771484375, 2.11810302734375, 2.3284912109375, 2.53887939453125, 2.749267578125, 2.95965576171875, 3.1700439453125, 3.38043212890625, 3.5908203125, 3.80120849609375, 4.0115966796875, 4.22198486328125, 4.432373046875, 4.64276123046875, 4.8531494140625, 5.06353759765625, 5.27392578125, 5.48431396484375, 5.6947021484375, 5.90509033203125, 6.115478515625, 6.32586669921875, 6.5362548828125, 6.74664306640625, 6.95703125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 8.0, 5.0, 13.0, 18.0, 27.0, 58.0, 69.0, 88.0, 156.0, 233.0, 340.0, 487.0, 730.0, 1097.0, 1526.0, 2354.0, 3606.0, 5491.0, 8422.0, 13109.0, 20611.0, 33216.0, 55214.0, 91386.0, 150280.0, 208197.0, 172202.0, 107746.0, 64645.0, 39177.0, 24607.0, 15191.0, 9642.0, 6308.0, 4171.0, 2645.0, 1827.0, 1237.0, 806.0, 515.0, 311.0, 261.0, 158.0, 120.0, 86.0, 51.0, 37.0, 30.0, 16.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.005859375, -0.974090576171875, -0.94232177734375, -0.910552978515625, -0.8787841796875, -0.847015380859375, -0.81524658203125, -0.783477783203125, -0.751708984375, -0.719940185546875, -0.68817138671875, -0.656402587890625, -0.6246337890625, -0.592864990234375, -0.56109619140625, -0.529327392578125, -0.49755859375, -0.465789794921875, -0.43402099609375, -0.402252197265625, -0.3704833984375, -0.338714599609375, -0.30694580078125, -0.275177001953125, -0.243408203125, -0.211639404296875, -0.17987060546875, -0.148101806640625, -0.1163330078125, -0.084564208984375, -0.05279541015625, -0.021026611328125, 0.0107421875, 0.042510986328125, 0.07427978515625, 0.106048583984375, 0.1378173828125, 0.169586181640625, 0.20135498046875, 0.233123779296875, 0.264892578125, 0.296661376953125, 0.32843017578125, 0.360198974609375, 0.3919677734375, 0.423736572265625, 0.45550537109375, 0.487274169921875, 0.51904296875, 0.550811767578125, 0.58258056640625, 0.614349365234375, 0.6461181640625, 0.677886962890625, 0.70965576171875, 0.741424560546875, 0.773193359375, 0.804962158203125, 0.83673095703125, 0.868499755859375, 0.9002685546875, 0.932037353515625, 0.96380615234375, 0.995574951171875, 1.02734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 6.0, 13.0, 9.0, 14.0, 16.0, 26.0, 29.0, 32.0, 23.0, 37.0, 41.0, 33.0, 41.0, 49.0, 44.0, 45.0, 1073.0, 41.0, 56.0, 50.0, 44.0, 45.0, 40.0, 39.0, 30.0, 23.0, 16.0, 20.0, 14.0, 19.0, 15.0, 5.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.0625, -5.8880615234375, -5.713623046875, -5.5391845703125, -5.36474609375, -5.1903076171875, -5.015869140625, -4.8414306640625, -4.6669921875, -4.4925537109375, -4.318115234375, -4.1436767578125, -3.96923828125, -3.7947998046875, -3.620361328125, -3.4459228515625, -3.271484375, -3.0970458984375, -2.922607421875, -2.7481689453125, -2.57373046875, -2.3992919921875, -2.224853515625, -2.0504150390625, -1.8759765625, -1.7015380859375, -1.527099609375, -1.3526611328125, -1.17822265625, -1.0037841796875, -0.829345703125, -0.6549072265625, -0.48046875, -0.3060302734375, -0.131591796875, 0.0428466796875, 0.21728515625, 0.3917236328125, 0.566162109375, 0.7406005859375, 0.9150390625, 1.0894775390625, 1.263916015625, 1.4383544921875, 1.61279296875, 1.7872314453125, 1.961669921875, 2.1361083984375, 2.310546875, 2.4849853515625, 2.659423828125, 2.8338623046875, 3.00830078125, 3.1827392578125, 3.357177734375, 3.5316162109375, 3.7060546875, 3.8804931640625, 4.054931640625, 4.2293701171875, 4.40380859375, 4.5782470703125, 4.752685546875, 4.9271240234375, 5.1015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 8.0, 7.0, 15.0, 19.0, 24.0, 26.0, 46.0, 78.0, 118.0, 165.0, 270.0, 487.0, 757.0, 1376.0, 2445.0, 5056.0, 11381.0, 28337.0, 79838.0, 271877.0, 1314106.0, 254980.0, 76391.0, 27396.0, 11201.0, 4937.0, 2444.0, 1341.0, 750.0, 461.0, 260.0, 169.0, 121.0, 59.0, 53.0, 40.0, 31.0, 13.0, 13.0, 10.0, 8.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.458984375, -1.4140625, -1.369140625, -1.32421875, -1.279296875, -1.234375, -1.189453125, -1.14453125, -1.099609375, -1.0546875, -1.009765625, -0.96484375, -0.919921875, -0.875, -0.830078125, -0.78515625, -0.740234375, -0.6953125, -0.650390625, -0.60546875, -0.560546875, -0.515625, -0.470703125, -0.42578125, -0.380859375, -0.3359375, -0.291015625, -0.24609375, -0.201171875, -0.15625, -0.111328125, -0.06640625, -0.021484375, 0.0234375, 0.068359375, 0.11328125, 0.158203125, 0.203125, 0.248046875, 0.29296875, 0.337890625, 0.3828125, 0.427734375, 0.47265625, 0.517578125, 0.5625, 0.607421875, 0.65234375, 0.697265625, 0.7421875, 0.787109375, 0.83203125, 0.876953125, 0.921875, 0.966796875, 1.01171875, 1.056640625, 1.1015625, 1.146484375, 1.19140625, 1.236328125, 1.28125, 1.326171875, 1.37109375, 1.416015625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 8.0, 13.0, 19.0, 10.0, 25.0, 23.0, 24.0, 38.0, 44.0, 40.0, 113.0, 177.0, 146.0, 50.0, 35.0, 32.0, 27.0, 23.0, 26.0, 15.0, 14.0, 7.0, 4.0, 7.0, 4.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25605010986328125, -0.2476959228515625, -0.23934173583984375, -0.230987548828125, -0.22263336181640625, -0.2142791748046875, -0.20592498779296875, -0.19757080078125, -0.18921661376953125, -0.1808624267578125, -0.17250823974609375, -0.164154052734375, -0.15579986572265625, -0.1474456787109375, -0.13909149169921875, -0.1307373046875, -0.12238311767578125, -0.1140289306640625, -0.10567474365234375, -0.097320556640625, -0.08896636962890625, -0.0806121826171875, -0.07225799560546875, -0.06390380859375, -0.05554962158203125, -0.0471954345703125, -0.03884124755859375, -0.030487060546875, -0.02213287353515625, -0.0137786865234375, -0.00542449951171875, 0.0029296875, 0.01128387451171875, 0.0196380615234375, 0.02799224853515625, 0.036346435546875, 0.04470062255859375, 0.0530548095703125, 0.06140899658203125, 0.06976318359375, 0.07811737060546875, 0.0864715576171875, 0.09482574462890625, 0.103179931640625, 0.11153411865234375, 0.1198883056640625, 0.12824249267578125, 0.1365966796875, 0.14495086669921875, 0.1533050537109375, 0.16165924072265625, 0.170013427734375, 0.17836761474609375, 0.1867218017578125, 0.19507598876953125, 0.20343017578125, 0.21178436279296875, 0.2201385498046875, 0.22849273681640625, 0.236846923828125, 0.24520111083984375, 0.2535552978515625, 0.26190948486328125, 0.270263671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 9.0, 5.0, 7.0, 13.0, 17.0, 21.0, 35.0, 47.0, 39.0, 76.0, 108.0, 184.0, 467.0, 6911.0, 1005521.0, 33441.0, 852.0, 240.0, 151.0, 84.0, 70.0, 54.0, 32.0, 31.0, 18.0, 19.0, 12.0, 8.0, 11.0, 9.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.21875, -5.05902099609375, -4.8992919921875, -4.73956298828125, -4.579833984375, -4.42010498046875, -4.2603759765625, -4.10064697265625, -3.94091796875, -3.78118896484375, -3.6214599609375, -3.46173095703125, -3.302001953125, -3.14227294921875, -2.9825439453125, -2.82281494140625, -2.6630859375, -2.50335693359375, -2.3436279296875, -2.18389892578125, -2.024169921875, -1.86444091796875, -1.7047119140625, -1.54498291015625, -1.38525390625, -1.22552490234375, -1.0657958984375, -0.90606689453125, -0.746337890625, -0.58660888671875, -0.4268798828125, -0.26715087890625, -0.107421875, 0.05230712890625, 0.2120361328125, 0.37176513671875, 0.531494140625, 0.69122314453125, 0.8509521484375, 1.01068115234375, 1.17041015625, 1.33013916015625, 1.4898681640625, 1.64959716796875, 1.809326171875, 1.96905517578125, 2.1287841796875, 2.28851318359375, 2.4482421875, 2.60797119140625, 2.7677001953125, 2.92742919921875, 3.087158203125, 3.24688720703125, 3.4066162109375, 3.56634521484375, 3.72607421875, 3.88580322265625, 4.0455322265625, 4.20526123046875, 4.364990234375, 4.52471923828125, 4.6844482421875, 4.84417724609375, 5.00390625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 21.0, 35.0, 59.0, 103.0, 159.0, 188.0, 152.0, 115.0, 65.0, 33.0, 20.0, 18.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2705734074115753, -0.25496622920036316, -0.2393590658903122, -0.22375190258026123, -0.20814472436904907, -0.1925375610589981, -0.17693039774894714, -0.16132321953773499, -0.14571605622768402, -0.13010889291763306, -0.1145017147064209, -0.09889455139636993, -0.08328738063573837, -0.06768020987510681, -0.05207304656505585, -0.036465875804424286, -0.020858705043792725, -0.0052515361458063126, 0.0103556327521801, 0.025962799787521362, 0.041569970548152924, 0.057177141308784485, 0.07278430461883545, 0.08839147537946701, 0.10399864614009857, 0.11960581690073013, 0.1352129876613617, 0.15082015097141266, 0.16642731428146362, 0.18203449249267578, 0.19764165580272675, 0.2132488191127777, 0.22885602712631226, 0.24446319043636322, 0.2600703537464142, 0.27567753195762634, 0.2912847101688385, 0.30689185857772827, 0.32249903678894043, 0.3381062150001526, 0.35371339321136475, 0.3693205714225769, 0.3849277198314667, 0.40053489804267883, 0.416142076253891, 0.43174922466278076, 0.4473564028739929, 0.4629635810852051, 0.47857072949409485, 0.494177907705307, 0.5097850561141968, 0.5253922343254089, 0.5409994125366211, 0.5566065907478333, 0.5722137689590454, 0.5878208875656128, 0.603428065776825, 0.6190352439880371, 0.6346424221992493, 0.6502496004104614, 0.6658567190170288, 0.681463897228241, 0.6970710754394531, 0.7126782536506653, 0.7282854318618774]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 8.0, 6.0, 8.0, 7.0, 6.0, 16.0, 11.0, 10.0, 16.0, 17.0, 17.0, 20.0, 31.0, 25.0, 31.0, 45.0, 38.0, 35.0, 37.0, 43.0, 28.0, 28.0, 31.0, 29.0, 33.0, 37.0, 35.0, 45.0, 28.0, 24.0, 23.0, 30.0, 30.0, 26.0, 19.0, 21.0, 14.0, 13.0, 7.0, 12.0, 7.0, 12.0, 8.0, 10.0, 5.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20523911714553833, -0.1985865980386734, -0.19193407893180847, -0.18528154492378235, -0.17862902581691742, -0.1719765067100525, -0.16532397270202637, -0.15867145359516144, -0.1520189344882965, -0.14536641538143158, -0.13871389627456665, -0.13206136226654053, -0.1254088431596756, -0.11875632405281067, -0.11210379749536514, -0.10545127093791962, -0.09879875183105469, -0.09214623272418976, -0.08549370616674423, -0.0788411796092987, -0.07218866050243378, -0.06553614139556885, -0.05888361483812332, -0.052231092005968094, -0.045578569173812866, -0.03892604634165764, -0.03227352350950241, -0.025621000677347183, -0.018968477845191956, -0.012315955013036728, -0.0056634321808815, 0.0009890906512737274, 0.007641613483428955, 0.014294136315584183, 0.02094665914773941, 0.027599181979894638, 0.034251704812049866, 0.04090422764420509, 0.04755675047636032, 0.05420927330851555, 0.060861796140670776, 0.0675143152475357, 0.07416684180498123, 0.08081936836242676, 0.08747188746929169, 0.09412440657615662, 0.10077693313360214, 0.10742945969104767, 0.1140819787979126, 0.12073449790477753, 0.12738701701164246, 0.13403955101966858, 0.1406920701265335, 0.14734458923339844, 0.15399712324142456, 0.1606496423482895, 0.16730216145515442, 0.17395468056201935, 0.18060719966888428, 0.1872597336769104, 0.19391225278377533, 0.20056477189064026, 0.20721730589866638, 0.2138698250055313, 0.22052234411239624]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 11.0, 6.0, 13.0, 16.0, 27.0, 22.0, 29.0, 30.0, 31.0, 29.0, 41.0, 40.0, 38.0, 40.0, 41.0, 48.0, 40.0, 39.0, 42.0, 43.0, 32.0, 30.0, 28.0, 29.0, 33.0, 15.0, 27.0, 26.0, 16.0, 19.0, 15.0, 19.0, 10.0, 9.0, 12.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.26171875, -7.045654296875, -6.82958984375, -6.613525390625, -6.3974609375, -6.181396484375, -5.96533203125, -5.749267578125, -5.533203125, -5.317138671875, -5.10107421875, -4.885009765625, -4.6689453125, -4.452880859375, -4.23681640625, -4.020751953125, -3.8046875, -3.588623046875, -3.37255859375, -3.156494140625, -2.9404296875, -2.724365234375, -2.50830078125, -2.292236328125, -2.076171875, -1.860107421875, -1.64404296875, -1.427978515625, -1.2119140625, -0.995849609375, -0.77978515625, -0.563720703125, -0.34765625, -0.131591796875, 0.08447265625, 0.300537109375, 0.5166015625, 0.732666015625, 0.94873046875, 1.164794921875, 1.380859375, 1.596923828125, 1.81298828125, 2.029052734375, 2.2451171875, 2.461181640625, 2.67724609375, 2.893310546875, 3.109375, 3.325439453125, 3.54150390625, 3.757568359375, 3.9736328125, 4.189697265625, 4.40576171875, 4.621826171875, 4.837890625, 5.053955078125, 5.27001953125, 5.486083984375, 5.7021484375, 5.918212890625, 6.13427734375, 6.350341796875, 6.56640625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 6.0, 13.0, 24.0, 26.0, 35.0, 47.0, 81.0, 110.0, 154.0, 212.0, 288.0, 479.0, 672.0, 946.0, 1579.0, 2361.0, 3732.0, 5980.0, 9997.0, 17606.0, 31768.0, 63285.0, 136423.0, 276410.0, 253057.0, 118041.0, 56122.0, 28801.0, 15728.0, 9173.0, 5499.0, 3414.0, 2204.0, 1375.0, 917.0, 597.0, 391.0, 312.0, 222.0, 122.0, 85.0, 62.0, 73.0, 29.0, 26.0, 18.0, 16.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.89453125, -7.6546630859375, -7.414794921875, -7.1749267578125, -6.93505859375, -6.6951904296875, -6.455322265625, -6.2154541015625, -5.9755859375, -5.7357177734375, -5.495849609375, -5.2559814453125, -5.01611328125, -4.7762451171875, -4.536376953125, -4.2965087890625, -4.056640625, -3.8167724609375, -3.576904296875, -3.3370361328125, -3.09716796875, -2.8572998046875, -2.617431640625, -2.3775634765625, -2.1376953125, -1.8978271484375, -1.657958984375, -1.4180908203125, -1.17822265625, -0.9383544921875, -0.698486328125, -0.4586181640625, -0.21875, 0.0211181640625, 0.260986328125, 0.5008544921875, 0.74072265625, 0.9805908203125, 1.220458984375, 1.4603271484375, 1.7001953125, 1.9400634765625, 2.179931640625, 2.4197998046875, 2.65966796875, 2.8995361328125, 3.139404296875, 3.3792724609375, 3.619140625, 3.8590087890625, 4.098876953125, 4.3387451171875, 4.57861328125, 4.8184814453125, 5.058349609375, 5.2982177734375, 5.5380859375, 5.7779541015625, 6.017822265625, 6.2576904296875, 6.49755859375, 6.7374267578125, 6.977294921875, 7.2171630859375, 7.45703125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 7.0, 9.0, 12.0, 14.0, 19.0, 13.0, 15.0, 24.0, 24.0, 26.0, 28.0, 30.0, 41.0, 52.0, 65.0, 72.0, 135.0, 287.0, 1341.0, 223.0, 123.0, 84.0, 50.0, 40.0, 44.0, 41.0, 23.0, 31.0, 19.0, 19.0, 25.0, 16.0, 15.0, 11.0, 15.0, 6.0, 5.0, 6.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 3.0], "bins": [-23.359375, -22.718505859375, -22.07763671875, -21.436767578125, -20.7958984375, -20.155029296875, -19.51416015625, -18.873291015625, -18.232421875, -17.591552734375, -16.95068359375, -16.309814453125, -15.6689453125, -15.028076171875, -14.38720703125, -13.746337890625, -13.10546875, -12.464599609375, -11.82373046875, -11.182861328125, -10.5419921875, -9.901123046875, -9.26025390625, -8.619384765625, -7.978515625, -7.337646484375, -6.69677734375, -6.055908203125, -5.4150390625, -4.774169921875, -4.13330078125, -3.492431640625, -2.8515625, -2.210693359375, -1.56982421875, -0.928955078125, -0.2880859375, 0.352783203125, 0.99365234375, 1.634521484375, 2.275390625, 2.916259765625, 3.55712890625, 4.197998046875, 4.8388671875, 5.479736328125, 6.12060546875, 6.761474609375, 7.40234375, 8.043212890625, 8.68408203125, 9.324951171875, 9.9658203125, 10.606689453125, 11.24755859375, 11.888427734375, 12.529296875, 13.170166015625, 13.81103515625, 14.451904296875, 15.0927734375, 15.733642578125, 16.37451171875, 17.015380859375, 17.65625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 9.0, 18.0, 14.0, 13.0, 16.0, 33.0, 32.0, 33.0, 52.0, 90.0, 108.0, 141.0, 213.0, 316.0, 551.0, 1442.0, 8278.0, 105742.0, 2792083.0, 220279.0, 12425.0, 1987.0, 643.0, 281.0, 239.0, 159.0, 109.0, 92.0, 49.0, 50.0, 45.0, 29.0, 21.0, 18.0, 20.0, 13.0, 10.0, 14.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-37.0625, -35.95947265625, -34.8564453125, -33.75341796875, -32.650390625, -31.54736328125, -30.4443359375, -29.34130859375, -28.23828125, -27.13525390625, -26.0322265625, -24.92919921875, -23.826171875, -22.72314453125, -21.6201171875, -20.51708984375, -19.4140625, -18.31103515625, -17.2080078125, -16.10498046875, -15.001953125, -13.89892578125, -12.7958984375, -11.69287109375, -10.58984375, -9.48681640625, -8.3837890625, -7.28076171875, -6.177734375, -5.07470703125, -3.9716796875, -2.86865234375, -1.765625, -0.66259765625, 0.4404296875, 1.54345703125, 2.646484375, 3.74951171875, 4.8525390625, 5.95556640625, 7.05859375, 8.16162109375, 9.2646484375, 10.36767578125, 11.470703125, 12.57373046875, 13.6767578125, 14.77978515625, 15.8828125, 16.98583984375, 18.0888671875, 19.19189453125, 20.294921875, 21.39794921875, 22.5009765625, 23.60400390625, 24.70703125, 25.81005859375, 26.9130859375, 28.01611328125, 29.119140625, 30.22216796875, 31.3251953125, 32.42822265625, 33.53125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [3.0, 3.0, 287.0, 684.0, 36.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.933895111083984, -21.49590301513672, -12.057910919189453, -2.6199188232421875, 6.818073272705078, 16.256065368652344, 25.69405746459961, 35.13205337524414, 44.57004165649414, 54.008033752441406, 63.44602584838867, 72.88401794433594, 82.32200622558594, 91.76000213623047, 101.197998046875, 110.635986328125, 120.073974609375, 129.511962890625, 138.949951171875, 148.38795471191406, 157.82594299316406, 167.26393127441406, 176.70193481445312, 186.13992309570312, 195.57791137695312, 205.01589965820312, 214.45388793945312, 223.8918914794922, 233.3298797607422, 242.7678680419922, 252.20587158203125, 261.64385986328125, 271.08184814453125, 280.51983642578125, 289.95782470703125, 299.39581298828125, 308.83380126953125, 318.2718200683594, 327.7098083496094, 337.1477966308594, 346.5857849121094, 356.0237731933594, 365.4617614746094, 374.8997497558594, 384.3377685546875, 393.7757568359375, 403.2137451171875, 412.6517333984375, 422.0897216796875, 431.5277099609375, 440.9656982421875, 450.4036865234375, 459.8416748046875, 469.2796936035156, 478.7176818847656, 488.1556701660156, 497.5936584472656, 507.0316467285156, 516.4696655273438, 525.9076538085938, 535.3456420898438, 544.7836303710938, 554.2216186523438, 563.6596069335938, 573.0975952148438]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 7.0, 14.0, 8.0, 7.0, 12.0, 17.0, 17.0, 22.0, 20.0, 25.0, 24.0, 40.0, 30.0, 35.0, 37.0, 34.0, 34.0, 46.0, 34.0, 44.0, 42.0, 34.0, 40.0, 39.0, 32.0, 32.0, 27.0, 32.0, 30.0, 20.0, 22.0, 27.0, 23.0, 23.0, 10.0, 7.0, 7.0, 14.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.67521667480469, -48.023345947265625, -46.37147903442383, -44.719608306884766, -43.06774139404297, -41.415870666503906, -39.763999938964844, -38.11213302612305, -36.460262298583984, -34.80839157104492, -33.156524658203125, -31.504653930664062, -29.852785110473633, -28.200916290283203, -26.549047470092773, -24.897178649902344, -23.245309829711914, -21.593441009521484, -19.941572189331055, -18.289703369140625, -16.637832641601562, -14.985963821411133, -13.334095001220703, -11.682225227355957, -10.030356407165527, -8.378487586975098, -6.726617813110352, -5.074748992919922, -3.422879695892334, -1.771010398864746, -0.1191415786743164, 1.5327281951904297, 3.1845970153808594, 4.836466312408447, 6.488335609436035, 8.140204429626465, 9.792074203491211, 11.44394302368164, 13.09581184387207, 14.747681617736816, 16.399551391601562, 18.051420211791992, 19.703289031982422, 21.355159759521484, 23.007028579711914, 24.658897399902344, 26.310766220092773, 27.962635040283203, 29.614503860473633, 31.266372680664062, 32.918243408203125, 34.57011032104492, 36.221981048583984, 37.87384796142578, 39.525718688964844, 41.177589416503906, 42.8294563293457, 44.481327056884766, 46.13319396972656, 47.785064697265625, 49.43693161010742, 51.088802337646484, 52.74066925048828, 54.392539978027344, 56.044410705566406]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 13.0, 18.0, 10.0, 19.0, 17.0, 34.0, 24.0, 42.0, 33.0, 43.0, 37.0, 34.0, 52.0, 40.0, 48.0, 40.0, 37.0, 43.0, 36.0, 32.0, 44.0, 35.0, 32.0, 26.0, 24.0, 26.0, 19.0, 27.0, 15.0, 16.0, 20.0, 9.0, 8.0, 13.0, 3.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.6077880859375, -7.375732421875, -7.1436767578125, -6.91162109375, -6.6795654296875, -6.447509765625, -6.2154541015625, -5.9833984375, -5.7513427734375, -5.519287109375, -5.2872314453125, -5.05517578125, -4.8231201171875, -4.591064453125, -4.3590087890625, -4.126953125, -3.8948974609375, -3.662841796875, -3.4307861328125, -3.19873046875, -2.9666748046875, -2.734619140625, -2.5025634765625, -2.2705078125, -2.0384521484375, -1.806396484375, -1.5743408203125, -1.34228515625, -1.1102294921875, -0.878173828125, -0.6461181640625, -0.4140625, -0.1820068359375, 0.050048828125, 0.2821044921875, 0.51416015625, 0.7462158203125, 0.978271484375, 1.2103271484375, 1.4423828125, 1.6744384765625, 1.906494140625, 2.1385498046875, 2.37060546875, 2.6026611328125, 2.834716796875, 3.0667724609375, 3.298828125, 3.5308837890625, 3.762939453125, 3.9949951171875, 4.22705078125, 4.4591064453125, 4.691162109375, 4.9232177734375, 5.1552734375, 5.3873291015625, 5.619384765625, 5.8514404296875, 6.08349609375, 6.3155517578125, 6.547607421875, 6.7796630859375, 7.01171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 8.0, 14.0, 17.0, 20.0, 20.0, 37.0, 77.0, 74.0, 118.0, 204.0, 309.0, 541.0, 1033.0, 2059.0, 4286.0, 10478.0, 29729.0, 120237.0, 697800.0, 2323636.0, 811034.0, 137418.0, 33496.0, 11538.0, 5007.0, 2314.0, 1125.0, 640.0, 355.0, 198.0, 139.0, 88.0, 64.0, 49.0, 38.0, 18.0, 15.0, 10.0, 13.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-12.875, -12.522705078125, -12.17041015625, -11.818115234375, -11.4658203125, -11.113525390625, -10.76123046875, -10.408935546875, -10.056640625, -9.704345703125, -9.35205078125, -8.999755859375, -8.6474609375, -8.295166015625, -7.94287109375, -7.590576171875, -7.23828125, -6.885986328125, -6.53369140625, -6.181396484375, -5.8291015625, -5.476806640625, -5.12451171875, -4.772216796875, -4.419921875, -4.067626953125, -3.71533203125, -3.363037109375, -3.0107421875, -2.658447265625, -2.30615234375, -1.953857421875, -1.6015625, -1.249267578125, -0.89697265625, -0.544677734375, -0.1923828125, 0.159912109375, 0.51220703125, 0.864501953125, 1.216796875, 1.569091796875, 1.92138671875, 2.273681640625, 2.6259765625, 2.978271484375, 3.33056640625, 3.682861328125, 4.03515625, 4.387451171875, 4.73974609375, 5.092041015625, 5.4443359375, 5.796630859375, 6.14892578125, 6.501220703125, 6.853515625, 7.205810546875, 7.55810546875, 7.910400390625, 8.2626953125, 8.614990234375, 8.96728515625, 9.319580078125, 9.671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 19.0, 23.0, 28.0, 28.0, 51.0, 84.0, 113.0, 168.0, 284.0, 378.0, 581.0, 600.0, 481.0, 365.0, 242.0, 146.0, 108.0, 82.0, 63.0, 50.0, 27.0, 30.0, 13.0, 12.0, 13.0, 11.0, 11.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.6451416015625, -8.274658203125, -7.9041748046875, -7.53369140625, -7.1632080078125, -6.792724609375, -6.4222412109375, -6.0517578125, -5.6812744140625, -5.310791015625, -4.9403076171875, -4.56982421875, -4.1993408203125, -3.828857421875, -3.4583740234375, -3.087890625, -2.7174072265625, -2.346923828125, -1.9764404296875, -1.60595703125, -1.2354736328125, -0.864990234375, -0.4945068359375, -0.1240234375, 0.2464599609375, 0.616943359375, 0.9874267578125, 1.35791015625, 1.7283935546875, 2.098876953125, 2.4693603515625, 2.83984375, 3.2103271484375, 3.580810546875, 3.9512939453125, 4.32177734375, 4.6922607421875, 5.062744140625, 5.4332275390625, 5.8037109375, 6.1741943359375, 6.544677734375, 6.9151611328125, 7.28564453125, 7.6561279296875, 8.026611328125, 8.3970947265625, 8.767578125, 9.1380615234375, 9.508544921875, 9.8790283203125, 10.24951171875, 10.6199951171875, 10.990478515625, 11.3609619140625, 11.7314453125, 12.1019287109375, 12.472412109375, 12.8428955078125, 13.21337890625, 13.5838623046875, 13.954345703125, 14.3248291015625, 14.6953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 15.0, 12.0, 11.0, 14.0, 24.0, 36.0, 43.0, 59.0, 110.0, 148.0, 197.0, 423.0, 1097.0, 6228.0, 90057.0, 3523261.0, 548953.0, 19883.0, 2290.0, 607.0, 294.0, 167.0, 92.0, 72.0, 37.0, 34.0, 29.0, 19.0, 14.0, 14.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-47.53125, -46.335205078125, -45.13916015625, -43.943115234375, -42.7470703125, -41.551025390625, -40.35498046875, -39.158935546875, -37.962890625, -36.766845703125, -35.57080078125, -34.374755859375, -33.1787109375, -31.982666015625, -30.78662109375, -29.590576171875, -28.39453125, -27.198486328125, -26.00244140625, -24.806396484375, -23.6103515625, -22.414306640625, -21.21826171875, -20.022216796875, -18.826171875, -17.630126953125, -16.43408203125, -15.238037109375, -14.0419921875, -12.845947265625, -11.64990234375, -10.453857421875, -9.2578125, -8.061767578125, -6.86572265625, -5.669677734375, -4.4736328125, -3.277587890625, -2.08154296875, -0.885498046875, 0.310546875, 1.506591796875, 2.70263671875, 3.898681640625, 5.0947265625, 6.290771484375, 7.48681640625, 8.682861328125, 9.87890625, 11.074951171875, 12.27099609375, 13.467041015625, 14.6630859375, 15.859130859375, 17.05517578125, 18.251220703125, 19.447265625, 20.643310546875, 21.83935546875, 23.035400390625, 24.2314453125, 25.427490234375, 26.62353515625, 27.819580078125, 29.015625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 14.0, 108.0, 382.0, 388.0, 104.0, 13.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.61289978027344, -146.72996520996094, -140.84703063964844, -134.964111328125, -129.0811767578125, -123.1982421875, -117.3153076171875, -111.432373046875, -105.54944610595703, -99.66651153564453, -93.78358459472656, -87.90065002441406, -82.01771545410156, -76.1347885131836, -70.2518539428711, -64.36892700195312, -58.485992431640625, -52.60306167602539, -46.720130920410156, -40.837196350097656, -34.95426559448242, -29.071334838867188, -23.188400268554688, -17.305469512939453, -11.422538757324219, -5.539607048034668, 0.3433246612548828, 6.22625732421875, 12.109188079833984, 17.99211883544922, 23.87505340576172, 29.757984161376953, 35.64093017578125, 41.523860931396484, 47.40679168701172, 53.28972625732422, 59.17265701293945, 65.05558776855469, 70.93852233886719, 76.82145690917969, 82.70438385009766, 88.58731842041016, 94.47024536132812, 100.35317993164062, 106.23611450195312, 112.1190414428711, 118.0019760131836, 123.88490295410156, 129.76783752441406, 135.65077209472656, 141.53370666503906, 147.4166259765625, 153.299560546875, 159.1824951171875, 165.0654296875, 170.9483642578125, 176.831298828125, 182.7142333984375, 188.59716796875, 194.4801025390625, 200.36302185058594, 206.24595642089844, 212.12889099121094, 218.01182556152344, 223.89474487304688]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 6.0, 4.0, 13.0, 12.0, 15.0, 13.0, 12.0, 19.0, 24.0, 26.0, 30.0, 22.0, 31.0, 38.0, 30.0, 39.0, 40.0, 37.0, 33.0, 35.0, 37.0, 46.0, 36.0, 43.0, 42.0, 24.0, 30.0, 37.0, 41.0, 28.0, 21.0, 23.0, 14.0, 12.0, 16.0, 18.0, 6.0, 9.0, 6.0, 10.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.40915298461914, -31.302013397216797, -30.194873809814453, -29.08773422241211, -27.980594635009766, -26.873455047607422, -25.766313552856445, -24.6591739654541, -23.552034378051758, -22.444894790649414, -21.33775520324707, -20.230615615844727, -19.12347412109375, -18.016334533691406, -16.909194946289062, -15.802055358886719, -14.694915771484375, -13.587776184082031, -12.480636596679688, -11.373496055603027, -10.266356468200684, -9.15921688079834, -8.05207633972168, -6.944936752319336, -5.837797164916992, -4.730657577514648, -3.6235175132751465, -2.5163776874542236, -1.4092378616333008, -0.30209827423095703, 0.8050417900085449, 1.9121818542480469, 3.019317626953125, 4.126457214355469, 5.233597278594971, 6.340737342834473, 7.447876930236816, 8.55501651763916, 9.66215705871582, 10.769296646118164, 11.876436233520508, 12.983575820922852, 14.090715408325195, 15.197855949401855, 16.304996490478516, 17.41213607788086, 18.519275665283203, 19.626415252685547, 20.73355484008789, 21.840694427490234, 22.947834014892578, 24.054973602294922, 25.162113189697266, 26.26925277709961, 27.376394271850586, 28.48353385925293, 29.590673446655273, 30.697813034057617, 31.80495262145996, 32.91209411621094, 34.01923370361328, 35.126373291015625, 36.23351287841797, 37.34065246582031, 38.447792053222656]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 3.0, 14.0, 21.0, 28.0, 23.0, 27.0, 29.0, 33.0, 40.0, 38.0, 35.0, 37.0, 39.0, 40.0, 45.0, 48.0, 47.0, 52.0, 33.0, 47.0, 43.0, 32.0, 33.0, 25.0, 19.0, 21.0, 26.0, 18.0, 13.0, 10.0, 12.0, 11.0, 11.0, 6.0, 10.0, 1.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1640625, -6.9366455078125, -6.709228515625, -6.4818115234375, -6.25439453125, -6.0269775390625, -5.799560546875, -5.5721435546875, -5.3447265625, -5.1173095703125, -4.889892578125, -4.6624755859375, -4.43505859375, -4.2076416015625, -3.980224609375, -3.7528076171875, -3.525390625, -3.2979736328125, -3.070556640625, -2.8431396484375, -2.61572265625, -2.3883056640625, -2.160888671875, -1.9334716796875, -1.7060546875, -1.4786376953125, -1.251220703125, -1.0238037109375, -0.79638671875, -0.5689697265625, -0.341552734375, -0.1141357421875, 0.11328125, 0.3406982421875, 0.568115234375, 0.7955322265625, 1.02294921875, 1.2503662109375, 1.477783203125, 1.7052001953125, 1.9326171875, 2.1600341796875, 2.387451171875, 2.6148681640625, 2.84228515625, 3.0697021484375, 3.297119140625, 3.5245361328125, 3.751953125, 3.9793701171875, 4.206787109375, 4.4342041015625, 4.66162109375, 4.8890380859375, 5.116455078125, 5.3438720703125, 5.5712890625, 5.7987060546875, 6.026123046875, 6.2535400390625, 6.48095703125, 6.7083740234375, 6.935791015625, 7.1632080078125, 7.390625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 9.0, 14.0, 12.0, 18.0, 39.0, 46.0, 53.0, 81.0, 139.0, 158.0, 225.0, 319.0, 422.0, 615.0, 892.0, 1350.0, 1908.0, 2906.0, 4277.0, 6289.0, 9727.0, 14817.0, 23010.0, 36879.0, 58996.0, 98129.0, 158618.0, 203381.0, 160788.0, 99406.0, 59676.0, 37215.0, 22986.0, 14944.0, 9785.0, 6569.0, 4286.0, 2885.0, 2034.0, 1408.0, 1004.0, 661.0, 450.0, 333.0, 242.0, 165.0, 111.0, 76.0, 64.0, 41.0, 33.0, 27.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 5.0], "bins": [-0.81689453125, -0.7917709350585938, -0.7666473388671875, -0.7415237426757812, -0.716400146484375, -0.6912765502929688, -0.6661529541015625, -0.6410293579101562, -0.61590576171875, -0.5907821655273438, -0.5656585693359375, -0.5405349731445312, -0.515411376953125, -0.49028778076171875, -0.4651641845703125, -0.44004058837890625, -0.4149169921875, -0.38979339599609375, -0.3646697998046875, -0.33954620361328125, -0.314422607421875, -0.28929901123046875, -0.2641754150390625, -0.23905181884765625, -0.21392822265625, -0.18880462646484375, -0.1636810302734375, -0.13855743408203125, -0.113433837890625, -0.08831024169921875, -0.0631866455078125, -0.03806304931640625, -0.012939453125, 0.01218414306640625, 0.0373077392578125, 0.06243133544921875, 0.087554931640625, 0.11267852783203125, 0.1378021240234375, 0.16292572021484375, 0.18804931640625, 0.21317291259765625, 0.2382965087890625, 0.26342010498046875, 0.288543701171875, 0.31366729736328125, 0.3387908935546875, 0.36391448974609375, 0.3890380859375, 0.41416168212890625, 0.4392852783203125, 0.46440887451171875, 0.489532470703125, 0.5146560668945312, 0.5397796630859375, 0.5649032592773438, 0.59002685546875, 0.6151504516601562, 0.6402740478515625, 0.6653976440429688, 0.690521240234375, 0.7156448364257812, 0.7407684326171875, 0.7658920288085938, 0.791015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 9.0, 7.0, 8.0, 5.0, 11.0, 19.0, 19.0, 20.0, 14.0, 25.0, 30.0, 30.0, 27.0, 37.0, 27.0, 35.0, 41.0, 53.0, 50.0, 1076.0, 44.0, 37.0, 41.0, 43.0, 60.0, 30.0, 29.0, 36.0, 27.0, 21.0, 24.0, 19.0, 13.0, 9.0, 10.0, 10.0, 7.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.00726318359375, -4.8465576171875, -4.68585205078125, -4.525146484375, -4.36444091796875, -4.2037353515625, -4.04302978515625, -3.88232421875, -3.72161865234375, -3.5609130859375, -3.40020751953125, -3.239501953125, -3.07879638671875, -2.9180908203125, -2.75738525390625, -2.5966796875, -2.43597412109375, -2.2752685546875, -2.11456298828125, -1.953857421875, -1.79315185546875, -1.6324462890625, -1.47174072265625, -1.31103515625, -1.15032958984375, -0.9896240234375, -0.82891845703125, -0.668212890625, -0.50750732421875, -0.3468017578125, -0.18609619140625, -0.025390625, 0.13531494140625, 0.2960205078125, 0.45672607421875, 0.617431640625, 0.77813720703125, 0.9388427734375, 1.09954833984375, 1.26025390625, 1.42095947265625, 1.5816650390625, 1.74237060546875, 1.903076171875, 2.06378173828125, 2.2244873046875, 2.38519287109375, 2.5458984375, 2.70660400390625, 2.8673095703125, 3.02801513671875, 3.188720703125, 3.34942626953125, 3.5101318359375, 3.67083740234375, 3.83154296875, 3.99224853515625, 4.1529541015625, 4.31365966796875, 4.474365234375, 4.63507080078125, 4.7957763671875, 4.95648193359375, 5.1171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 20.0, 28.0, 32.0, 57.0, 104.0, 174.0, 303.0, 577.0, 1109.0, 2138.0, 4745.0, 10561.0, 24522.0, 60870.0, 167327.0, 1196999.0, 434337.0, 116362.0, 43645.0, 18120.0, 7875.0, 3581.0, 1738.0, 851.0, 443.0, 228.0, 145.0, 84.0, 53.0, 20.0, 26.0, 10.0, 9.0, 11.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8490982055664062, -0.8148956298828125, -0.7806930541992188, -0.746490478515625, -0.7122879028320312, -0.6780853271484375, -0.6438827514648438, -0.60968017578125, -0.5754776000976562, -0.5412750244140625, -0.5070724487304688, -0.472869873046875, -0.43866729736328125, -0.4044647216796875, -0.37026214599609375, -0.3360595703125, -0.30185699462890625, -0.2676544189453125, -0.23345184326171875, -0.199249267578125, -0.16504669189453125, -0.1308441162109375, -0.09664154052734375, -0.06243896484375, -0.02823638916015625, 0.0059661865234375, 0.04016876220703125, 0.074371337890625, 0.10857391357421875, 0.1427764892578125, 0.17697906494140625, 0.211181640625, 0.24538421630859375, 0.2795867919921875, 0.31378936767578125, 0.347991943359375, 0.38219451904296875, 0.4163970947265625, 0.45059967041015625, 0.48480224609375, 0.5190048217773438, 0.5532073974609375, 0.5874099731445312, 0.621612548828125, 0.6558151245117188, 0.6900177001953125, 0.7242202758789062, 0.7584228515625, 0.7926254272460938, 0.8268280029296875, 0.8610305786132812, 0.895233154296875, 0.9294357299804688, 0.9636383056640625, 0.9978408813476562, 1.03204345703125, 1.0662460327148438, 1.1004486083984375, 1.1346511840820312, 1.168853759765625, 1.2030563354492188, 1.2372589111328125, 1.2714614868164062, 1.3056640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 9.0, 14.0, 24.0, 15.0, 48.0, 58.0, 81.0, 122.0, 119.0, 138.0, 102.0, 74.0, 46.0, 30.0, 31.0, 21.0, 13.0, 15.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13861846923828125, -0.1334381103515625, -0.12825775146484375, -0.123077392578125, -0.11789703369140625, -0.1127166748046875, -0.10753631591796875, -0.10235595703125, -0.09717559814453125, -0.0919952392578125, -0.08681488037109375, -0.081634521484375, -0.07645416259765625, -0.0712738037109375, -0.06609344482421875, -0.0609130859375, -0.05573272705078125, -0.0505523681640625, -0.04537200927734375, -0.040191650390625, -0.03501129150390625, -0.0298309326171875, -0.02465057373046875, -0.01947021484375, -0.01428985595703125, -0.0091094970703125, -0.00392913818359375, 0.001251220703125, 0.00643157958984375, 0.0116119384765625, 0.01679229736328125, 0.02197265625, 0.02715301513671875, 0.0323333740234375, 0.03751373291015625, 0.042694091796875, 0.04787445068359375, 0.0530548095703125, 0.05823516845703125, 0.06341552734375, 0.06859588623046875, 0.0737762451171875, 0.07895660400390625, 0.084136962890625, 0.08931732177734375, 0.0944976806640625, 0.09967803955078125, 0.1048583984375, 0.11003875732421875, 0.1152191162109375, 0.12039947509765625, 0.125579833984375, 0.13076019287109375, 0.1359405517578125, 0.14112091064453125, 0.14630126953125, 0.15148162841796875, 0.1566619873046875, 0.16184234619140625, 0.167022705078125, 0.17220306396484375, 0.1773834228515625, 0.18256378173828125, 0.187744140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 12.0, 13.0, 12.0, 11.0, 20.0, 29.0, 61.0, 84.0, 178.0, 494.0, 348892.0, 697810.0, 503.0, 189.0, 100.0, 47.0, 27.0, 13.0, 19.0, 15.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.47265625, -4.348480224609375, -4.22430419921875, -4.100128173828125, -3.9759521484375, -3.851776123046875, -3.72760009765625, -3.603424072265625, -3.479248046875, -3.355072021484375, -3.23089599609375, -3.106719970703125, -2.9825439453125, -2.858367919921875, -2.73419189453125, -2.610015869140625, -2.48583984375, -2.361663818359375, -2.23748779296875, -2.113311767578125, -1.9891357421875, -1.864959716796875, -1.74078369140625, -1.616607666015625, -1.492431640625, -1.368255615234375, -1.24407958984375, -1.119903564453125, -0.9957275390625, -0.871551513671875, -0.74737548828125, -0.623199462890625, -0.4990234375, -0.374847412109375, -0.25067138671875, -0.126495361328125, -0.0023193359375, 0.121856689453125, 0.24603271484375, 0.370208740234375, 0.494384765625, 0.618560791015625, 0.74273681640625, 0.866912841796875, 0.9910888671875, 1.115264892578125, 1.23944091796875, 1.363616943359375, 1.48779296875, 1.611968994140625, 1.73614501953125, 1.860321044921875, 1.9844970703125, 2.108673095703125, 2.23284912109375, 2.357025146484375, 2.481201171875, 2.605377197265625, 2.72955322265625, 2.853729248046875, 2.9779052734375, 3.102081298828125, 3.22625732421875, 3.350433349609375, 3.474609375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 119.0, 643.0, 232.0, 19.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06312727183103561, -0.03839648887515068, -0.013665705919265747, 0.011065073311328888, 0.03579585999250412, 0.06052664667367935, 0.08525741845369339, 0.10998820513486862, 0.13471898436546326, 0.1594497710466385, 0.18418055772781372, 0.20891132950782776, 0.233642116189003, 0.2583729028701782, 0.28310367465019226, 0.3078344464302063, 0.3325652480125427, 0.35729601979255676, 0.3820268213748932, 0.4067575931549072, 0.43148839473724365, 0.4562191665172577, 0.48094993829727173, 0.5056807398796082, 0.5304115414619446, 0.555142343044281, 0.5798730850219727, 0.6046038866043091, 0.6293346881866455, 0.6540654897689819, 0.6787962317466736, 0.70352703332901, 0.7282577753067017, 0.7529885768890381, 0.7777193188667297, 0.8024501204490662, 0.8271809220314026, 0.8519116640090942, 0.8766424655914307, 0.9013732671737671, 0.9261040687561035, 0.9508348703384399, 0.9755656123161316, 1.0002963542938232, 1.0250271558761597, 1.049757957458496, 1.0744887590408325, 1.099219560623169, 1.1239502429962158, 1.1486810445785522, 1.1734118461608887, 1.1981425285339355, 1.222873330116272, 1.2476041316986084, 1.2723349332809448, 1.2970657348632812, 1.3217965364456177, 1.346527338027954, 1.3712581396102905, 1.395988941192627, 1.4207196235656738, 1.4454504251480103, 1.4701812267303467, 1.494912028312683, 1.5196428298950195]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 6.0, 8.0, 18.0, 12.0, 17.0, 21.0, 27.0, 28.0, 22.0, 37.0, 39.0, 34.0, 35.0, 47.0, 26.0, 34.0, 31.0, 43.0, 39.0, 37.0, 36.0, 36.0, 38.0, 32.0, 23.0, 43.0, 30.0, 28.0, 20.0, 26.0, 20.0, 20.0, 17.0, 10.0, 15.0, 7.0, 10.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11109155416488647, -0.10736467689275742, -0.10363780707120895, -0.0999109297990799, -0.09618405997753143, -0.09245718270540237, -0.08873030543327332, -0.08500343561172485, -0.0812765583395958, -0.07754968106746674, -0.07382281124591827, -0.07009593397378922, -0.06636905670166016, -0.0626421868801117, -0.058915309607982635, -0.055188436061143875, -0.051461562514305115, -0.047734688967466354, -0.044007815420627594, -0.040280938148498535, -0.036554064601659775, -0.032827191054821014, -0.029100315645337105, -0.025373440235853195, -0.021646566689014435, -0.017919693142175674, -0.014192817732691765, -0.01046594325453043, -0.006739068776369095, -0.0030121952295303345, 0.0007146801799535751, 0.004441555589437485, 0.008168429136276245, 0.01189530361443758, 0.015622178092598915, 0.019349053502082825, 0.023075927048921585, 0.026802800595760345, 0.030529676005244255, 0.034256551414728165, 0.037983424961566925, 0.041710298508405685, 0.045437172055244446, 0.049164049327373505, 0.052890922874212265, 0.056617796421051025, 0.060344673693180084, 0.06407155096530914, 0.0677984207868576, 0.07152529805898666, 0.07525216788053513, 0.07897904515266418, 0.08270591497421265, 0.0864327922463417, 0.09015966951847076, 0.09388653934001923, 0.09761341661214828, 0.10134029388427734, 0.1050671637058258, 0.10879404097795486, 0.11252091825008392, 0.11624778807163239, 0.11997466534376144, 0.1237015426158905, 0.12742841243743896]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 7.0, 22.0, 24.0, 36.0, 27.0, 45.0, 36.0, 32.0, 53.0, 31.0, 47.0, 52.0, 42.0, 51.0, 60.0, 32.0, 33.0, 41.0, 48.0, 30.0, 42.0, 28.0, 30.0, 15.0, 20.0, 25.0, 9.0, 7.0, 15.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.37451171875, -7.1318359375, -6.88916015625, -6.646484375, -6.40380859375, -6.1611328125, -5.91845703125, -5.67578125, -5.43310546875, -5.1904296875, -4.94775390625, -4.705078125, -4.46240234375, -4.2197265625, -3.97705078125, -3.734375, -3.49169921875, -3.2490234375, -3.00634765625, -2.763671875, -2.52099609375, -2.2783203125, -2.03564453125, -1.79296875, -1.55029296875, -1.3076171875, -1.06494140625, -0.822265625, -0.57958984375, -0.3369140625, -0.09423828125, 0.1484375, 0.39111328125, 0.6337890625, 0.87646484375, 1.119140625, 1.36181640625, 1.6044921875, 1.84716796875, 2.08984375, 2.33251953125, 2.5751953125, 2.81787109375, 3.060546875, 3.30322265625, 3.5458984375, 3.78857421875, 4.03125, 4.27392578125, 4.5166015625, 4.75927734375, 5.001953125, 5.24462890625, 5.4873046875, 5.72998046875, 5.97265625, 6.21533203125, 6.4580078125, 6.70068359375, 6.943359375, 7.18603515625, 7.4287109375, 7.67138671875, 7.9140625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 3.0, 5.0, 13.0, 10.0, 13.0, 28.0, 23.0, 23.0, 51.0, 77.0, 145.0, 240.0, 482.0, 848.0, 1856.0, 3996.0, 9628.0, 25801.0, 88221.0, 452672.0, 355952.0, 70929.0, 22159.0, 8465.0, 3536.0, 1558.0, 800.0, 391.0, 201.0, 133.0, 88.0, 55.0, 29.0, 33.0, 23.0, 14.0, 12.0, 8.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.180419921875, -11.75927734375, -11.338134765625, -10.9169921875, -10.495849609375, -10.07470703125, -9.653564453125, -9.232421875, -8.811279296875, -8.39013671875, -7.968994140625, -7.5478515625, -7.126708984375, -6.70556640625, -6.284423828125, -5.86328125, -5.442138671875, -5.02099609375, -4.599853515625, -4.1787109375, -3.757568359375, -3.33642578125, -2.915283203125, -2.494140625, -2.072998046875, -1.65185546875, -1.230712890625, -0.8095703125, -0.388427734375, 0.03271484375, 0.453857421875, 0.875, 1.296142578125, 1.71728515625, 2.138427734375, 2.5595703125, 2.980712890625, 3.40185546875, 3.822998046875, 4.244140625, 4.665283203125, 5.08642578125, 5.507568359375, 5.9287109375, 6.349853515625, 6.77099609375, 7.192138671875, 7.61328125, 8.034423828125, 8.45556640625, 8.876708984375, 9.2978515625, 9.718994140625, 10.14013671875, 10.561279296875, 10.982421875, 11.403564453125, 11.82470703125, 12.245849609375, 12.6669921875, 13.088134765625, 13.50927734375, 13.930419921875, 14.3515625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 5.0, 6.0, 12.0, 12.0, 15.0, 24.0, 19.0, 21.0, 10.0, 24.0, 25.0, 36.0, 40.0, 43.0, 38.0, 68.0, 114.0, 163.0, 1394.0, 305.0, 131.0, 92.0, 72.0, 42.0, 43.0, 40.0, 30.0, 28.0, 24.0, 23.0, 25.0, 16.0, 15.0, 21.0, 15.0, 10.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.15380859375, -15.5732421875, -14.99267578125, -14.412109375, -13.83154296875, -13.2509765625, -12.67041015625, -12.08984375, -11.50927734375, -10.9287109375, -10.34814453125, -9.767578125, -9.18701171875, -8.6064453125, -8.02587890625, -7.4453125, -6.86474609375, -6.2841796875, -5.70361328125, -5.123046875, -4.54248046875, -3.9619140625, -3.38134765625, -2.80078125, -2.22021484375, -1.6396484375, -1.05908203125, -0.478515625, 0.10205078125, 0.6826171875, 1.26318359375, 1.84375, 2.42431640625, 3.0048828125, 3.58544921875, 4.166015625, 4.74658203125, 5.3271484375, 5.90771484375, 6.48828125, 7.06884765625, 7.6494140625, 8.22998046875, 8.810546875, 9.39111328125, 9.9716796875, 10.55224609375, 11.1328125, 11.71337890625, 12.2939453125, 12.87451171875, 13.455078125, 14.03564453125, 14.6162109375, 15.19677734375, 15.77734375, 16.35791015625, 16.9384765625, 17.51904296875, 18.099609375, 18.68017578125, 19.2607421875, 19.84130859375, 20.421875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 9.0, 17.0, 22.0, 23.0, 33.0, 44.0, 56.0, 65.0, 71.0, 95.0, 106.0, 194.0, 289.0, 526.0, 1305.0, 3984.0, 19167.0, 318015.0, 2712328.0, 75462.0, 9286.0, 2436.0, 854.0, 417.0, 203.0, 143.0, 100.0, 87.0, 61.0, 51.0, 48.0, 35.0, 33.0, 17.0, 16.0, 17.0, 14.0, 13.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-34.21875, -33.19091796875, -32.1630859375, -31.13525390625, -30.107421875, -29.07958984375, -28.0517578125, -27.02392578125, -25.99609375, -24.96826171875, -23.9404296875, -22.91259765625, -21.884765625, -20.85693359375, -19.8291015625, -18.80126953125, -17.7734375, -16.74560546875, -15.7177734375, -14.68994140625, -13.662109375, -12.63427734375, -11.6064453125, -10.57861328125, -9.55078125, -8.52294921875, -7.4951171875, -6.46728515625, -5.439453125, -4.41162109375, -3.3837890625, -2.35595703125, -1.328125, -0.30029296875, 0.7275390625, 1.75537109375, 2.783203125, 3.81103515625, 4.8388671875, 5.86669921875, 6.89453125, 7.92236328125, 8.9501953125, 9.97802734375, 11.005859375, 12.03369140625, 13.0615234375, 14.08935546875, 15.1171875, 16.14501953125, 17.1728515625, 18.20068359375, 19.228515625, 20.25634765625, 21.2841796875, 22.31201171875, 23.33984375, 24.36767578125, 25.3955078125, 26.42333984375, 27.451171875, 28.47900390625, 29.5068359375, 30.53466796875, 31.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [74.0, 907.0, 36.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8857479095459, -7.051213264465332, 7.783321380615234, 22.617856979370117, 37.452392578125, 52.28692626953125, 67.1214599609375, 81.95599365234375, 96.79052734375, 111.62506103515625, 126.4595947265625, 141.29412841796875, 156.128662109375, 170.96319580078125, 185.7977294921875, 200.63226318359375, 215.46681213378906, 230.3013458251953, 245.13587951660156, 259.9704284667969, 274.8049621582031, 289.6394958496094, 304.4740295410156, 319.3085632324219, 334.1430969238281, 348.9776306152344, 363.8121643066406, 378.6466979980469, 393.4812316894531, 408.3157653808594, 423.1502990722656, 437.9848327636719, 452.8193664550781, 467.6539001464844, 482.4884338378906, 497.3229675292969, 512.1575317382812, 526.9920654296875, 541.8265991210938, 556.6611328125, 571.4956665039062, 586.3302001953125, 601.1647338867188, 615.999267578125, 630.8338012695312, 645.6683349609375, 660.5028686523438, 675.33740234375, 690.1719360351562, 705.0064697265625, 719.8410034179688, 734.675537109375, 749.5100708007812, 764.3446044921875, 779.1791381835938, 794.013671875, 808.8482055664062, 823.6827392578125, 838.5172729492188, 853.351806640625, 868.1863403320312, 883.0208740234375, 897.8554077148438, 912.68994140625, 927.5244750976562]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 11.0, 9.0, 16.0, 11.0, 15.0, 15.0, 21.0, 29.0, 19.0, 28.0, 36.0, 26.0, 41.0, 52.0, 35.0, 29.0, 48.0, 31.0, 47.0, 37.0, 46.0, 30.0, 33.0, 27.0, 33.0, 24.0, 27.0, 28.0, 28.0, 22.0, 28.0, 14.0, 15.0, 8.0, 16.0, 7.0, 14.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-58.382991790771484, -56.82843780517578, -55.27388381958008, -53.719329833984375, -52.16477584838867, -50.61022186279297, -49.0556640625, -47.50111389160156, -45.946556091308594, -44.39200210571289, -42.83744812011719, -41.282894134521484, -39.72834014892578, -38.17378616333008, -36.619232177734375, -35.064674377441406, -33.51012420654297, -31.955570220947266, -30.401016235351562, -28.84646224975586, -27.291908264160156, -25.737354278564453, -24.182798385620117, -22.628244400024414, -21.07369041442871, -19.519136428833008, -17.964582443237305, -16.41002655029297, -14.855473518371582, -13.300919532775879, -11.74636459350586, -10.191810607910156, -8.637260437011719, -7.082706451416016, -5.528151988983154, -3.973597526550293, -2.41904354095459, -0.8644895553588867, 0.6900653839111328, 2.244619369506836, 3.799173355102539, 5.353727340698242, 6.9082818031311035, 8.462836265563965, 10.017390251159668, 11.571944236755371, 13.12649917602539, 14.681053161621094, 16.235607147216797, 17.7901611328125, 19.344715118408203, 20.899269104003906, 22.45382308959961, 24.008377075195312, 25.56293296813965, 27.11748695373535, 28.672040939331055, 30.226594924926758, 31.78114891052246, 33.3357048034668, 34.8902587890625, 36.4448127746582, 37.999366760253906, 39.55392074584961, 41.10847473144531]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 11.0, 7.0, 12.0, 18.0, 31.0, 22.0, 32.0, 35.0, 36.0, 39.0, 43.0, 53.0, 46.0, 55.0, 47.0, 49.0, 63.0, 43.0, 31.0, 32.0, 29.0, 26.0, 36.0, 28.0, 22.0, 23.0, 17.0, 14.0, 13.0, 17.0, 12.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8560791015625, -7.602783203125, -7.3494873046875, -7.09619140625, -6.8428955078125, -6.589599609375, -6.3363037109375, -6.0830078125, -5.8297119140625, -5.576416015625, -5.3231201171875, -5.06982421875, -4.8165283203125, -4.563232421875, -4.3099365234375, -4.056640625, -3.8033447265625, -3.550048828125, -3.2967529296875, -3.04345703125, -2.7901611328125, -2.536865234375, -2.2835693359375, -2.0302734375, -1.7769775390625, -1.523681640625, -1.2703857421875, -1.01708984375, -0.7637939453125, -0.510498046875, -0.2572021484375, -0.00390625, 0.2493896484375, 0.502685546875, 0.7559814453125, 1.00927734375, 1.2625732421875, 1.515869140625, 1.7691650390625, 2.0224609375, 2.2757568359375, 2.529052734375, 2.7823486328125, 3.03564453125, 3.2889404296875, 3.542236328125, 3.7955322265625, 4.048828125, 4.3021240234375, 4.555419921875, 4.8087158203125, 5.06201171875, 5.3153076171875, 5.568603515625, 5.8218994140625, 6.0751953125, 6.3284912109375, 6.581787109375, 6.8350830078125, 7.08837890625, 7.3416748046875, 7.594970703125, 7.8482666015625, 8.1015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 10.0, 17.0, 21.0, 38.0, 56.0, 74.0, 123.0, 180.0, 251.0, 568.0, 1009.0, 2038.0, 4599.0, 11153.0, 32858.0, 135852.0, 768481.0, 2271454.0, 776271.0, 136846.0, 32820.0, 10750.0, 4425.0, 2074.0, 1003.0, 511.0, 313.0, 150.0, 98.0, 65.0, 45.0, 35.0, 14.0, 25.0, 10.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.634033203125, -9.28369140625, -8.933349609375, -8.5830078125, -8.232666015625, -7.88232421875, -7.531982421875, -7.181640625, -6.831298828125, -6.48095703125, -6.130615234375, -5.7802734375, -5.429931640625, -5.07958984375, -4.729248046875, -4.37890625, -4.028564453125, -3.67822265625, -3.327880859375, -2.9775390625, -2.627197265625, -2.27685546875, -1.926513671875, -1.576171875, -1.225830078125, -0.87548828125, -0.525146484375, -0.1748046875, 0.175537109375, 0.52587890625, 0.876220703125, 1.2265625, 1.576904296875, 1.92724609375, 2.277587890625, 2.6279296875, 2.978271484375, 3.32861328125, 3.678955078125, 4.029296875, 4.379638671875, 4.72998046875, 5.080322265625, 5.4306640625, 5.781005859375, 6.13134765625, 6.481689453125, 6.83203125, 7.182373046875, 7.53271484375, 7.883056640625, 8.2333984375, 8.583740234375, 8.93408203125, 9.284423828125, 9.634765625, 9.985107421875, 10.33544921875, 10.685791015625, 11.0361328125, 11.386474609375, 11.73681640625, 12.087158203125, 12.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 11.0, 10.0, 19.0, 25.0, 39.0, 56.0, 69.0, 119.0, 190.0, 246.0, 436.0, 598.0, 665.0, 500.0, 342.0, 215.0, 126.0, 102.0, 66.0, 48.0, 44.0, 35.0, 18.0, 14.0, 10.0, 14.0, 11.0, 12.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -10.9783935546875, -10.589599609375, -10.2008056640625, -9.81201171875, -9.4232177734375, -9.034423828125, -8.6456298828125, -8.2568359375, -7.8680419921875, -7.479248046875, -7.0904541015625, -6.70166015625, -6.3128662109375, -5.924072265625, -5.5352783203125, -5.146484375, -4.7576904296875, -4.368896484375, -3.9801025390625, -3.59130859375, -3.2025146484375, -2.813720703125, -2.4249267578125, -2.0361328125, -1.6473388671875, -1.258544921875, -0.8697509765625, -0.48095703125, -0.0921630859375, 0.296630859375, 0.6854248046875, 1.07421875, 1.4630126953125, 1.851806640625, 2.2406005859375, 2.62939453125, 3.0181884765625, 3.406982421875, 3.7957763671875, 4.1845703125, 4.5733642578125, 4.962158203125, 5.3509521484375, 5.73974609375, 6.1285400390625, 6.517333984375, 6.9061279296875, 7.294921875, 7.6837158203125, 8.072509765625, 8.4613037109375, 8.85009765625, 9.2388916015625, 9.627685546875, 10.0164794921875, 10.4052734375, 10.7940673828125, 11.182861328125, 11.5716552734375, 11.96044921875, 12.3492431640625, 12.738037109375, 13.1268310546875, 13.515625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 2.0, 5.0, 6.0, 13.0, 12.0, 21.0, 21.0, 27.0, 52.0, 52.0, 96.0, 138.0, 217.0, 414.0, 1109.0, 4489.0, 35004.0, 777087.0, 3255101.0, 107310.0, 9902.0, 1826.0, 596.0, 280.0, 174.0, 97.0, 60.0, 41.0, 29.0, 22.0, 19.0, 13.0, 10.0, 11.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.90625, -30.915771484375, -29.92529296875, -28.934814453125, -27.9443359375, -26.953857421875, -25.96337890625, -24.972900390625, -23.982421875, -22.991943359375, -22.00146484375, -21.010986328125, -20.0205078125, -19.030029296875, -18.03955078125, -17.049072265625, -16.05859375, -15.068115234375, -14.07763671875, -13.087158203125, -12.0966796875, -11.106201171875, -10.11572265625, -9.125244140625, -8.134765625, -7.144287109375, -6.15380859375, -5.163330078125, -4.1728515625, -3.182373046875, -2.19189453125, -1.201416015625, -0.2109375, 0.779541015625, 1.77001953125, 2.760498046875, 3.7509765625, 4.741455078125, 5.73193359375, 6.722412109375, 7.712890625, 8.703369140625, 9.69384765625, 10.684326171875, 11.6748046875, 12.665283203125, 13.65576171875, 14.646240234375, 15.63671875, 16.627197265625, 17.61767578125, 18.608154296875, 19.5986328125, 20.589111328125, 21.57958984375, 22.570068359375, 23.560546875, 24.551025390625, 25.54150390625, 26.531982421875, 27.5224609375, 28.512939453125, 29.50341796875, 30.493896484375, 31.484375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 6.0, 17.0, 93.0, 296.0, 340.0, 206.0, 41.0, 10.0, 3.0, 2.0, 0.0, 1.0], "bins": [-263.8110046386719, -259.10791015625, -254.40481567382812, -249.70172119140625, -244.99862670898438, -240.2955322265625, -235.59243774414062, -230.8893585205078, -226.18626403808594, -221.48316955566406, -216.7800750732422, -212.0769805908203, -207.37388610839844, -202.67080688476562, -197.96771240234375, -193.26461791992188, -188.5615234375, -183.85842895507812, -179.15533447265625, -174.45223999023438, -169.7491455078125, -165.04605102539062, -160.34295654296875, -155.63987731933594, -150.936767578125, -146.23367309570312, -141.53057861328125, -136.82748413085938, -132.1243896484375, -127.42130279541016, -122.71820831298828, -118.01512145996094, -113.31201934814453, -108.60892486572266, -103.90583038330078, -99.20274353027344, -94.49964904785156, -89.79655456542969, -85.09346008300781, -80.39036560058594, -75.68727111816406, -70.98417663574219, -66.28108215332031, -61.5779914855957, -56.874900817871094, -52.17180633544922, -47.468711853027344, -42.765621185302734, -38.062530517578125, -33.35943603515625, -28.65634536743164, -23.953250885009766, -19.250158309936523, -14.547065734863281, -9.843971252441406, -5.140880584716797, -0.4377861022949219, 4.2653069496154785, 8.968400001525879, 13.671493530273438, 18.37458610534668, 23.077678680419922, 27.780773162841797, 32.483863830566406, 37.18695831298828]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 0.0, 8.0, 10.0, 4.0, 7.0, 16.0, 13.0, 14.0, 22.0, 19.0, 24.0, 22.0, 27.0, 50.0, 35.0, 54.0, 32.0, 45.0, 39.0, 39.0, 44.0, 45.0, 42.0, 44.0, 41.0, 32.0, 43.0, 24.0, 26.0, 48.0, 20.0, 11.0, 19.0, 15.0, 8.0, 12.0, 11.0, 10.0, 5.0, 3.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.63576889038086, -37.37422180175781, -36.1126708984375, -34.85112380981445, -33.58957290649414, -32.328025817871094, -31.066476821899414, -29.804927825927734, -28.543378829956055, -27.281829833984375, -26.020280838012695, -24.758731842041016, -23.49718475341797, -22.235633850097656, -20.97408676147461, -19.71253776550293, -18.45098876953125, -17.18943977355957, -15.92789077758789, -14.666342735290527, -13.404793739318848, -12.143244743347168, -10.881696701049805, -9.620147705078125, -8.358598709106445, -7.097049713134766, -5.835501194000244, -4.573952674865723, -3.312403678894043, -2.0508546829223633, -0.7893061637878418, 0.4722423553466797, 1.733795166015625, 2.9953439235687256, 4.256892681121826, 5.518441200256348, 6.779990196228027, 8.041539192199707, 9.30308723449707, 10.56463623046875, 11.82618522644043, 13.08773422241211, 14.349283218383789, 15.610831260681152, 16.872379302978516, 18.133930206298828, 19.395477294921875, 20.657026290893555, 21.918575286865234, 23.180124282836914, 24.441673278808594, 25.703222274780273, 26.964771270751953, 28.226318359375, 29.48786735534668, 30.74941635131836, 32.010963439941406, 33.27251052856445, 34.534061431884766, 35.79560852050781, 37.057159423828125, 38.31870651245117, 39.580257415771484, 40.84180450439453, 42.103355407714844]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 7.0, 7.0, 13.0, 16.0, 36.0, 19.0, 31.0, 32.0, 30.0, 38.0, 38.0, 43.0, 41.0, 59.0, 40.0, 54.0, 51.0, 47.0, 38.0, 45.0, 39.0, 23.0, 32.0, 36.0, 23.0, 21.0, 24.0, 16.0, 10.0, 23.0, 10.0, 6.0, 11.0, 8.0, 7.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.3515625, -7.11932373046875, -6.8870849609375, -6.65484619140625, -6.422607421875, -6.19036865234375, -5.9581298828125, -5.72589111328125, -5.49365234375, -5.26141357421875, -5.0291748046875, -4.79693603515625, -4.564697265625, -4.33245849609375, -4.1002197265625, -3.86798095703125, -3.6357421875, -3.40350341796875, -3.1712646484375, -2.93902587890625, -2.706787109375, -2.47454833984375, -2.2423095703125, -2.01007080078125, -1.77783203125, -1.54559326171875, -1.3133544921875, -1.08111572265625, -0.848876953125, -0.61663818359375, -0.3843994140625, -0.15216064453125, 0.080078125, 0.31231689453125, 0.5445556640625, 0.77679443359375, 1.009033203125, 1.24127197265625, 1.4735107421875, 1.70574951171875, 1.93798828125, 2.17022705078125, 2.4024658203125, 2.63470458984375, 2.866943359375, 3.09918212890625, 3.3314208984375, 3.56365966796875, 3.7958984375, 4.02813720703125, 4.2603759765625, 4.49261474609375, 4.724853515625, 4.95709228515625, 5.1893310546875, 5.42156982421875, 5.65380859375, 5.88604736328125, 6.1182861328125, 6.35052490234375, 6.582763671875, 6.81500244140625, 7.0472412109375, 7.27947998046875, 7.51171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 4.0, 18.0, 13.0, 22.0, 25.0, 42.0, 57.0, 76.0, 116.0, 159.0, 249.0, 364.0, 518.0, 829.0, 1247.0, 1915.0, 3117.0, 5001.0, 8380.0, 14643.0, 25976.0, 46594.0, 88028.0, 166750.0, 247800.0, 197498.0, 108161.0, 56694.0, 30936.0, 17233.0, 9994.0, 6043.0, 3642.0, 2290.0, 1372.0, 886.0, 544.0, 402.0, 291.0, 174.0, 136.0, 88.0, 63.0, 47.0, 34.0, 25.0, 14.0, 7.0, 16.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.8759765625, -0.8483047485351562, -0.8206329345703125, -0.7929611206054688, -0.765289306640625, -0.7376174926757812, -0.7099456787109375, -0.6822738647460938, -0.65460205078125, -0.6269302368164062, -0.5992584228515625, -0.5715866088867188, -0.543914794921875, -0.5162429809570312, -0.4885711669921875, -0.46089935302734375, -0.4332275390625, -0.40555572509765625, -0.3778839111328125, -0.35021209716796875, -0.322540283203125, -0.29486846923828125, -0.2671966552734375, -0.23952484130859375, -0.21185302734375, -0.18418121337890625, -0.1565093994140625, -0.12883758544921875, -0.101165771484375, -0.07349395751953125, -0.0458221435546875, -0.01815032958984375, 0.009521484375, 0.03719329833984375, 0.0648651123046875, 0.09253692626953125, 0.120208740234375, 0.14788055419921875, 0.1755523681640625, 0.20322418212890625, 0.23089599609375, 0.25856781005859375, 0.2862396240234375, 0.31391143798828125, 0.341583251953125, 0.36925506591796875, 0.3969268798828125, 0.42459869384765625, 0.4522705078125, 0.47994232177734375, 0.5076141357421875, 0.5352859497070312, 0.562957763671875, 0.5906295776367188, 0.6183013916015625, 0.6459732055664062, 0.67364501953125, 0.7013168334960938, 0.7289886474609375, 0.7566604614257812, 0.784332275390625, 0.8120040893554688, 0.8396759033203125, 0.8673477172851562, 0.89501953125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 9.0, 10.0, 10.0, 15.0, 16.0, 15.0, 19.0, 21.0, 28.0, 19.0, 31.0, 33.0, 31.0, 33.0, 27.0, 36.0, 27.0, 34.0, 29.0, 1052.0, 32.0, 29.0, 33.0, 33.0, 40.0, 41.0, 36.0, 27.0, 30.0, 29.0, 21.0, 15.0, 21.0, 23.0, 12.0, 16.0, 11.0, 10.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.90625, -3.77978515625, -3.6533203125, -3.52685546875, -3.400390625, -3.27392578125, -3.1474609375, -3.02099609375, -2.89453125, -2.76806640625, -2.6416015625, -2.51513671875, -2.388671875, -2.26220703125, -2.1357421875, -2.00927734375, -1.8828125, -1.75634765625, -1.6298828125, -1.50341796875, -1.376953125, -1.25048828125, -1.1240234375, -0.99755859375, -0.87109375, -0.74462890625, -0.6181640625, -0.49169921875, -0.365234375, -0.23876953125, -0.1123046875, 0.01416015625, 0.140625, 0.26708984375, 0.3935546875, 0.52001953125, 0.646484375, 0.77294921875, 0.8994140625, 1.02587890625, 1.15234375, 1.27880859375, 1.4052734375, 1.53173828125, 1.658203125, 1.78466796875, 1.9111328125, 2.03759765625, 2.1640625, 2.29052734375, 2.4169921875, 2.54345703125, 2.669921875, 2.79638671875, 2.9228515625, 3.04931640625, 3.17578125, 3.30224609375, 3.4287109375, 3.55517578125, 3.681640625, 3.80810546875, 3.9345703125, 4.06103515625, 4.1875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 5.0, 6.0, 17.0, 13.0, 25.0, 42.0, 34.0, 68.0, 96.0, 152.0, 225.0, 422.0, 636.0, 1170.0, 2021.0, 3815.0, 7306.0, 14319.0, 29417.0, 63342.0, 146600.0, 812361.0, 751136.0, 142652.0, 62331.0, 28909.0, 14201.0, 7159.0, 3741.0, 2067.0, 1099.0, 669.0, 368.0, 248.0, 148.0, 104.0, 59.0, 30.0, 36.0, 25.0, 14.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80517578125, -0.7783279418945312, -0.7514801025390625, -0.7246322631835938, -0.697784423828125, -0.6709365844726562, -0.6440887451171875, -0.6172409057617188, -0.59039306640625, -0.5635452270507812, -0.5366973876953125, -0.5098495483398438, -0.483001708984375, -0.45615386962890625, -0.4293060302734375, -0.40245819091796875, -0.3756103515625, -0.34876251220703125, -0.3219146728515625, -0.29506683349609375, -0.268218994140625, -0.24137115478515625, -0.2145233154296875, -0.18767547607421875, -0.16082763671875, -0.13397979736328125, -0.1071319580078125, -0.08028411865234375, -0.053436279296875, -0.02658843994140625, 0.0002593994140625, 0.02710723876953125, 0.053955078125, 0.08080291748046875, 0.1076507568359375, 0.13449859619140625, 0.161346435546875, 0.18819427490234375, 0.2150421142578125, 0.24188995361328125, 0.26873779296875, 0.29558563232421875, 0.3224334716796875, 0.34928131103515625, 0.376129150390625, 0.40297698974609375, 0.4298248291015625, 0.45667266845703125, 0.4835205078125, 0.5103683471679688, 0.5372161865234375, 0.5640640258789062, 0.590911865234375, 0.6177597045898438, 0.6446075439453125, 0.6714553833007812, 0.69830322265625, 0.7251510620117188, 0.7519989013671875, 0.7788467407226562, 0.805694580078125, 0.8325424194335938, 0.8593902587890625, 0.8862380981445312, 0.9130859375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 11.0, 16.0, 22.0, 33.0, 52.0, 71.0, 86.0, 113.0, 111.0, 107.0, 102.0, 86.0, 58.0, 32.0, 22.0, 17.0, 15.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08898067474365234, -0.08524894714355469, -0.08151721954345703, -0.07778549194335938, -0.07405376434326172, -0.07032203674316406, -0.0665903091430664, -0.06285858154296875, -0.059126853942871094, -0.05539512634277344, -0.05166339874267578, -0.047931671142578125, -0.04419994354248047, -0.04046821594238281, -0.036736488342285156, -0.0330047607421875, -0.029273033142089844, -0.025541305541992188, -0.02180957794189453, -0.018077850341796875, -0.014346122741699219, -0.010614395141601562, -0.006882667541503906, -0.00315093994140625, 0.0005807876586914062, 0.0043125152587890625, 0.008044242858886719, 0.011775970458984375, 0.015507698059082031, 0.019239425659179688, 0.022971153259277344, 0.026702880859375, 0.030434608459472656, 0.03416633605957031, 0.03789806365966797, 0.041629791259765625, 0.04536151885986328, 0.04909324645996094, 0.052824974060058594, 0.05655670166015625, 0.060288429260253906, 0.06402015686035156, 0.06775188446044922, 0.07148361206054688, 0.07521533966064453, 0.07894706726074219, 0.08267879486083984, 0.0864105224609375, 0.09014225006103516, 0.09387397766113281, 0.09760570526123047, 0.10133743286132812, 0.10506916046142578, 0.10880088806152344, 0.1125326156616211, 0.11626434326171875, 0.1199960708618164, 0.12372779846191406, 0.12745952606201172, 0.13119125366210938, 0.13492298126220703, 0.1386547088623047, 0.14238643646240234, 0.1461181640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 11.0, 21.0, 17.0, 35.0, 59.0, 112.0, 213.0, 567.0, 27262.0, 1018423.0, 1150.0, 301.0, 139.0, 73.0, 43.0, 39.0, 24.0, 11.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.361328125, -3.275543212890625, -3.18975830078125, -3.103973388671875, -3.0181884765625, -2.932403564453125, -2.84661865234375, -2.760833740234375, -2.675048828125, -2.589263916015625, -2.50347900390625, -2.417694091796875, -2.3319091796875, -2.246124267578125, -2.16033935546875, -2.074554443359375, -1.98876953125, -1.902984619140625, -1.81719970703125, -1.731414794921875, -1.6456298828125, -1.559844970703125, -1.47406005859375, -1.388275146484375, -1.302490234375, -1.216705322265625, -1.13092041015625, -1.045135498046875, -0.9593505859375, -0.873565673828125, -0.78778076171875, -0.701995849609375, -0.6162109375, -0.530426025390625, -0.44464111328125, -0.358856201171875, -0.2730712890625, -0.187286376953125, -0.10150146484375, -0.015716552734375, 0.070068359375, 0.155853271484375, 0.24163818359375, 0.327423095703125, 0.4132080078125, 0.498992919921875, 0.58477783203125, 0.670562744140625, 0.75634765625, 0.842132568359375, 0.92791748046875, 1.013702392578125, 1.0994873046875, 1.185272216796875, 1.27105712890625, 1.356842041015625, 1.442626953125, 1.528411865234375, 1.61419677734375, 1.699981689453125, 1.7857666015625, 1.871551513671875, 1.95733642578125, 2.043121337890625, 2.12890625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 356.0, 650.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33576706051826477, -0.30245694518089294, -0.2691468298435211, -0.2358366996049881, -0.20252658426761627, -0.16921646893024445, -0.13590633869171143, -0.1025962233543396, -0.06928610801696777, -0.03597598895430565, -0.002665869891643524, 0.0306442528963089, 0.06395436823368073, 0.09726448357105255, 0.13057461380958557, 0.1638847291469574, 0.19719484448432922, 0.23050495982170105, 0.2638150751590729, 0.2971252202987671, 0.3304353356361389, 0.36374545097351074, 0.39705556631088257, 0.4303656816482544, 0.4636757969856262, 0.49698591232299805, 0.5302960276603699, 0.5636061429977417, 0.5969162583351135, 0.6302263736724854, 0.663536548614502, 0.696846604347229, 0.730156660079956, 0.7634667754173279, 0.7967768907546997, 0.8300870060920715, 0.8633971214294434, 0.8967072367668152, 0.930017352104187, 0.9633275270462036, 0.9966375827789307, 1.0299477577209473, 1.0632578134536743, 1.096567988395691, 1.129878044128418, 1.1631882190704346, 1.1964982748031616, 1.2298084497451782, 1.2631185054779053, 1.2964286804199219, 1.329738736152649, 1.3630489110946655, 1.3963589668273926, 1.4296691417694092, 1.4629791975021362, 1.4962893724441528, 1.5295995473861694, 1.562909722328186, 1.596219778060913, 1.6295299530029297, 1.6628400087356567, 1.6961501836776733, 1.7294602394104004, 1.762770414352417, 1.796080470085144]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 4.0, 5.0, 5.0, 10.0, 10.0, 9.0, 11.0, 12.0, 7.0, 18.0, 12.0, 23.0, 22.0, 30.0, 24.0, 33.0, 26.0, 29.0, 44.0, 45.0, 47.0, 40.0, 31.0, 47.0, 37.0, 36.0, 35.0, 33.0, 38.0, 27.0, 30.0, 33.0, 34.0, 16.0, 14.0, 14.0, 19.0, 18.0, 14.0, 9.0, 9.0, 8.0, 3.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.1301332712173462, -0.1260582059621811, -0.12198314070701599, -0.11790807545185089, -0.11383301019668579, -0.10975794494152069, -0.105682872235775, -0.1016078069806099, -0.0975327417254448, -0.0934576764702797, -0.0893826112151146, -0.0853075459599495, -0.0812324732542038, -0.0771574079990387, -0.0730823427438736, -0.0690072774887085, -0.0649322122335434, -0.060857146978378296, -0.056782081723213196, -0.0527070127427578, -0.0486319474875927, -0.0445568822324276, -0.0404818132519722, -0.0364067479968071, -0.032331682741642, -0.028256617486476898, -0.02418155036866665, -0.0201064832508564, -0.0160314179956913, -0.0119563527405262, -0.00788128562271595, -0.0038062185049057007, 0.0002688467502593994, 0.004343912936747074, 0.008418979123234749, 0.012494045309722424, 0.0165691114962101, 0.0206441767513752, 0.024719243869185448, 0.028794310986995697, 0.0328693762421608, 0.0369444414973259, 0.041019506752491, 0.045094575732946396, 0.049169640988111496, 0.053244706243276596, 0.057319775223731995, 0.061394840478897095, 0.0654699057340622, 0.0695449709892273, 0.0736200362443924, 0.0776951014995575, 0.0817701667547226, 0.0858452320098877, 0.08992030471563339, 0.09399536997079849, 0.09807043522596359, 0.10214550048112869, 0.10622056573629379, 0.11029563099145889, 0.11437070369720459, 0.11844576895236969, 0.12252083420753479, 0.1265958994626999, 0.130670964717865]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 2.0, 8.0, 14.0, 11.0, 18.0, 18.0, 24.0, 28.0, 18.0, 39.0, 32.0, 31.0, 35.0, 47.0, 34.0, 47.0, 49.0, 48.0, 52.0, 50.0, 41.0, 39.0, 39.0, 31.0, 27.0, 28.0, 30.0, 22.0, 21.0, 19.0, 23.0, 15.0, 13.0, 8.0, 7.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.59375, -7.36346435546875, -7.1331787109375, -6.90289306640625, -6.672607421875, -6.44232177734375, -6.2120361328125, -5.98175048828125, -5.75146484375, -5.52117919921875, -5.2908935546875, -5.06060791015625, -4.830322265625, -4.60003662109375, -4.3697509765625, -4.13946533203125, -3.9091796875, -3.67889404296875, -3.4486083984375, -3.21832275390625, -2.988037109375, -2.75775146484375, -2.5274658203125, -2.29718017578125, -2.06689453125, -1.83660888671875, -1.6063232421875, -1.37603759765625, -1.145751953125, -0.91546630859375, -0.6851806640625, -0.45489501953125, -0.224609375, 0.00567626953125, 0.2359619140625, 0.46624755859375, 0.696533203125, 0.92681884765625, 1.1571044921875, 1.38739013671875, 1.61767578125, 1.84796142578125, 2.0782470703125, 2.30853271484375, 2.538818359375, 2.76910400390625, 2.9993896484375, 3.22967529296875, 3.4599609375, 3.69024658203125, 3.9205322265625, 4.15081787109375, 4.381103515625, 4.61138916015625, 4.8416748046875, 5.07196044921875, 5.30224609375, 5.53253173828125, 5.7628173828125, 5.99310302734375, 6.223388671875, 6.45367431640625, 6.6839599609375, 6.91424560546875, 7.14453125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 11.0, 20.0, 17.0, 21.0, 28.0, 24.0, 45.0, 59.0, 81.0, 144.0, 224.0, 417.0, 1076.0, 2563.0, 7050.0, 21908.0, 91044.0, 599106.0, 259048.0, 45224.0, 12830.0, 4434.0, 1649.0, 676.0, 288.0, 182.0, 97.0, 78.0, 40.0, 45.0, 28.0, 25.0, 14.0, 12.0, 13.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.39013671875, -16.8427734375, -16.29541015625, -15.748046875, -15.20068359375, -14.6533203125, -14.10595703125, -13.55859375, -13.01123046875, -12.4638671875, -11.91650390625, -11.369140625, -10.82177734375, -10.2744140625, -9.72705078125, -9.1796875, -8.63232421875, -8.0849609375, -7.53759765625, -6.990234375, -6.44287109375, -5.8955078125, -5.34814453125, -4.80078125, -4.25341796875, -3.7060546875, -3.15869140625, -2.611328125, -2.06396484375, -1.5166015625, -0.96923828125, -0.421875, 0.12548828125, 0.6728515625, 1.22021484375, 1.767578125, 2.31494140625, 2.8623046875, 3.40966796875, 3.95703125, 4.50439453125, 5.0517578125, 5.59912109375, 6.146484375, 6.69384765625, 7.2412109375, 7.78857421875, 8.3359375, 8.88330078125, 9.4306640625, 9.97802734375, 10.525390625, 11.07275390625, 11.6201171875, 12.16748046875, 12.71484375, 13.26220703125, 13.8095703125, 14.35693359375, 14.904296875, 15.45166015625, 15.9990234375, 16.54638671875, 17.09375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 4.0, 1.0, 6.0, 14.0, 9.0, 7.0, 15.0, 17.0, 19.0, 21.0, 22.0, 29.0, 35.0, 46.0, 47.0, 67.0, 74.0, 161.0, 375.0, 1397.0, 176.0, 90.0, 65.0, 51.0, 48.0, 35.0, 40.0, 35.0, 26.0, 15.0, 17.0, 13.0, 12.0, 18.0, 7.0, 9.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -16.99658203125, -16.3681640625, -15.73974609375, -15.111328125, -14.48291015625, -13.8544921875, -13.22607421875, -12.59765625, -11.96923828125, -11.3408203125, -10.71240234375, -10.083984375, -9.45556640625, -8.8271484375, -8.19873046875, -7.5703125, -6.94189453125, -6.3134765625, -5.68505859375, -5.056640625, -4.42822265625, -3.7998046875, -3.17138671875, -2.54296875, -1.91455078125, -1.2861328125, -0.65771484375, -0.029296875, 0.59912109375, 1.2275390625, 1.85595703125, 2.484375, 3.11279296875, 3.7412109375, 4.36962890625, 4.998046875, 5.62646484375, 6.2548828125, 6.88330078125, 7.51171875, 8.14013671875, 8.7685546875, 9.39697265625, 10.025390625, 10.65380859375, 11.2822265625, 11.91064453125, 12.5390625, 13.16748046875, 13.7958984375, 14.42431640625, 15.052734375, 15.68115234375, 16.3095703125, 16.93798828125, 17.56640625, 18.19482421875, 18.8232421875, 19.45166015625, 20.080078125, 20.70849609375, 21.3369140625, 21.96533203125, 22.59375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 21.0, 18.0, 19.0, 39.0, 44.0, 61.0, 93.0, 143.0, 187.0, 333.0, 696.0, 2631.0, 21324.0, 1657371.0, 1438494.0, 19989.0, 2555.0, 689.0, 308.0, 212.0, 128.0, 70.0, 65.0, 44.0, 36.0, 33.0, 18.0, 20.0, 10.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-42.8125, -41.5888671875, -40.365234375, -39.1416015625, -37.91796875, -36.6943359375, -35.470703125, -34.2470703125, -33.0234375, -31.7998046875, -30.576171875, -29.3525390625, -28.12890625, -26.9052734375, -25.681640625, -24.4580078125, -23.234375, -22.0107421875, -20.787109375, -19.5634765625, -18.33984375, -17.1162109375, -15.892578125, -14.6689453125, -13.4453125, -12.2216796875, -10.998046875, -9.7744140625, -8.55078125, -7.3271484375, -6.103515625, -4.8798828125, -3.65625, -2.4326171875, -1.208984375, 0.0146484375, 1.23828125, 2.4619140625, 3.685546875, 4.9091796875, 6.1328125, 7.3564453125, 8.580078125, 9.8037109375, 11.02734375, 12.2509765625, 13.474609375, 14.6982421875, 15.921875, 17.1455078125, 18.369140625, 19.5927734375, 20.81640625, 22.0400390625, 23.263671875, 24.4873046875, 25.7109375, 26.9345703125, 28.158203125, 29.3818359375, 30.60546875, 31.8291015625, 33.052734375, 34.2763671875, 35.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 23.0, 83.0, 197.0, 293.0, 253.0, 117.0, 28.0, 10.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.49787139892578, -62.845359802246094, -60.192848205566406, -57.54033660888672, -54.88782501220703, -52.235313415527344, -49.58280563354492, -46.930294036865234, -44.27778244018555, -41.62527084350586, -38.97275924682617, -36.320247650146484, -33.66773986816406, -31.015226364135742, -28.362716674804688, -25.710205078125, -23.057693481445312, -20.405181884765625, -17.752670288085938, -15.100160598754883, -12.447649002075195, -9.795137405395508, -7.142626762390137, -4.490116119384766, -1.8376045227050781, 0.8149065971374512, 3.4674177169799805, 6.11992883682251, 8.772439956665039, 11.424951553344727, 14.077462196350098, 16.72997283935547, 19.382476806640625, 22.034988403320312, 24.6875, 27.340009689331055, 29.992521286010742, 32.64503479003906, 35.297542572021484, 37.95005416870117, 40.60256576538086, 43.25507736206055, 45.907588958740234, 48.56010055541992, 51.212608337402344, 53.86511993408203, 56.51763153076172, 59.170143127441406, 61.822654724121094, 64.47516632080078, 67.12767791748047, 69.78018951416016, 72.43270111083984, 75.08521270751953, 77.73772430419922, 80.39022827148438, 83.04273986816406, 85.69525146484375, 88.34776306152344, 91.00027465820312, 93.65278625488281, 96.3052978515625, 98.95780944824219, 101.61032104492188, 104.26283264160156]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 13.0, 17.0, 5.0, 16.0, 24.0, 15.0, 18.0, 23.0, 16.0, 33.0, 29.0, 32.0, 37.0, 34.0, 38.0, 32.0, 42.0, 50.0, 37.0, 33.0, 33.0, 34.0, 41.0, 35.0, 37.0, 35.0, 31.0, 27.0, 23.0, 17.0, 12.0, 23.0, 19.0, 15.0, 13.0, 8.0, 5.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.97601318359375, -47.54582977294922, -46.11564254760742, -44.685455322265625, -43.255271911621094, -41.82508850097656, -40.394901275634766, -38.96471405029297, -37.53453063964844, -36.104347229003906, -34.67416000366211, -33.24397277832031, -31.81378936767578, -30.383604049682617, -28.953418731689453, -27.52323341369629, -26.093048095703125, -24.66286277770996, -23.232677459716797, -21.802492141723633, -20.37230682373047, -18.942121505737305, -17.51193618774414, -16.081750869750977, -14.651565551757812, -13.221380233764648, -11.791194915771484, -10.36100959777832, -8.930824279785156, -7.500638961791992, -6.070453643798828, -4.640268325805664, -3.2100868225097656, -1.7799015045166016, -0.3497161865234375, 1.0804691314697266, 2.5106544494628906, 3.9408397674560547, 5.371025085449219, 6.801210403442383, 8.231395721435547, 9.661581039428711, 11.091766357421875, 12.521951675415039, 13.952136993408203, 15.382322311401367, 16.81250762939453, 18.242692947387695, 19.67287826538086, 21.103063583374023, 22.533248901367188, 23.96343421936035, 25.393619537353516, 26.82380485534668, 28.253990173339844, 29.684175491333008, 31.114360809326172, 32.54454803466797, 33.9747314453125, 35.40491485595703, 36.83510208129883, 38.265289306640625, 39.695472717285156, 41.12565612792969, 42.555843353271484]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 3.0, 12.0, 22.0, 20.0, 21.0, 18.0, 27.0, 46.0, 40.0, 33.0, 42.0, 44.0, 45.0, 48.0, 53.0, 63.0, 48.0, 41.0, 40.0, 31.0, 40.0, 23.0, 32.0, 19.0, 18.0, 24.0, 20.0, 24.0, 21.0, 10.0, 14.0, 9.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.99609375, -7.757568359375, -7.51904296875, -7.280517578125, -7.0419921875, -6.803466796875, -6.56494140625, -6.326416015625, -6.087890625, -5.849365234375, -5.61083984375, -5.372314453125, -5.1337890625, -4.895263671875, -4.65673828125, -4.418212890625, -4.1796875, -3.941162109375, -3.70263671875, -3.464111328125, -3.2255859375, -2.987060546875, -2.74853515625, -2.510009765625, -2.271484375, -2.032958984375, -1.79443359375, -1.555908203125, -1.3173828125, -1.078857421875, -0.84033203125, -0.601806640625, -0.36328125, -0.124755859375, 0.11376953125, 0.352294921875, 0.5908203125, 0.829345703125, 1.06787109375, 1.306396484375, 1.544921875, 1.783447265625, 2.02197265625, 2.260498046875, 2.4990234375, 2.737548828125, 2.97607421875, 3.214599609375, 3.453125, 3.691650390625, 3.93017578125, 4.168701171875, 4.4072265625, 4.645751953125, 4.88427734375, 5.122802734375, 5.361328125, 5.599853515625, 5.83837890625, 6.076904296875, 6.3154296875, 6.553955078125, 6.79248046875, 7.031005859375, 7.26953125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 7.0, 6.0, 15.0, 11.0, 12.0, 24.0, 35.0, 37.0, 74.0, 98.0, 121.0, 168.0, 256.0, 336.0, 479.0, 646.0, 1098.0, 1810.0, 2930.0, 5379.0, 10305.0, 21151.0, 49381.0, 140924.0, 478548.0, 1436646.0, 1391509.0, 436403.0, 127613.0, 45735.0, 19726.0, 9571.0, 5089.0, 2980.0, 1677.0, 1091.0, 729.0, 462.0, 313.0, 261.0, 172.0, 129.0, 82.0, 74.0, 42.0, 41.0, 30.0, 18.0, 16.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.44921875, -7.20062255859375, -6.9520263671875, -6.70343017578125, -6.454833984375, -6.20623779296875, -5.9576416015625, -5.70904541015625, -5.46044921875, -5.21185302734375, -4.9632568359375, -4.71466064453125, -4.466064453125, -4.21746826171875, -3.9688720703125, -3.72027587890625, -3.4716796875, -3.22308349609375, -2.9744873046875, -2.72589111328125, -2.477294921875, -2.22869873046875, -1.9801025390625, -1.73150634765625, -1.48291015625, -1.23431396484375, -0.9857177734375, -0.73712158203125, -0.488525390625, -0.23992919921875, 0.0086669921875, 0.25726318359375, 0.505859375, 0.75445556640625, 1.0030517578125, 1.25164794921875, 1.500244140625, 1.74884033203125, 1.9974365234375, 2.24603271484375, 2.49462890625, 2.74322509765625, 2.9918212890625, 3.24041748046875, 3.489013671875, 3.73760986328125, 3.9862060546875, 4.23480224609375, 4.4833984375, 4.73199462890625, 4.9805908203125, 5.22918701171875, 5.477783203125, 5.72637939453125, 5.9749755859375, 6.22357177734375, 6.47216796875, 6.72076416015625, 6.9693603515625, 7.21795654296875, 7.466552734375, 7.71514892578125, 7.9637451171875, 8.21234130859375, 8.4609375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 4.0, 7.0, 12.0, 25.0, 36.0, 51.0, 68.0, 104.0, 153.0, 215.0, 403.0, 620.0, 759.0, 575.0, 370.0, 254.0, 108.0, 83.0, 53.0, 50.0, 38.0, 22.0, 18.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.359375, -11.9251708984375, -11.490966796875, -11.0567626953125, -10.62255859375, -10.1883544921875, -9.754150390625, -9.3199462890625, -8.8857421875, -8.4515380859375, -8.017333984375, -7.5831298828125, -7.14892578125, -6.7147216796875, -6.280517578125, -5.8463134765625, -5.412109375, -4.9779052734375, -4.543701171875, -4.1094970703125, -3.67529296875, -3.2410888671875, -2.806884765625, -2.3726806640625, -1.9384765625, -1.5042724609375, -1.070068359375, -0.6358642578125, -0.20166015625, 0.2325439453125, 0.666748046875, 1.1009521484375, 1.53515625, 1.9693603515625, 2.403564453125, 2.8377685546875, 3.27197265625, 3.7061767578125, 4.140380859375, 4.5745849609375, 5.0087890625, 5.4429931640625, 5.877197265625, 6.3114013671875, 6.74560546875, 7.1798095703125, 7.614013671875, 8.0482177734375, 8.482421875, 8.9166259765625, 9.350830078125, 9.7850341796875, 10.21923828125, 10.6534423828125, 11.087646484375, 11.5218505859375, 11.9560546875, 12.3902587890625, 12.824462890625, 13.2586669921875, 13.69287109375, 14.1270751953125, 14.561279296875, 14.9954833984375, 15.4296875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 9.0, 13.0, 22.0, 39.0, 44.0, 78.0, 123.0, 198.0, 327.0, 958.0, 5144.0, 86209.0, 3633018.0, 450272.0, 14832.0, 1754.0, 545.0, 253.0, 151.0, 89.0, 66.0, 42.0, 19.0, 16.0, 16.0, 12.0, 5.0, 9.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.66259765625, -38.4501953125, -37.23779296875, -36.025390625, -34.81298828125, -33.6005859375, -32.38818359375, -31.17578125, -29.96337890625, -28.7509765625, -27.53857421875, -26.326171875, -25.11376953125, -23.9013671875, -22.68896484375, -21.4765625, -20.26416015625, -19.0517578125, -17.83935546875, -16.626953125, -15.41455078125, -14.2021484375, -12.98974609375, -11.77734375, -10.56494140625, -9.3525390625, -8.14013671875, -6.927734375, -5.71533203125, -4.5029296875, -3.29052734375, -2.078125, -0.86572265625, 0.3466796875, 1.55908203125, 2.771484375, 3.98388671875, 5.1962890625, 6.40869140625, 7.62109375, 8.83349609375, 10.0458984375, 11.25830078125, 12.470703125, 13.68310546875, 14.8955078125, 16.10791015625, 17.3203125, 18.53271484375, 19.7451171875, 20.95751953125, 22.169921875, 23.38232421875, 24.5947265625, 25.80712890625, 27.01953125, 28.23193359375, 29.4443359375, 30.65673828125, 31.869140625, 33.08154296875, 34.2939453125, 35.50634765625, 36.71875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 315.0, 658.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.85899353027344, -182.59104919433594, -171.3231201171875, -160.05517578125, -148.7872314453125, -137.519287109375, -126.25135040283203, -114.98341369628906, -103.71546936035156, -92.44752502441406, -81.1795883178711, -69.91165161132812, -58.643707275390625, -47.37576675415039, -36.107826232910156, -24.839889526367188, -13.571945190429688, -2.304004669189453, 8.963935852050781, 20.231876373291016, 31.49981689453125, 42.767757415771484, 54.03569793701172, 65.30363464355469, 76.57157897949219, 87.83952331542969, 99.10746002197266, 110.37539672851562, 121.64334106445312, 132.91128540039062, 144.17922973632812, 155.44715881347656, 166.715087890625, 177.9830322265625, 189.2509765625, 200.51890563964844, 211.78684997558594, 223.05479431152344, 234.32272338867188, 245.59066772460938, 256.8586120605469, 268.1265563964844, 279.3945007324219, 290.6624450683594, 301.93035888671875, 313.19830322265625, 324.46624755859375, 335.73419189453125, 347.00213623046875, 358.27008056640625, 369.53802490234375, 380.80596923828125, 392.07391357421875, 403.3418273925781, 414.6097717285156, 425.8777160644531, 437.1456604003906, 448.4136047363281, 459.6815490722656, 470.9494934082031, 482.2174072265625, 493.4853515625, 504.7532958984375, 516.021240234375, 527.2891845703125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 3.0, 8.0, 16.0, 7.0, 12.0, 13.0, 14.0, 17.0, 16.0, 29.0, 24.0, 25.0, 40.0, 40.0, 41.0, 42.0, 41.0, 47.0, 42.0, 42.0, 52.0, 45.0, 45.0, 36.0, 35.0, 28.0, 28.0, 27.0, 27.0, 23.0, 20.0, 20.0, 18.0, 13.0, 12.0, 8.0, 9.0, 3.0, 11.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.55177307128906, -33.365909576416016, -32.18004608154297, -30.99418067932129, -29.808317184448242, -28.622453689575195, -27.436588287353516, -26.25072479248047, -25.064861297607422, -23.878997802734375, -22.693134307861328, -21.50726890563965, -20.3214054107666, -19.135541915893555, -17.949676513671875, -16.763813018798828, -15.577949523925781, -14.392086029052734, -13.206221580505371, -12.020357131958008, -10.834493637084961, -9.648630142211914, -8.46276569366455, -7.2769012451171875, -6.091037750244141, -4.9051737785339355, -3.7193098068237305, -2.5334458351135254, -1.3475818634033203, -0.16171789169311523, 1.0241460800170898, 2.210010528564453, 3.3958702087402344, 4.5817341804504395, 5.7675981521606445, 6.95346212387085, 8.139326095581055, 9.325189590454102, 10.511054039001465, 11.696918487548828, 12.882781982421875, 14.068645477294922, 15.254509925842285, 16.44037437438965, 17.626237869262695, 18.812101364135742, 19.997966766357422, 21.18383026123047, 22.369693756103516, 23.555557250976562, 24.74142074584961, 25.92728614807129, 27.113149642944336, 28.299013137817383, 29.484878540039062, 30.67074203491211, 31.856605529785156, 33.0424690246582, 34.22833251953125, 35.4141960144043, 36.600059509277344, 37.785926818847656, 38.9717903137207, 40.15765380859375, 41.3435173034668]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 10.0, 11.0, 12.0, 10.0, 17.0, 16.0, 19.0, 19.0, 29.0, 24.0, 23.0, 34.0, 37.0, 37.0, 42.0, 35.0, 39.0, 55.0, 54.0, 38.0, 40.0, 35.0, 34.0, 31.0, 39.0, 23.0, 27.0, 12.0, 27.0, 26.0, 18.0, 14.0, 26.0, 16.0, 13.0, 7.0, 5.0, 7.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.77423095703125, -5.5679931640625, -5.36175537109375, -5.155517578125, -4.94927978515625, -4.7430419921875, -4.53680419921875, -4.33056640625, -4.12432861328125, -3.9180908203125, -3.71185302734375, -3.505615234375, -3.29937744140625, -3.0931396484375, -2.88690185546875, -2.6806640625, -2.47442626953125, -2.2681884765625, -2.06195068359375, -1.855712890625, -1.64947509765625, -1.4432373046875, -1.23699951171875, -1.03076171875, -0.82452392578125, -0.6182861328125, -0.41204833984375, -0.205810546875, 0.00042724609375, 0.2066650390625, 0.41290283203125, 0.619140625, 0.82537841796875, 1.0316162109375, 1.23785400390625, 1.444091796875, 1.65032958984375, 1.8565673828125, 2.06280517578125, 2.26904296875, 2.47528076171875, 2.6815185546875, 2.88775634765625, 3.093994140625, 3.30023193359375, 3.5064697265625, 3.71270751953125, 3.9189453125, 4.12518310546875, 4.3314208984375, 4.53765869140625, 4.743896484375, 4.95013427734375, 5.1563720703125, 5.36260986328125, 5.56884765625, 5.77508544921875, 5.9813232421875, 6.18756103515625, 6.393798828125, 6.60003662109375, 6.8062744140625, 7.01251220703125, 7.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 14.0, 4.0, 19.0, 28.0, 43.0, 60.0, 118.0, 172.0, 300.0, 536.0, 911.0, 1617.0, 2986.0, 5551.0, 10338.0, 20102.0, 41272.0, 87961.0, 187388.0, 295414.0, 204389.0, 96891.0, 45292.0, 22458.0, 11243.0, 6051.0, 3251.0, 1718.0, 991.0, 572.0, 336.0, 200.0, 124.0, 59.0, 49.0, 34.0, 21.0, 17.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1209030151367188, -1.0875091552734375, -1.0541152954101562, -1.020721435546875, -0.9873275756835938, -0.9539337158203125, -0.9205398559570312, -0.88714599609375, -0.8537521362304688, -0.8203582763671875, -0.7869644165039062, -0.753570556640625, -0.7201766967773438, -0.6867828369140625, -0.6533889770507812, -0.6199951171875, -0.5866012573242188, -0.5532073974609375, -0.5198135375976562, -0.486419677734375, -0.45302581787109375, -0.4196319580078125, -0.38623809814453125, -0.35284423828125, -0.31945037841796875, -0.2860565185546875, -0.25266265869140625, -0.219268798828125, -0.18587493896484375, -0.1524810791015625, -0.11908721923828125, -0.085693359375, -0.05229949951171875, -0.0189056396484375, 0.01448822021484375, 0.047882080078125, 0.08127593994140625, 0.1146697998046875, 0.14806365966796875, 0.18145751953125, 0.21485137939453125, 0.2482452392578125, 0.28163909912109375, 0.315032958984375, 0.34842681884765625, 0.3818206787109375, 0.41521453857421875, 0.4486083984375, 0.48200225830078125, 0.5153961181640625, 0.5487899780273438, 0.582183837890625, 0.6155776977539062, 0.6489715576171875, 0.6823654174804688, 0.71575927734375, 0.7491531372070312, 0.7825469970703125, 0.8159408569335938, 0.849334716796875, 0.8827285766601562, 0.9161224365234375, 0.9495162963867188, 0.98291015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 9.0, 7.0, 14.0, 9.0, 14.0, 22.0, 22.0, 27.0, 22.0, 28.0, 26.0, 27.0, 40.0, 29.0, 31.0, 43.0, 44.0, 50.0, 1065.0, 41.0, 40.0, 30.0, 39.0, 40.0, 25.0, 28.0, 30.0, 21.0, 35.0, 23.0, 17.0, 21.0, 17.0, 19.0, 9.0, 9.0, 9.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0], "bins": [-4.9609375, -4.823089599609375, -4.68524169921875, -4.547393798828125, -4.4095458984375, -4.271697998046875, -4.13385009765625, -3.996002197265625, -3.858154296875, -3.720306396484375, -3.58245849609375, -3.444610595703125, -3.3067626953125, -3.168914794921875, -3.03106689453125, -2.893218994140625, -2.75537109375, -2.617523193359375, -2.47967529296875, -2.341827392578125, -2.2039794921875, -2.066131591796875, -1.92828369140625, -1.790435791015625, -1.652587890625, -1.514739990234375, -1.37689208984375, -1.239044189453125, -1.1011962890625, -0.963348388671875, -0.82550048828125, -0.687652587890625, -0.5498046875, -0.411956787109375, -0.27410888671875, -0.136260986328125, 0.0015869140625, 0.139434814453125, 0.27728271484375, 0.415130615234375, 0.552978515625, 0.690826416015625, 0.82867431640625, 0.966522216796875, 1.1043701171875, 1.242218017578125, 1.38006591796875, 1.517913818359375, 1.65576171875, 1.793609619140625, 1.93145751953125, 2.069305419921875, 2.2071533203125, 2.345001220703125, 2.48284912109375, 2.620697021484375, 2.758544921875, 2.896392822265625, 3.03424072265625, 3.172088623046875, 3.3099365234375, 3.447784423828125, 3.58563232421875, 3.723480224609375, 3.861328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 12.0, 15.0, 24.0, 32.0, 30.0, 93.0, 136.0, 218.0, 454.0, 784.0, 1573.0, 3028.0, 6554.0, 14485.0, 33061.0, 80333.0, 212915.0, 1369636.0, 226317.0, 83673.0, 34924.0, 14999.0, 7106.0, 3264.0, 1534.0, 831.0, 462.0, 238.0, 146.0, 81.0, 53.0, 32.0, 26.0, 15.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0686569213867188, -1.0377044677734375, -1.0067520141601562, -0.975799560546875, -0.9448471069335938, -0.9138946533203125, -0.8829421997070312, -0.85198974609375, -0.8210372924804688, -0.7900848388671875, -0.7591323852539062, -0.728179931640625, -0.6972274780273438, -0.6662750244140625, -0.6353225708007812, -0.6043701171875, -0.5734176635742188, -0.5424652099609375, -0.5115127563476562, -0.480560302734375, -0.44960784912109375, -0.4186553955078125, -0.38770294189453125, -0.35675048828125, -0.32579803466796875, -0.2948455810546875, -0.26389312744140625, -0.232940673828125, -0.20198822021484375, -0.1710357666015625, -0.14008331298828125, -0.109130859375, -0.07817840576171875, -0.0472259521484375, -0.01627349853515625, 0.014678955078125, 0.04563140869140625, 0.0765838623046875, 0.10753631591796875, 0.13848876953125, 0.16944122314453125, 0.2003936767578125, 0.23134613037109375, 0.262298583984375, 0.29325103759765625, 0.3242034912109375, 0.35515594482421875, 0.3861083984375, 0.41706085205078125, 0.4480133056640625, 0.47896575927734375, 0.509918212890625, 0.5408706665039062, 0.5718231201171875, 0.6027755737304688, 0.63372802734375, 0.6646804809570312, 0.6956329345703125, 0.7265853881835938, 0.757537841796875, 0.7884902954101562, 0.8194427490234375, 0.8503952026367188, 0.88134765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 1.0, 9.0, 7.0, 22.0, 12.0, 15.0, 19.0, 21.0, 33.0, 27.0, 52.0, 48.0, 48.0, 53.0, 54.0, 47.0, 44.0, 43.0, 49.0, 53.0, 47.0, 39.0, 33.0, 39.0, 33.0, 31.0, 23.0, 18.0, 16.0, 5.0, 5.0, 12.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.043121337890625, -0.04175996780395508, -0.040398597717285156, -0.039037227630615234, -0.03767585754394531, -0.03631448745727539, -0.03495311737060547, -0.03359174728393555, -0.032230377197265625, -0.030869007110595703, -0.02950763702392578, -0.02814626693725586, -0.026784896850585938, -0.025423526763916016, -0.024062156677246094, -0.022700786590576172, -0.02133941650390625, -0.019978046417236328, -0.018616676330566406, -0.017255306243896484, -0.015893936157226562, -0.01453256607055664, -0.013171195983886719, -0.011809825897216797, -0.010448455810546875, -0.009087085723876953, -0.007725715637207031, -0.006364345550537109, -0.0050029754638671875, -0.0036416053771972656, -0.0022802352905273438, -0.0009188652038574219, 0.0004425048828125, 0.0018038749694824219, 0.0031652450561523438, 0.004526615142822266, 0.0058879852294921875, 0.007249355316162109, 0.008610725402832031, 0.009972095489501953, 0.011333465576171875, 0.012694835662841797, 0.014056205749511719, 0.01541757583618164, 0.016778945922851562, 0.018140316009521484, 0.019501686096191406, 0.020863056182861328, 0.02222442626953125, 0.023585796356201172, 0.024947166442871094, 0.026308536529541016, 0.027669906616210938, 0.02903127670288086, 0.03039264678955078, 0.0317540168762207, 0.033115386962890625, 0.03447675704956055, 0.03583812713623047, 0.03719949722290039, 0.03856086730957031, 0.039922237396240234, 0.041283607482910156, 0.04264497756958008, 0.04400634765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 4.0, 7.0, 11.0, 13.0, 14.0, 29.0, 43.0, 56.0, 68.0, 78.0, 126.0, 254.0, 555.0, 7327.0, 1034770.0, 3984.0, 496.0, 223.0, 140.0, 94.0, 53.0, 46.0, 44.0, 28.0, 18.0, 14.0, 10.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.224609375, -1.1856689453125, -1.146728515625, -1.1077880859375, -1.06884765625, -1.0299072265625, -0.990966796875, -0.9520263671875, -0.9130859375, -0.8741455078125, -0.835205078125, -0.7962646484375, -0.75732421875, -0.7183837890625, -0.679443359375, -0.6405029296875, -0.6015625, -0.5626220703125, -0.523681640625, -0.4847412109375, -0.44580078125, -0.4068603515625, -0.367919921875, -0.3289794921875, -0.2900390625, -0.2510986328125, -0.212158203125, -0.1732177734375, -0.13427734375, -0.0953369140625, -0.056396484375, -0.0174560546875, 0.021484375, 0.0604248046875, 0.099365234375, 0.1383056640625, 0.17724609375, 0.2161865234375, 0.255126953125, 0.2940673828125, 0.3330078125, 0.3719482421875, 0.410888671875, 0.4498291015625, 0.48876953125, 0.5277099609375, 0.566650390625, 0.6055908203125, 0.64453125, 0.6834716796875, 0.722412109375, 0.7613525390625, 0.80029296875, 0.8392333984375, 0.878173828125, 0.9171142578125, 0.9560546875, 0.9949951171875, 1.033935546875, 1.0728759765625, 1.11181640625, 1.1507568359375, 1.189697265625, 1.2286376953125, 1.267578125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 52.0, 791.0, 164.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10948170721530914, -0.08996988087892532, -0.0704580545425415, -0.050946228206157684, -0.031434401869773865, -0.011922575533390045, 0.007589250802993774, 0.02710108458995819, 0.046612903475761414, 0.06612472981214523, 0.08563655614852905, 0.10514838248491287, 0.12466020882129669, 0.1441720426082611, 0.16368386149406433, 0.18319569528102875, 0.20270751416683197, 0.2222193479537964, 0.2417311668395996, 0.26124298572540283, 0.28075480461120605, 0.30026665329933167, 0.3197784721851349, 0.3392903208732605, 0.3588021397590637, 0.37831395864486694, 0.39782577753067017, 0.4173376262187958, 0.436849445104599, 0.4563612639904022, 0.47587311267852783, 0.49538493156433105, 0.5148967504501343, 0.5344085693359375, 0.5539203882217407, 0.573432207107544, 0.5929440259933472, 0.6124559044837952, 0.6319677233695984, 0.6514795422554016, 0.6709913611412048, 0.6905031800270081, 0.7100149989128113, 0.7295268177986145, 0.7490386962890625, 0.7685505151748657, 0.788062334060669, 0.8075741529464722, 0.8270859718322754, 0.8465977907180786, 0.8661096096038818, 0.8856214284896851, 0.9051332473754883, 0.9246451258659363, 0.9441569447517395, 0.9636687636375427, 0.983180582523346, 1.002692461013794, 1.0222042798995972, 1.0417160987854004, 1.0612279176712036, 1.0807397365570068, 1.10025155544281, 1.1197633743286133, 1.1392751932144165]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 12.0, 18.0, 17.0, 25.0, 32.0, 26.0, 31.0, 28.0, 41.0, 50.0, 46.0, 35.0, 53.0, 43.0, 44.0, 45.0, 51.0, 39.0, 38.0, 37.0, 36.0, 30.0, 30.0, 37.0, 24.0, 19.0, 13.0, 18.0, 11.0, 10.0, 11.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07285809516906738, -0.07038619369268417, -0.06791429221630096, -0.06544238328933716, -0.06297048181295395, -0.06049858033657074, -0.05802667513489723, -0.055554769933223724, -0.053082868456840515, -0.050610966980457306, -0.0481390617787838, -0.04566715657711029, -0.04319525510072708, -0.04072335362434387, -0.038251448422670364, -0.03577954322099686, -0.03330764174461365, -0.03083573840558529, -0.02836383506655693, -0.025891931727528572, -0.023420028388500214, -0.020948125049471855, -0.018476221710443497, -0.016004318371415138, -0.01353241503238678, -0.011060511693358421, -0.008588608354330063, -0.006116705015301704, -0.003644801676273346, -0.0011728983372449875, 0.001299005001783371, 0.0037709083408117294, 0.006242811679840088, 0.008714715018868446, 0.011186618357896805, 0.013658521696925163, 0.01613042503595352, 0.01860232837498188, 0.02107423171401024, 0.023546135053038597, 0.026018038392066956, 0.028489941731095314, 0.030961845070123672, 0.03343375027179718, 0.03590565174818039, 0.0383775532245636, 0.040849458426237106, 0.043321363627910614, 0.04579326510429382, 0.04826516658067703, 0.05073707178235054, 0.05320897698402405, 0.05568087846040726, 0.058152779936790466, 0.060624685138463974, 0.06309659034013748, 0.06556849181652069, 0.0680403932929039, 0.07051229476928711, 0.07298420369625092, 0.07545610517263412, 0.07792800664901733, 0.08039991557598114, 0.08287181705236435, 0.08534371852874756]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 9.0, 13.0, 9.0, 17.0, 20.0, 19.0, 25.0, 25.0, 29.0, 26.0, 19.0, 36.0, 22.0, 38.0, 47.0, 43.0, 45.0, 38.0, 43.0, 37.0, 42.0, 32.0, 32.0, 35.0, 27.0, 35.0, 27.0, 24.0, 25.0, 21.0, 19.0, 12.0, 16.0, 16.0, 14.0, 9.0, 11.0, 4.0, 11.0, 2.0, 3.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.22265625, -6.01934814453125, -5.8160400390625, -5.61273193359375, -5.409423828125, -5.20611572265625, -5.0028076171875, -4.79949951171875, -4.59619140625, -4.39288330078125, -4.1895751953125, -3.98626708984375, -3.782958984375, -3.57965087890625, -3.3763427734375, -3.17303466796875, -2.9697265625, -2.76641845703125, -2.5631103515625, -2.35980224609375, -2.156494140625, -1.95318603515625, -1.7498779296875, -1.54656982421875, -1.34326171875, -1.13995361328125, -0.9366455078125, -0.73333740234375, -0.530029296875, -0.32672119140625, -0.1234130859375, 0.07989501953125, 0.283203125, 0.48651123046875, 0.6898193359375, 0.89312744140625, 1.096435546875, 1.29974365234375, 1.5030517578125, 1.70635986328125, 1.90966796875, 2.11297607421875, 2.3162841796875, 2.51959228515625, 2.722900390625, 2.92620849609375, 3.1295166015625, 3.33282470703125, 3.5361328125, 3.73944091796875, 3.9427490234375, 4.14605712890625, 4.349365234375, 4.55267333984375, 4.7559814453125, 4.95928955078125, 5.16259765625, 5.36590576171875, 5.5692138671875, 5.77252197265625, 5.975830078125, 6.17913818359375, 6.3824462890625, 6.58575439453125, 6.7890625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 12.0, 14.0, 18.0, 27.0, 50.0, 62.0, 103.0, 140.0, 193.0, 308.0, 499.0, 703.0, 1108.0, 1809.0, 2887.0, 4690.0, 7837.0, 13347.0, 23670.0, 42373.0, 79913.0, 151869.0, 258738.0, 210770.0, 111869.0, 58794.0, 32197.0, 18049.0, 10263.0, 6030.0, 3884.0, 2199.0, 1448.0, 901.0, 593.0, 365.0, 248.0, 183.0, 120.0, 79.0, 56.0, 38.0, 34.0, 21.0, 11.0, 8.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.75390625, -6.53436279296875, -6.3148193359375, -6.09527587890625, -5.875732421875, -5.65618896484375, -5.4366455078125, -5.21710205078125, -4.99755859375, -4.77801513671875, -4.5584716796875, -4.33892822265625, -4.119384765625, -3.89984130859375, -3.6802978515625, -3.46075439453125, -3.2412109375, -3.02166748046875, -2.8021240234375, -2.58258056640625, -2.363037109375, -2.14349365234375, -1.9239501953125, -1.70440673828125, -1.48486328125, -1.26531982421875, -1.0457763671875, -0.82623291015625, -0.606689453125, -0.38714599609375, -0.1676025390625, 0.05194091796875, 0.271484375, 0.49102783203125, 0.7105712890625, 0.93011474609375, 1.149658203125, 1.36920166015625, 1.5887451171875, 1.80828857421875, 2.02783203125, 2.24737548828125, 2.4669189453125, 2.68646240234375, 2.906005859375, 3.12554931640625, 3.3450927734375, 3.56463623046875, 3.7841796875, 4.00372314453125, 4.2232666015625, 4.44281005859375, 4.662353515625, 4.88189697265625, 5.1014404296875, 5.32098388671875, 5.54052734375, 5.76007080078125, 5.9796142578125, 6.19915771484375, 6.418701171875, 6.63824462890625, 6.8577880859375, 7.07733154296875, 7.296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 5.0, 10.0, 8.0, 12.0, 21.0, 21.0, 22.0, 25.0, 34.0, 19.0, 49.0, 45.0, 55.0, 72.0, 96.0, 181.0, 1313.0, 332.0, 193.0, 109.0, 84.0, 50.0, 38.0, 44.0, 24.0, 34.0, 18.0, 23.0, 22.0, 9.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.16650390625, -15.5673828125, -14.96826171875, -14.369140625, -13.77001953125, -13.1708984375, -12.57177734375, -11.97265625, -11.37353515625, -10.7744140625, -10.17529296875, -9.576171875, -8.97705078125, -8.3779296875, -7.77880859375, -7.1796875, -6.58056640625, -5.9814453125, -5.38232421875, -4.783203125, -4.18408203125, -3.5849609375, -2.98583984375, -2.38671875, -1.78759765625, -1.1884765625, -0.58935546875, 0.009765625, 0.60888671875, 1.2080078125, 1.80712890625, 2.40625, 3.00537109375, 3.6044921875, 4.20361328125, 4.802734375, 5.40185546875, 6.0009765625, 6.60009765625, 7.19921875, 7.79833984375, 8.3974609375, 8.99658203125, 9.595703125, 10.19482421875, 10.7939453125, 11.39306640625, 11.9921875, 12.59130859375, 13.1904296875, 13.78955078125, 14.388671875, 14.98779296875, 15.5869140625, 16.18603515625, 16.78515625, 17.38427734375, 17.9833984375, 18.58251953125, 19.181640625, 19.78076171875, 20.3798828125, 20.97900390625, 21.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 8.0, 10.0, 6.0, 13.0, 14.0, 18.0, 22.0, 53.0, 36.0, 72.0, 86.0, 112.0, 192.0, 245.0, 374.0, 753.0, 2210.0, 10947.0, 96159.0, 2238114.0, 745153.0, 42046.0, 5885.0, 1508.0, 563.0, 304.0, 223.0, 136.0, 115.0, 78.0, 38.0, 48.0, 35.0, 28.0, 17.0, 18.0, 11.0, 11.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.65625, -25.84423828125, -25.0322265625, -24.22021484375, -23.408203125, -22.59619140625, -21.7841796875, -20.97216796875, -20.16015625, -19.34814453125, -18.5361328125, -17.72412109375, -16.912109375, -16.10009765625, -15.2880859375, -14.47607421875, -13.6640625, -12.85205078125, -12.0400390625, -11.22802734375, -10.416015625, -9.60400390625, -8.7919921875, -7.97998046875, -7.16796875, -6.35595703125, -5.5439453125, -4.73193359375, -3.919921875, -3.10791015625, -2.2958984375, -1.48388671875, -0.671875, 0.14013671875, 0.9521484375, 1.76416015625, 2.576171875, 3.38818359375, 4.2001953125, 5.01220703125, 5.82421875, 6.63623046875, 7.4482421875, 8.26025390625, 9.072265625, 9.88427734375, 10.6962890625, 11.50830078125, 12.3203125, 13.13232421875, 13.9443359375, 14.75634765625, 15.568359375, 16.38037109375, 17.1923828125, 18.00439453125, 18.81640625, 19.62841796875, 20.4404296875, 21.25244140625, 22.064453125, 22.87646484375, 23.6884765625, 24.50048828125, 25.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [5.0, 205.0, 739.0, 69.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.383800506591797, -15.29759407043457, -4.211387634277344, 6.874820709228516, 17.96102523803711, 29.047229766845703, 40.13344192504883, 51.21964645385742, 62.305850982666016, 73.39205932617188, 84.47826385498047, 95.56446838378906, 106.65068054199219, 117.73687744140625, 128.82308959960938, 139.9093017578125, 150.99549865722656, 162.0817108154297, 173.16790771484375, 184.25411987304688, 195.34033203125, 206.42652893066406, 217.5127410888672, 228.59893798828125, 239.68515014648438, 250.7713623046875, 261.8575744628906, 272.94378662109375, 284.02996826171875, 295.1161804199219, 306.202392578125, 317.2886047363281, 328.37481689453125, 339.4610290527344, 350.5472412109375, 361.6334228515625, 372.7196350097656, 383.80584716796875, 394.8920593261719, 405.978271484375, 417.064453125, 428.1506652832031, 439.23687744140625, 450.32305908203125, 461.4092712402344, 472.4954833984375, 483.5816955566406, 494.66790771484375, 505.7541198730469, 516.84033203125, 527.926513671875, 539.0127563476562, 550.0989379882812, 561.1851806640625, 572.2713623046875, 583.3575439453125, 594.4437866210938, 605.5299682617188, 616.6162109375, 627.702392578125, 638.7886352539062, 649.8748168945312, 660.9610595703125, 672.0472412109375, 683.1334228515625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 2.0, 10.0, 9.0, 7.0, 8.0, 13.0, 16.0, 17.0, 21.0, 35.0, 17.0, 32.0, 26.0, 24.0, 39.0, 42.0, 33.0, 32.0, 43.0, 50.0, 40.0, 49.0, 44.0, 35.0, 40.0, 33.0, 36.0, 17.0, 28.0, 40.0, 18.0, 22.0, 12.0, 17.0, 20.0, 11.0, 14.0, 11.0, 8.0, 12.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-52.304683685302734, -50.9275016784668, -49.55031967163086, -48.17313766479492, -46.79595184326172, -45.41876983642578, -44.041587829589844, -42.664405822753906, -41.28722381591797, -39.91004180908203, -38.532859802246094, -37.155677795410156, -35.77849578857422, -34.401309967041016, -33.02412796020508, -31.64694595336914, -30.269763946533203, -28.892581939697266, -27.515399932861328, -26.138216018676758, -24.76103401184082, -23.383852005004883, -22.006668090820312, -20.629486083984375, -19.252304077148438, -17.8751220703125, -16.497940063476562, -15.120756149291992, -13.743574142456055, -12.366392135620117, -10.989209175109863, -9.61202621459961, -8.234840393066406, -6.8576579093933105, -5.480475425720215, -4.103292942047119, -2.7261104583740234, -1.3489279747009277, 0.02825450897216797, 1.4054374694824219, 2.7826194763183594, 4.159801959991455, 5.536984443664551, 6.9141669273376465, 8.291349411010742, 9.66853141784668, 11.045714378356934, 12.422897338867188, 13.800079345703125, 15.177261352539062, 16.554443359375, 17.93162727355957, 19.308809280395508, 20.685991287231445, 22.063175201416016, 23.440357208251953, 24.81753921508789, 26.194721221923828, 27.571903228759766, 28.949087142944336, 30.326269149780273, 31.70345115661621, 33.08063507080078, 34.45781707763672, 35.834999084472656]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 10.0, 13.0, 16.0, 16.0, 26.0, 20.0, 27.0, 23.0, 37.0, 43.0, 35.0, 40.0, 37.0, 39.0, 42.0, 47.0, 34.0, 51.0, 37.0, 41.0, 41.0, 30.0, 30.0, 29.0, 32.0, 30.0, 28.0, 22.0, 25.0, 15.0, 8.0, 7.0, 7.0, 8.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.0546875, -6.82916259765625, -6.6036376953125, -6.37811279296875, -6.152587890625, -5.92706298828125, -5.7015380859375, -5.47601318359375, -5.25048828125, -5.02496337890625, -4.7994384765625, -4.57391357421875, -4.348388671875, -4.12286376953125, -3.8973388671875, -3.67181396484375, -3.4462890625, -3.22076416015625, -2.9952392578125, -2.76971435546875, -2.544189453125, -2.31866455078125, -2.0931396484375, -1.86761474609375, -1.64208984375, -1.41656494140625, -1.1910400390625, -0.96551513671875, -0.739990234375, -0.51446533203125, -0.2889404296875, -0.06341552734375, 0.162109375, 0.38763427734375, 0.6131591796875, 0.83868408203125, 1.064208984375, 1.28973388671875, 1.5152587890625, 1.74078369140625, 1.96630859375, 2.19183349609375, 2.4173583984375, 2.64288330078125, 2.868408203125, 3.09393310546875, 3.3194580078125, 3.54498291015625, 3.7705078125, 3.99603271484375, 4.2215576171875, 4.44708251953125, 4.672607421875, 4.89813232421875, 5.1236572265625, 5.34918212890625, 5.57470703125, 5.80023193359375, 6.0257568359375, 6.25128173828125, 6.476806640625, 6.70233154296875, 6.9278564453125, 7.15338134765625, 7.37890625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 11.0, 11.0, 25.0, 27.0, 36.0, 81.0, 105.0, 144.0, 228.0, 370.0, 564.0, 904.0, 1495.0, 2607.0, 4455.0, 8754.0, 18087.0, 44253.0, 134028.0, 498792.0, 1620417.0, 1329495.0, 361846.0, 99868.0, 35282.0, 14979.0, 7388.0, 4077.0, 2333.0, 1344.0, 804.0, 487.0, 331.0, 192.0, 141.0, 99.0, 68.0, 44.0, 20.0, 29.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.4765625, -9.21246337890625, -8.9483642578125, -8.68426513671875, -8.420166015625, -8.15606689453125, -7.8919677734375, -7.62786865234375, -7.36376953125, -7.09967041015625, -6.8355712890625, -6.57147216796875, -6.307373046875, -6.04327392578125, -5.7791748046875, -5.51507568359375, -5.2509765625, -4.98687744140625, -4.7227783203125, -4.45867919921875, -4.194580078125, -3.93048095703125, -3.6663818359375, -3.40228271484375, -3.13818359375, -2.87408447265625, -2.6099853515625, -2.34588623046875, -2.081787109375, -1.81768798828125, -1.5535888671875, -1.28948974609375, -1.025390625, -0.76129150390625, -0.4971923828125, -0.23309326171875, 0.031005859375, 0.29510498046875, 0.5592041015625, 0.82330322265625, 1.08740234375, 1.35150146484375, 1.6156005859375, 1.87969970703125, 2.143798828125, 2.40789794921875, 2.6719970703125, 2.93609619140625, 3.2001953125, 3.46429443359375, 3.7283935546875, 3.99249267578125, 4.256591796875, 4.52069091796875, 4.7847900390625, 5.04888916015625, 5.31298828125, 5.57708740234375, 5.8411865234375, 6.10528564453125, 6.369384765625, 6.63348388671875, 6.8975830078125, 7.16168212890625, 7.42578125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 16.0, 14.0, 20.0, 17.0, 25.0, 40.0, 67.0, 91.0, 105.0, 176.0, 236.0, 375.0, 535.0, 625.0, 519.0, 348.0, 234.0, 184.0, 120.0, 79.0, 56.0, 48.0, 36.0, 23.0, 14.0, 15.0, 9.0, 11.0, 2.0, 10.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.390625, -10.060302734375, -9.72998046875, -9.399658203125, -9.0693359375, -8.739013671875, -8.40869140625, -8.078369140625, -7.748046875, -7.417724609375, -7.08740234375, -6.757080078125, -6.4267578125, -6.096435546875, -5.76611328125, -5.435791015625, -5.10546875, -4.775146484375, -4.44482421875, -4.114501953125, -3.7841796875, -3.453857421875, -3.12353515625, -2.793212890625, -2.462890625, -2.132568359375, -1.80224609375, -1.471923828125, -1.1416015625, -0.811279296875, -0.48095703125, -0.150634765625, 0.1796875, 0.510009765625, 0.84033203125, 1.170654296875, 1.5009765625, 1.831298828125, 2.16162109375, 2.491943359375, 2.822265625, 3.152587890625, 3.48291015625, 3.813232421875, 4.1435546875, 4.473876953125, 4.80419921875, 5.134521484375, 5.46484375, 5.795166015625, 6.12548828125, 6.455810546875, 6.7861328125, 7.116455078125, 7.44677734375, 7.777099609375, 8.107421875, 8.437744140625, 8.76806640625, 9.098388671875, 9.4287109375, 9.759033203125, 10.08935546875, 10.419677734375, 10.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 20.0, 20.0, 29.0, 52.0, 70.0, 88.0, 151.0, 336.0, 867.0, 3226.0, 16218.0, 110954.0, 1823580.0, 2092757.0, 122922.0, 17632.0, 3526.0, 1006.0, 359.0, 136.0, 101.0, 67.0, 38.0, 33.0, 17.0, 15.0, 13.0, 9.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.65625, -22.9609375, -22.265625, -21.5703125, -20.875, -20.1796875, -19.484375, -18.7890625, -18.09375, -17.3984375, -16.703125, -16.0078125, -15.3125, -14.6171875, -13.921875, -13.2265625, -12.53125, -11.8359375, -11.140625, -10.4453125, -9.75, -9.0546875, -8.359375, -7.6640625, -6.96875, -6.2734375, -5.578125, -4.8828125, -4.1875, -3.4921875, -2.796875, -2.1015625, -1.40625, -0.7109375, -0.015625, 0.6796875, 1.375, 2.0703125, 2.765625, 3.4609375, 4.15625, 4.8515625, 5.546875, 6.2421875, 6.9375, 7.6328125, 8.328125, 9.0234375, 9.71875, 10.4140625, 11.109375, 11.8046875, 12.5, 13.1953125, 13.890625, 14.5859375, 15.28125, 15.9765625, 16.671875, 17.3671875, 18.0625, 18.7578125, 19.453125, 20.1484375, 20.84375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 16.0, 19.0, 62.0, 97.0, 168.0, 184.0, 196.0, 129.0, 72.0, 35.0, 22.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.97679901123047, -73.7922592163086, -71.60772705078125, -69.42318725585938, -67.23865509033203, -65.05411529541016, -62.86957931518555, -60.68504333496094, -58.50050735473633, -56.31597137451172, -54.13143539428711, -51.9468994140625, -49.762359619140625, -47.57782745361328, -45.393287658691406, -43.2087516784668, -41.02421569824219, -38.83967971801758, -36.65514373779297, -34.47060775756836, -32.28607177734375, -30.101533889770508, -27.916996002197266, -25.732460021972656, -23.547924041748047, -21.363388061523438, -19.178852081298828, -16.994314193725586, -14.809778213500977, -12.625242233276367, -10.440705299377441, -8.256168365478516, -6.0716400146484375, -3.88710355758667, -1.7025671005249023, 0.48196935653686523, 2.666505813598633, 4.851041793823242, 7.035578727722168, 9.220115661621094, 11.404651641845703, 13.589187622070312, 15.773724555969238, 17.958261489868164, 20.142797470092773, 22.327333450317383, 24.511871337890625, 26.696407318115234, 28.880943298339844, 31.065479278564453, 33.25001525878906, 35.43455123901367, 37.61908721923828, 39.803627014160156, 41.988162994384766, 44.172698974609375, 46.357234954833984, 48.541770935058594, 50.7263069152832, 52.91084289550781, 55.09538269042969, 57.27991485595703, 59.464454650878906, 61.648990631103516, 63.833526611328125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 13.0, 18.0, 10.0, 18.0, 14.0, 16.0, 18.0, 26.0, 29.0, 31.0, 32.0, 26.0, 45.0, 35.0, 35.0, 35.0, 53.0, 47.0, 47.0, 42.0, 29.0, 37.0, 38.0, 33.0, 27.0, 30.0, 27.0, 27.0, 21.0, 25.0, 19.0, 12.0, 10.0, 20.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-31.154857635498047, -30.19528579711914, -29.235713958740234, -28.276142120361328, -27.316570281982422, -26.356998443603516, -25.39742660522461, -24.437854766845703, -23.478282928466797, -22.51871109008789, -21.559139251708984, -20.599567413330078, -19.639995574951172, -18.680423736572266, -17.72085189819336, -16.761280059814453, -15.80171012878418, -14.842138290405273, -13.882566452026367, -12.922994613647461, -11.963422775268555, -11.003850936889648, -10.044280052185059, -9.084708213806152, -8.125136375427246, -7.16556453704834, -6.205992698669434, -5.2464213371276855, -4.286849498748779, -3.327277660369873, -2.367706298828125, -1.4081344604492188, -0.4485607147216797, 0.511011004447937, 1.4705827236175537, 2.430154323577881, 3.389726161956787, 4.349298000335693, 5.308869361877441, 6.268441200256348, 7.228013038635254, 8.18758487701416, 9.147156715393066, 10.106727600097656, 11.066299438476562, 12.025871276855469, 12.985443115234375, 13.945014953613281, 14.904586791992188, 15.864158630371094, 16.82373046875, 17.783302307128906, 18.742874145507812, 19.70244598388672, 20.662017822265625, 21.62158966064453, 22.581161499023438, 23.540733337402344, 24.50030517578125, 25.459877014160156, 26.419448852539062, 27.37902069091797, 28.338592529296875, 29.29816436767578, 30.257734298706055]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 9.0, 4.0, 8.0, 13.0, 14.0, 23.0, 20.0, 30.0, 27.0, 44.0, 27.0, 49.0, 41.0, 38.0, 36.0, 63.0, 63.0, 46.0, 47.0, 50.0, 47.0, 35.0, 36.0, 35.0, 29.0, 20.0, 22.0, 19.0, 16.0, 13.0, 7.0, 19.0, 7.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.48046875, -7.23590087890625, -6.9913330078125, -6.74676513671875, -6.502197265625, -6.25762939453125, -6.0130615234375, -5.76849365234375, -5.52392578125, -5.27935791015625, -5.0347900390625, -4.79022216796875, -4.545654296875, -4.30108642578125, -4.0565185546875, -3.81195068359375, -3.5673828125, -3.32281494140625, -3.0782470703125, -2.83367919921875, -2.589111328125, -2.34454345703125, -2.0999755859375, -1.85540771484375, -1.61083984375, -1.36627197265625, -1.1217041015625, -0.87713623046875, -0.632568359375, -0.38800048828125, -0.1434326171875, 0.10113525390625, 0.345703125, 0.59027099609375, 0.8348388671875, 1.07940673828125, 1.323974609375, 1.56854248046875, 1.8131103515625, 2.05767822265625, 2.30224609375, 2.54681396484375, 2.7913818359375, 3.03594970703125, 3.280517578125, 3.52508544921875, 3.7696533203125, 4.01422119140625, 4.2587890625, 4.50335693359375, 4.7479248046875, 4.99249267578125, 5.237060546875, 5.48162841796875, 5.7261962890625, 5.97076416015625, 6.21533203125, 6.45989990234375, 6.7044677734375, 6.94903564453125, 7.193603515625, 7.43817138671875, 7.6827392578125, 7.92730712890625, 8.171875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 19.0, 26.0, 22.0, 29.0, 53.0, 79.0, 108.0, 141.0, 224.0, 303.0, 518.0, 747.0, 1101.0, 1724.0, 2712.0, 4380.0, 6894.0, 11372.0, 19090.0, 32292.0, 55727.0, 97957.0, 162959.0, 213931.0, 175908.0, 108300.0, 62025.0, 35721.0, 20731.0, 12671.0, 7626.0, 4640.0, 2902.0, 1881.0, 1283.0, 788.0, 491.0, 387.0, 264.0, 168.0, 103.0, 72.0, 52.0, 39.0, 26.0, 19.0, 14.0, 15.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.859375, -0.8330078125, -0.806640625, -0.7802734375, -0.75390625, -0.7275390625, -0.701171875, -0.6748046875, -0.6484375, -0.6220703125, -0.595703125, -0.5693359375, -0.54296875, -0.5166015625, -0.490234375, -0.4638671875, -0.4375, -0.4111328125, -0.384765625, -0.3583984375, -0.33203125, -0.3056640625, -0.279296875, -0.2529296875, -0.2265625, -0.2001953125, -0.173828125, -0.1474609375, -0.12109375, -0.0947265625, -0.068359375, -0.0419921875, -0.015625, 0.0107421875, 0.037109375, 0.0634765625, 0.08984375, 0.1162109375, 0.142578125, 0.1689453125, 0.1953125, 0.2216796875, 0.248046875, 0.2744140625, 0.30078125, 0.3271484375, 0.353515625, 0.3798828125, 0.40625, 0.4326171875, 0.458984375, 0.4853515625, 0.51171875, 0.5380859375, 0.564453125, 0.5908203125, 0.6171875, 0.6435546875, 0.669921875, 0.6962890625, 0.72265625, 0.7490234375, 0.775390625, 0.8017578125, 0.828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 9.0, 5.0, 5.0, 16.0, 16.0, 26.0, 15.0, 23.0, 22.0, 26.0, 37.0, 25.0, 42.0, 41.0, 46.0, 42.0, 37.0, 1059.0, 48.0, 43.0, 39.0, 43.0, 43.0, 39.0, 28.0, 31.0, 33.0, 27.0, 27.0, 20.0, 17.0, 15.0, 18.0, 15.0, 8.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.685546875, -4.52734375, -4.369140625, -4.2109375, -4.052734375, -3.89453125, -3.736328125, -3.578125, -3.419921875, -3.26171875, -3.103515625, -2.9453125, -2.787109375, -2.62890625, -2.470703125, -2.3125, -2.154296875, -1.99609375, -1.837890625, -1.6796875, -1.521484375, -1.36328125, -1.205078125, -1.046875, -0.888671875, -0.73046875, -0.572265625, -0.4140625, -0.255859375, -0.09765625, 0.060546875, 0.21875, 0.376953125, 0.53515625, 0.693359375, 0.8515625, 1.009765625, 1.16796875, 1.326171875, 1.484375, 1.642578125, 1.80078125, 1.958984375, 2.1171875, 2.275390625, 2.43359375, 2.591796875, 2.75, 2.908203125, 3.06640625, 3.224609375, 3.3828125, 3.541015625, 3.69921875, 3.857421875, 4.015625, 4.173828125, 4.33203125, 4.490234375, 4.6484375, 4.806640625, 4.96484375, 5.123046875, 5.28125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 18.0, 23.0, 29.0, 50.0, 67.0, 119.0, 226.0, 386.0, 735.0, 1432.0, 2814.0, 5629.0, 12348.0, 27676.0, 66064.0, 165838.0, 1276489.0, 343576.0, 111824.0, 45209.0, 19239.0, 8743.0, 4163.0, 2034.0, 1058.0, 558.0, 317.0, 175.0, 101.0, 49.0, 35.0, 20.0, 23.0, 10.0, 12.0, 5.0, 5.0, 4.0, 2.0, 5.0, 5.0], "bins": [-1.26953125, -1.2376251220703125, -1.205718994140625, -1.1738128662109375, -1.14190673828125, -1.1100006103515625, -1.078094482421875, -1.0461883544921875, -1.0142822265625, -0.9823760986328125, -0.950469970703125, -0.9185638427734375, -0.88665771484375, -0.8547515869140625, -0.822845458984375, -0.7909393310546875, -0.759033203125, -0.7271270751953125, -0.695220947265625, -0.6633148193359375, -0.63140869140625, -0.5995025634765625, -0.567596435546875, -0.5356903076171875, -0.5037841796875, -0.4718780517578125, -0.439971923828125, -0.4080657958984375, -0.37615966796875, -0.3442535400390625, -0.312347412109375, -0.2804412841796875, -0.24853515625, -0.2166290283203125, -0.184722900390625, -0.1528167724609375, -0.12091064453125, -0.0890045166015625, -0.057098388671875, -0.0251922607421875, 0.0067138671875, 0.0386199951171875, 0.070526123046875, 0.1024322509765625, 0.13433837890625, 0.1662445068359375, 0.198150634765625, 0.2300567626953125, 0.261962890625, 0.2938690185546875, 0.325775146484375, 0.3576812744140625, 0.38958740234375, 0.4214935302734375, 0.453399658203125, 0.4853057861328125, 0.5172119140625, 0.5491180419921875, 0.581024169921875, 0.6129302978515625, 0.64483642578125, 0.6767425537109375, 0.708648681640625, 0.7405548095703125, 0.7724609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 7.0, 10.0, 13.0, 9.0, 14.0, 14.0, 16.0, 24.0, 29.0, 47.0, 48.0, 49.0, 62.0, 49.0, 63.0, 72.0, 76.0, 65.0, 54.0, 37.0, 41.0, 22.0, 18.0, 23.0, 16.0, 14.0, 18.0, 11.0, 6.0, 7.0, 7.0, 5.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.058929443359375, -0.05719280242919922, -0.05545616149902344, -0.053719520568847656, -0.051982879638671875, -0.050246238708496094, -0.04850959777832031, -0.04677295684814453, -0.04503631591796875, -0.04329967498779297, -0.04156303405761719, -0.039826393127441406, -0.038089752197265625, -0.036353111267089844, -0.03461647033691406, -0.03287982940673828, -0.0311431884765625, -0.02940654754638672, -0.027669906616210938, -0.025933265686035156, -0.024196624755859375, -0.022459983825683594, -0.020723342895507812, -0.01898670196533203, -0.01725006103515625, -0.015513420104980469, -0.013776779174804688, -0.012040138244628906, -0.010303497314453125, -0.008566856384277344, -0.0068302154541015625, -0.005093574523925781, -0.00335693359375, -0.0016202926635742188, 0.0001163482666015625, 0.0018529891967773438, 0.003589630126953125, 0.005326271057128906, 0.0070629119873046875, 0.008799552917480469, 0.01053619384765625, 0.012272834777832031, 0.014009475708007812, 0.015746116638183594, 0.017482757568359375, 0.019219398498535156, 0.020956039428710938, 0.02269268035888672, 0.0244293212890625, 0.02616596221923828, 0.027902603149414062, 0.029639244079589844, 0.031375885009765625, 0.033112525939941406, 0.03484916687011719, 0.03658580780029297, 0.03832244873046875, 0.04005908966064453, 0.04179573059082031, 0.043532371520996094, 0.045269012451171875, 0.047005653381347656, 0.04874229431152344, 0.05047893524169922, 0.052215576171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 12.0, 11.0, 15.0, 12.0, 14.0, 16.0, 28.0, 19.0, 27.0, 45.0, 39.0, 87.0, 128.0, 183.0, 301.0, 763.0, 8708.0, 1020078.0, 16168.0, 847.0, 319.0, 185.0, 125.0, 98.0, 65.0, 42.0, 26.0, 22.0, 25.0, 19.0, 14.0, 17.0, 13.0, 7.0, 5.0, 7.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.0947265625, -1.0600433349609375, -1.025360107421875, -0.9906768798828125, -0.95599365234375, -0.9213104248046875, -0.886627197265625, -0.8519439697265625, -0.8172607421875, -0.7825775146484375, -0.747894287109375, -0.7132110595703125, -0.67852783203125, -0.6438446044921875, -0.609161376953125, -0.5744781494140625, -0.539794921875, -0.5051116943359375, -0.470428466796875, -0.4357452392578125, -0.40106201171875, -0.3663787841796875, -0.331695556640625, -0.2970123291015625, -0.2623291015625, -0.2276458740234375, -0.192962646484375, -0.1582794189453125, -0.12359619140625, -0.0889129638671875, -0.054229736328125, -0.0195465087890625, 0.01513671875, 0.0498199462890625, 0.084503173828125, 0.1191864013671875, 0.15386962890625, 0.1885528564453125, 0.223236083984375, 0.2579193115234375, 0.2926025390625, 0.3272857666015625, 0.361968994140625, 0.3966522216796875, 0.43133544921875, 0.4660186767578125, 0.500701904296875, 0.5353851318359375, 0.570068359375, 0.6047515869140625, 0.639434814453125, 0.6741180419921875, 0.70880126953125, 0.7434844970703125, 0.778167724609375, 0.8128509521484375, 0.8475341796875, 0.8822174072265625, 0.916900634765625, 0.9515838623046875, 0.98626708984375, 1.0209503173828125, 1.055633544921875, 1.0903167724609375, 1.125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 10.0, 20.0, 41.0, 89.0, 190.0, 279.0, 213.0, 99.0, 40.0, 20.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09815242141485214, -0.09309753775596619, -0.08804265409708023, -0.08298777043819427, -0.07793288677930832, -0.07287800312042236, -0.06782311201095581, -0.06276823580265045, -0.0577133484184742, -0.05265846475958824, -0.047603581100702286, -0.04254869371652603, -0.037493810057640076, -0.03243892639875412, -0.027384042739868164, -0.022329159080982208, -0.017274275422096252, -0.012219391763210297, -0.007164507173001766, -0.0021096225827932358, 0.00294526107609272, 0.008000144734978676, 0.013055030256509781, 0.018109913915395737, 0.023164797574281693, 0.02821968123316765, 0.033274564892053604, 0.03832945227622986, 0.043384335935115814, 0.04843921959400177, 0.053494103252887726, 0.05854898691177368, 0.06360387802124023, 0.06865876168012619, 0.07371364533901215, 0.0787685289978981, 0.08382341265678406, 0.08887829631567001, 0.09393317997455597, 0.09898807108402252, 0.10404294729232788, 0.10909783095121384, 0.11415271461009979, 0.11920759826898575, 0.1242624819278717, 0.12931737303733826, 0.13437224924564362, 0.13942714035511017, 0.14448201656341553, 0.14953690767288208, 0.15459178388118744, 0.159646674990654, 0.16470155119895935, 0.1697564423084259, 0.17481131851673126, 0.17986620962619781, 0.18492110073566437, 0.18997599184513092, 0.19503086805343628, 0.20008575916290283, 0.2051406353712082, 0.21019552648067474, 0.2152504026889801, 0.22030529379844666, 0.22536017000675201]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 2.0, 8.0, 11.0, 9.0, 13.0, 19.0, 12.0, 14.0, 18.0, 18.0, 24.0, 26.0, 22.0, 28.0, 34.0, 28.0, 28.0, 27.0, 31.0, 54.0, 37.0, 39.0, 46.0, 37.0, 30.0, 41.0, 22.0, 28.0, 23.0, 24.0, 35.0, 24.0, 28.0, 18.0, 16.0, 15.0, 12.0, 10.0, 11.0, 13.0, 11.0, 5.0, 13.0, 5.0, 8.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.05248302221298218, -0.05086439102888107, -0.04924575984477997, -0.047627128660678864, -0.04600849747657776, -0.044389866292476654, -0.04277123510837555, -0.041152603924274445, -0.03953397274017334, -0.037915341556072235, -0.03629671037197113, -0.034678079187870026, -0.03305944800376892, -0.031440816819667816, -0.02982218563556671, -0.028203554451465607, -0.026584923267364502, -0.024966292083263397, -0.023347660899162292, -0.021729029715061188, -0.020110398530960083, -0.01849176734685898, -0.016873136162757874, -0.015254504978656769, -0.013635873794555664, -0.01201724261045456, -0.010398611426353455, -0.00877998024225235, -0.007161349058151245, -0.00554271787405014, -0.003924086689949036, -0.002305455505847931, -0.0006868243217468262, 0.0009318068623542786, 0.0025504380464553833, 0.004169069230556488, 0.005787700414657593, 0.0074063315987586975, 0.009024962782859802, 0.010643593966960907, 0.012262225151062012, 0.013880856335163116, 0.015499487519264221, 0.017118118703365326, 0.01873674988746643, 0.020355381071567535, 0.02197401225566864, 0.023592643439769745, 0.02521127462387085, 0.026829905807971954, 0.02844853699207306, 0.030067168176174164, 0.03168579936027527, 0.03330443054437637, 0.03492306172847748, 0.03654169291257858, 0.03816032409667969, 0.03977895528078079, 0.0413975864648819, 0.043016217648983, 0.044634848833084106, 0.04625348001718521, 0.047872111201286316, 0.04949074238538742, 0.051109373569488525]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 13.0, 4.0, 11.0, 9.0, 16.0, 15.0, 26.0, 18.0, 24.0, 26.0, 33.0, 40.0, 34.0, 30.0, 42.0, 43.0, 53.0, 58.0, 49.0, 49.0, 42.0, 46.0, 44.0, 39.0, 28.0, 26.0, 25.0, 21.0, 19.0, 9.0, 22.0, 17.0, 8.0, 12.0, 6.0, 6.0, 6.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.328125, -7.0987548828125, -6.869384765625, -6.6400146484375, -6.41064453125, -6.1812744140625, -5.951904296875, -5.7225341796875, -5.4931640625, -5.2637939453125, -5.034423828125, -4.8050537109375, -4.57568359375, -4.3463134765625, -4.116943359375, -3.8875732421875, -3.658203125, -3.4288330078125, -3.199462890625, -2.9700927734375, -2.74072265625, -2.5113525390625, -2.281982421875, -2.0526123046875, -1.8232421875, -1.5938720703125, -1.364501953125, -1.1351318359375, -0.90576171875, -0.6763916015625, -0.447021484375, -0.2176513671875, 0.01171875, 0.2410888671875, 0.470458984375, 0.6998291015625, 0.92919921875, 1.1585693359375, 1.387939453125, 1.6173095703125, 1.8466796875, 2.0760498046875, 2.305419921875, 2.5347900390625, 2.76416015625, 2.9935302734375, 3.222900390625, 3.4522705078125, 3.681640625, 3.9110107421875, 4.140380859375, 4.3697509765625, 4.59912109375, 4.8284912109375, 5.057861328125, 5.2872314453125, 5.5166015625, 5.7459716796875, 5.975341796875, 6.2047119140625, 6.43408203125, 6.6634521484375, 6.892822265625, 7.1221923828125, 7.3515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 13.0, 10.0, 22.0, 14.0, 19.0, 39.0, 41.0, 57.0, 88.0, 120.0, 202.0, 281.0, 435.0, 735.0, 1113.0, 1714.0, 2995.0, 4995.0, 8897.0, 15772.0, 28541.0, 55344.0, 119517.0, 266040.0, 281843.0, 130233.0, 59261.0, 30669.0, 16773.0, 9193.0, 5376.0, 3140.0, 1923.0, 1081.0, 691.0, 420.0, 313.0, 196.0, 125.0, 77.0, 69.0, 56.0, 30.0, 29.0, 16.0, 15.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.61328125, -7.35992431640625, -7.1065673828125, -6.85321044921875, -6.599853515625, -6.34649658203125, -6.0931396484375, -5.83978271484375, -5.58642578125, -5.33306884765625, -5.0797119140625, -4.82635498046875, -4.572998046875, -4.31964111328125, -4.0662841796875, -3.81292724609375, -3.5595703125, -3.30621337890625, -3.0528564453125, -2.79949951171875, -2.546142578125, -2.29278564453125, -2.0394287109375, -1.78607177734375, -1.53271484375, -1.27935791015625, -1.0260009765625, -0.77264404296875, -0.519287109375, -0.26593017578125, -0.0125732421875, 0.24078369140625, 0.494140625, 0.74749755859375, 1.0008544921875, 1.25421142578125, 1.507568359375, 1.76092529296875, 2.0142822265625, 2.26763916015625, 2.52099609375, 2.77435302734375, 3.0277099609375, 3.28106689453125, 3.534423828125, 3.78778076171875, 4.0411376953125, 4.29449462890625, 4.5478515625, 4.80120849609375, 5.0545654296875, 5.30792236328125, 5.561279296875, 5.81463623046875, 6.0679931640625, 6.32135009765625, 6.57470703125, 6.82806396484375, 7.0814208984375, 7.33477783203125, 7.588134765625, 7.84149169921875, 8.0948486328125, 8.34820556640625, 8.6015625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 9.0, 9.0, 8.0, 13.0, 9.0, 9.0, 19.0, 23.0, 23.0, 18.0, 23.0, 35.0, 33.0, 38.0, 48.0, 61.0, 92.0, 134.0, 219.0, 1336.0, 245.0, 146.0, 89.0, 63.0, 52.0, 30.0, 34.0, 35.0, 38.0, 30.0, 23.0, 18.0, 13.0, 23.0, 10.0, 5.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.841796875, -12.33984375, -11.837890625, -11.3359375, -10.833984375, -10.33203125, -9.830078125, -9.328125, -8.826171875, -8.32421875, -7.822265625, -7.3203125, -6.818359375, -6.31640625, -5.814453125, -5.3125, -4.810546875, -4.30859375, -3.806640625, -3.3046875, -2.802734375, -2.30078125, -1.798828125, -1.296875, -0.794921875, -0.29296875, 0.208984375, 0.7109375, 1.212890625, 1.71484375, 2.216796875, 2.71875, 3.220703125, 3.72265625, 4.224609375, 4.7265625, 5.228515625, 5.73046875, 6.232421875, 6.734375, 7.236328125, 7.73828125, 8.240234375, 8.7421875, 9.244140625, 9.74609375, 10.248046875, 10.75, 11.251953125, 11.75390625, 12.255859375, 12.7578125, 13.259765625, 13.76171875, 14.263671875, 14.765625, 15.267578125, 15.76953125, 16.271484375, 16.7734375, 17.275390625, 17.77734375, 18.279296875, 18.78125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 2.0, 7.0, 10.0, 14.0, 22.0, 12.0, 25.0, 42.0, 38.0, 69.0, 101.0, 132.0, 204.0, 338.0, 528.0, 1218.0, 4126.0, 23720.0, 281348.0, 2652874.0, 158990.0, 16307.0, 3082.0, 1007.0, 463.0, 312.0, 202.0, 149.0, 103.0, 56.0, 56.0, 35.0, 32.0, 14.0, 11.0, 11.0, 8.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.34375, -23.515869140625, -22.68798828125, -21.860107421875, -21.0322265625, -20.204345703125, -19.37646484375, -18.548583984375, -17.720703125, -16.892822265625, -16.06494140625, -15.237060546875, -14.4091796875, -13.581298828125, -12.75341796875, -11.925537109375, -11.09765625, -10.269775390625, -9.44189453125, -8.614013671875, -7.7861328125, -6.958251953125, -6.13037109375, -5.302490234375, -4.474609375, -3.646728515625, -2.81884765625, -1.990966796875, -1.1630859375, -0.335205078125, 0.49267578125, 1.320556640625, 2.1484375, 2.976318359375, 3.80419921875, 4.632080078125, 5.4599609375, 6.287841796875, 7.11572265625, 7.943603515625, 8.771484375, 9.599365234375, 10.42724609375, 11.255126953125, 12.0830078125, 12.910888671875, 13.73876953125, 14.566650390625, 15.39453125, 16.222412109375, 17.05029296875, 17.878173828125, 18.7060546875, 19.533935546875, 20.36181640625, 21.189697265625, 22.017578125, 22.845458984375, 23.67333984375, 24.501220703125, 25.3291015625, 26.156982421875, 26.98486328125, 27.812744140625, 28.640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 61.0, 234.0, 422.0, 214.0, 46.0, 17.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.1397933959961, -83.39500427246094, -77.65020751953125, -71.9054183959961, -66.1606216430664, -60.41583251953125, -54.67103958129883, -48.926246643066406, -43.181453704833984, -37.43666076660156, -31.69186782836914, -25.94707679748535, -20.20228385925293, -14.457490921020508, -8.712699890136719, -2.967906951904297, 2.776885986328125, 8.521678924560547, 14.266470909118652, 20.011262893676758, 25.75605583190918, 31.5008487701416, 37.24563980102539, 42.99043273925781, 48.735225677490234, 54.480018615722656, 60.22481155395508, 65.9696044921875, 71.71439361572266, 77.45919036865234, 83.2039794921875, 88.94877624511719, 94.69355773925781, 100.43834686279297, 106.18314361572266, 111.92793273925781, 117.6727294921875, 123.41751861572266, 129.1623077392578, 134.9071044921875, 140.6519012451172, 146.39669799804688, 152.1414794921875, 157.8862762451172, 163.63107299804688, 169.37586975097656, 175.1206512451172, 180.86544799804688, 186.6102294921875, 192.3550262451172, 198.0998077392578, 203.8446044921875, 209.5894012451172, 215.33419799804688, 221.0789794921875, 226.8237762451172, 232.56857299804688, 238.31336975097656, 244.0581512451172, 249.80294799804688, 255.54774475097656, 261.29254150390625, 267.0373229980469, 272.7821044921875, 278.52691650390625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 5.0, 15.0, 11.0, 18.0, 14.0, 21.0, 19.0, 19.0, 25.0, 24.0, 28.0, 38.0, 32.0, 44.0, 45.0, 39.0, 41.0, 55.0, 45.0, 34.0, 39.0, 28.0, 43.0, 38.0, 36.0, 27.0, 27.0, 23.0, 18.0, 18.0, 24.0, 14.0, 13.0, 13.0, 17.0, 14.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.63214111328125, -37.38907241821289, -36.14600372314453, -34.90293884277344, -33.65987014770508, -32.41680145263672, -31.17373275756836, -29.930665969848633, -28.687599182128906, -27.444530487060547, -26.20146369934082, -24.95839500427246, -23.715328216552734, -22.472259521484375, -21.229190826416016, -19.98612403869629, -18.74305534362793, -17.49998664855957, -16.256919860839844, -15.013851165771484, -13.770784378051758, -12.527715682983398, -11.284647941589355, -10.041580200195312, -8.79851245880127, -7.555444717407227, -6.312376976013184, -5.069308757781982, -3.8262410163879395, -2.5831732749938965, -1.3401050567626953, -0.09703731536865234, 1.1460304260253906, 2.3890981674194336, 3.6321661472320557, 4.875234127044678, 6.118301868438721, 7.361369609832764, 8.604437828063965, 9.847505569458008, 11.09057331085205, 12.333641052246094, 13.576708793640137, 14.81977653503418, 16.06284523010254, 17.305912017822266, 18.548980712890625, 19.792049407958984, 21.03511619567871, 22.27818489074707, 23.521251678466797, 24.764320373535156, 26.007387161254883, 27.250455856323242, 28.49352264404297, 29.736591339111328, 30.979660034179688, 32.22272872924805, 33.465797424316406, 34.7088623046875, 35.95193099975586, 37.19499969482422, 38.43806838989258, 39.68113708496094, 40.92420196533203]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 10.0, 15.0, 13.0, 6.0, 16.0, 20.0, 28.0, 39.0, 27.0, 29.0, 45.0, 38.0, 54.0, 42.0, 44.0, 58.0, 37.0, 42.0, 56.0, 53.0, 27.0, 39.0, 30.0, 35.0, 24.0, 20.0, 25.0, 17.0, 22.0, 10.0, 10.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.1663818359375, -6.918701171875, -6.6710205078125, -6.42333984375, -6.1756591796875, -5.927978515625, -5.6802978515625, -5.4326171875, -5.1849365234375, -4.937255859375, -4.6895751953125, -4.44189453125, -4.1942138671875, -3.946533203125, -3.6988525390625, -3.451171875, -3.2034912109375, -2.955810546875, -2.7081298828125, -2.46044921875, -2.2127685546875, -1.965087890625, -1.7174072265625, -1.4697265625, -1.2220458984375, -0.974365234375, -0.7266845703125, -0.47900390625, -0.2313232421875, 0.016357421875, 0.2640380859375, 0.51171875, 0.7593994140625, 1.007080078125, 1.2547607421875, 1.50244140625, 1.7501220703125, 1.997802734375, 2.2454833984375, 2.4931640625, 2.7408447265625, 2.988525390625, 3.2362060546875, 3.48388671875, 3.7315673828125, 3.979248046875, 4.2269287109375, 4.474609375, 4.7222900390625, 4.969970703125, 5.2176513671875, 5.46533203125, 5.7130126953125, 5.960693359375, 6.2083740234375, 6.4560546875, 6.7037353515625, 6.951416015625, 7.1990966796875, 7.44677734375, 7.6944580078125, 7.942138671875, 8.1898193359375, 8.4375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 13.0, 10.0, 12.0, 18.0, 15.0, 36.0, 39.0, 46.0, 36.0, 67.0, 89.0, 127.0, 167.0, 231.0, 444.0, 1025.0, 5582.0, 217258.0, 3927406.0, 37064.0, 2676.0, 731.0, 309.0, 222.0, 155.0, 90.0, 73.0, 65.0, 43.0, 35.0, 27.0, 28.0, 21.0, 18.0, 8.0, 18.0, 9.0, 10.0, 5.0, 11.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-50.96875, -49.34130859375, -47.7138671875, -46.08642578125, -44.458984375, -42.83154296875, -41.2041015625, -39.57666015625, -37.94921875, -36.32177734375, -34.6943359375, -33.06689453125, -31.439453125, -29.81201171875, -28.1845703125, -26.55712890625, -24.9296875, -23.30224609375, -21.6748046875, -20.04736328125, -18.419921875, -16.79248046875, -15.1650390625, -13.53759765625, -11.91015625, -10.28271484375, -8.6552734375, -7.02783203125, -5.400390625, -3.77294921875, -2.1455078125, -0.51806640625, 1.109375, 2.73681640625, 4.3642578125, 5.99169921875, 7.619140625, 9.24658203125, 10.8740234375, 12.50146484375, 14.12890625, 15.75634765625, 17.3837890625, 19.01123046875, 20.638671875, 22.26611328125, 23.8935546875, 25.52099609375, 27.1484375, 28.77587890625, 30.4033203125, 32.03076171875, 33.658203125, 35.28564453125, 36.9130859375, 38.54052734375, 40.16796875, 41.79541015625, 43.4228515625, 45.05029296875, 46.677734375, 48.30517578125, 49.9326171875, 51.56005859375, 53.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 10.0, 5.0, 15.0, 23.0, 13.0, 28.0, 57.0, 64.0, 87.0, 143.0, 197.0, 333.0, 608.0, 759.0, 604.0, 394.0, 238.0, 145.0, 96.0, 60.0, 49.0, 33.0, 25.0, 21.0, 10.0, 11.0, 8.0, 6.0, 6.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9627685546875, -10.566162109375, -10.1695556640625, -9.77294921875, -9.3763427734375, -8.979736328125, -8.5831298828125, -8.1865234375, -7.7899169921875, -7.393310546875, -6.9967041015625, -6.60009765625, -6.2034912109375, -5.806884765625, -5.4102783203125, -5.013671875, -4.6170654296875, -4.220458984375, -3.8238525390625, -3.42724609375, -3.0306396484375, -2.634033203125, -2.2374267578125, -1.8408203125, -1.4442138671875, -1.047607421875, -0.6510009765625, -0.25439453125, 0.1422119140625, 0.538818359375, 0.9354248046875, 1.33203125, 1.7286376953125, 2.125244140625, 2.5218505859375, 2.91845703125, 3.3150634765625, 3.711669921875, 4.1082763671875, 4.5048828125, 4.9014892578125, 5.298095703125, 5.6947021484375, 6.09130859375, 6.4879150390625, 6.884521484375, 7.2811279296875, 7.677734375, 8.0743408203125, 8.470947265625, 8.8675537109375, 9.26416015625, 9.6607666015625, 10.057373046875, 10.4539794921875, 10.8505859375, 11.2471923828125, 11.643798828125, 12.0404052734375, 12.43701171875, 12.8336181640625, 13.230224609375, 13.6268310546875, 14.0234375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 8.0, 9.0, 10.0, 9.0, 19.0, 28.0, 42.0, 64.0, 89.0, 172.0, 329.0, 616.0, 1438.0, 4085.0, 20614.0, 240609.0, 3654317.0, 244086.0, 20642.0, 4178.0, 1421.0, 633.0, 315.0, 205.0, 120.0, 59.0, 49.0, 31.0, 22.0, 19.0, 10.0, 11.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.328125, -25.334716796875, -24.34130859375, -23.347900390625, -22.3544921875, -21.361083984375, -20.36767578125, -19.374267578125, -18.380859375, -17.387451171875, -16.39404296875, -15.400634765625, -14.4072265625, -13.413818359375, -12.42041015625, -11.427001953125, -10.43359375, -9.440185546875, -8.44677734375, -7.453369140625, -6.4599609375, -5.466552734375, -4.47314453125, -3.479736328125, -2.486328125, -1.492919921875, -0.49951171875, 0.493896484375, 1.4873046875, 2.480712890625, 3.47412109375, 4.467529296875, 5.4609375, 6.454345703125, 7.44775390625, 8.441162109375, 9.4345703125, 10.427978515625, 11.42138671875, 12.414794921875, 13.408203125, 14.401611328125, 15.39501953125, 16.388427734375, 17.3818359375, 18.375244140625, 19.36865234375, 20.362060546875, 21.35546875, 22.348876953125, 23.34228515625, 24.335693359375, 25.3291015625, 26.322509765625, 27.31591796875, 28.309326171875, 29.302734375, 30.296142578125, 31.28955078125, 32.282958984375, 33.2763671875, 34.269775390625, 35.26318359375, 36.256591796875, 37.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 19.0, 29.0, 58.0, 111.0, 160.0, 173.0, 173.0, 140.0, 71.0, 42.0, 13.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.17195892333984, -124.71599578857422, -122.2600326538086, -119.80406951904297, -117.34810638427734, -114.89214324951172, -112.4361801147461, -109.98021697998047, -107.52425384521484, -105.06829071044922, -102.6123275756836, -100.15636444091797, -97.70040130615234, -95.24443817138672, -92.7884750366211, -90.33251190185547, -87.87654113769531, -85.42057800292969, -82.96461486816406, -80.50865173339844, -78.05268859863281, -75.59672546386719, -73.14076232910156, -70.68479919433594, -68.22883605957031, -65.77287292480469, -63.31690979003906, -60.86094665527344, -58.40498352050781, -55.94902038574219, -53.49305725097656, -51.03709411621094, -48.581138610839844, -46.12517547607422, -43.669212341308594, -41.21324920654297, -38.757286071777344, -36.30132293701172, -33.845359802246094, -31.389394760131836, -28.933429718017578, -26.477466583251953, -24.021503448486328, -21.565540313720703, -19.109577178955078, -16.653614044189453, -14.197649002075195, -11.74168586730957, -9.285722732543945, -6.82975959777832, -4.373795986175537, -1.917832374572754, 0.5381307601928711, 2.994093894958496, 5.4500579833984375, 7.9060211181640625, 10.361984252929688, 12.817947387695312, 15.273910522460938, 17.729873657226562, 20.185836791992188, 22.641799926757812, 25.09776496887207, 27.553728103637695, 30.00969123840332]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 9.0, 8.0, 11.0, 13.0, 18.0, 24.0, 21.0, 28.0, 22.0, 30.0, 39.0, 30.0, 37.0, 32.0, 37.0, 42.0, 35.0, 42.0, 37.0, 44.0, 48.0, 36.0, 32.0, 34.0, 27.0, 22.0, 34.0, 22.0, 23.0, 17.0, 14.0, 14.0, 12.0, 16.0, 4.0, 9.0, 8.0, 9.0, 2.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-30.647640228271484, -29.681854248046875, -28.7160701751709, -27.75028419494629, -26.784500122070312, -25.818714141845703, -24.852928161621094, -23.887144088745117, -22.921358108520508, -21.9555721282959, -20.989788055419922, -20.024002075195312, -19.058218002319336, -18.092432022094727, -17.12664794921875, -16.16086196899414, -15.195076942443848, -14.229291915893555, -13.263506889343262, -12.297721862792969, -11.33193588256836, -10.366150856018066, -9.400365829467773, -8.434579849243164, -7.468795299530029, -6.503010272979736, -5.537224769592285, -4.571439743041992, -3.60565447807312, -2.639869213104248, -1.674084186553955, -0.7082986831665039, 0.25748634338378906, 1.2232716083526611, 2.189056873321533, 3.154841899871826, 4.120627403259277, 5.08641242980957, 6.052197456359863, 7.0179829597473145, 7.983767986297607, 8.949553489685059, 9.915338516235352, 10.881123542785645, 11.846908569335938, 12.812694549560547, 13.778478622436523, 14.744264602661133, 15.710049629211426, 16.67583465576172, 17.641620635986328, 18.607404708862305, 19.573190689086914, 20.53897476196289, 21.5047607421875, 22.47054672241211, 23.436330795288086, 24.402116775512695, 25.367900848388672, 26.33368682861328, 27.299470901489258, 28.265256881713867, 29.231040954589844, 30.196826934814453, 31.162612915039062]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 16.0, 18.0, 4.0, 26.0, 27.0, 26.0, 33.0, 33.0, 30.0, 38.0, 39.0, 53.0, 47.0, 67.0, 35.0, 43.0, 51.0, 57.0, 37.0, 42.0, 53.0, 38.0, 24.0, 28.0, 22.0, 10.0, 17.0, 9.0, 8.0, 16.0, 8.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.8807373046875, -6.620849609375, -6.3609619140625, -6.10107421875, -5.8411865234375, -5.581298828125, -5.3214111328125, -5.0615234375, -4.8016357421875, -4.541748046875, -4.2818603515625, -4.02197265625, -3.7620849609375, -3.502197265625, -3.2423095703125, -2.982421875, -2.7225341796875, -2.462646484375, -2.2027587890625, -1.94287109375, -1.6829833984375, -1.423095703125, -1.1632080078125, -0.9033203125, -0.6434326171875, -0.383544921875, -0.1236572265625, 0.13623046875, 0.3961181640625, 0.656005859375, 0.9158935546875, 1.17578125, 1.4356689453125, 1.695556640625, 1.9554443359375, 2.21533203125, 2.4752197265625, 2.735107421875, 2.9949951171875, 3.2548828125, 3.5147705078125, 3.774658203125, 4.0345458984375, 4.29443359375, 4.5543212890625, 4.814208984375, 5.0740966796875, 5.333984375, 5.5938720703125, 5.853759765625, 6.1136474609375, 6.37353515625, 6.6334228515625, 6.893310546875, 7.1531982421875, 7.4130859375, 7.6729736328125, 7.932861328125, 8.1927490234375, 8.45263671875, 8.7125244140625, 8.972412109375, 9.2322998046875, 9.4921875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 23.0, 28.0, 36.0, 52.0, 57.0, 79.0, 132.0, 165.0, 285.0, 342.0, 536.0, 806.0, 1329.0, 2172.0, 3779.0, 7711.0, 16902.0, 41179.0, 111075.0, 292477.0, 337988.0, 139912.0, 50834.0, 20332.0, 9164.0, 4480.0, 2421.0, 1409.0, 901.0, 570.0, 424.0, 259.0, 182.0, 141.0, 107.0, 68.0, 55.0, 34.0, 20.0, 11.0, 14.0, 7.0, 8.0, 8.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9326171875, -1.8704986572265625, -1.808380126953125, -1.7462615966796875, -1.68414306640625, -1.6220245361328125, -1.559906005859375, -1.4977874755859375, -1.4356689453125, -1.3735504150390625, -1.311431884765625, -1.2493133544921875, -1.18719482421875, -1.1250762939453125, -1.062957763671875, -1.0008392333984375, -0.938720703125, -0.8766021728515625, -0.814483642578125, -0.7523651123046875, -0.69024658203125, -0.6281280517578125, -0.566009521484375, -0.5038909912109375, -0.4417724609375, -0.3796539306640625, -0.317535400390625, -0.2554168701171875, -0.19329833984375, -0.1311798095703125, -0.069061279296875, -0.0069427490234375, 0.05517578125, 0.1172943115234375, 0.179412841796875, 0.2415313720703125, 0.30364990234375, 0.3657684326171875, 0.427886962890625, 0.4900054931640625, 0.5521240234375, 0.6142425537109375, 0.676361083984375, 0.7384796142578125, 0.80059814453125, 0.8627166748046875, 0.924835205078125, 0.9869537353515625, 1.049072265625, 1.1111907958984375, 1.173309326171875, 1.2354278564453125, 1.29754638671875, 1.3596649169921875, 1.421783447265625, 1.4839019775390625, 1.5460205078125, 1.6081390380859375, 1.670257568359375, 1.7323760986328125, 1.79449462890625, 1.8566131591796875, 1.918731689453125, 1.9808502197265625, 2.04296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 8.0, 4.0, 9.0, 7.0, 5.0, 11.0, 12.0, 18.0, 19.0, 20.0, 24.0, 24.0, 24.0, 28.0, 42.0, 42.0, 37.0, 57.0, 40.0, 53.0, 1063.0, 33.0, 48.0, 49.0, 35.0, 41.0, 31.0, 36.0, 28.0, 31.0, 38.0, 24.0, 21.0, 7.0, 13.0, 10.0, 11.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.52734375, -6.349609375, -6.171875, -5.994140625, -5.81640625, -5.638671875, -5.4609375, -5.283203125, -5.10546875, -4.927734375, -4.75, -4.572265625, -4.39453125, -4.216796875, -4.0390625, -3.861328125, -3.68359375, -3.505859375, -3.328125, -3.150390625, -2.97265625, -2.794921875, -2.6171875, -2.439453125, -2.26171875, -2.083984375, -1.90625, -1.728515625, -1.55078125, -1.373046875, -1.1953125, -1.017578125, -0.83984375, -0.662109375, -0.484375, -0.306640625, -0.12890625, 0.048828125, 0.2265625, 0.404296875, 0.58203125, 0.759765625, 0.9375, 1.115234375, 1.29296875, 1.470703125, 1.6484375, 1.826171875, 2.00390625, 2.181640625, 2.359375, 2.537109375, 2.71484375, 2.892578125, 3.0703125, 3.248046875, 3.42578125, 3.603515625, 3.78125, 3.958984375, 4.13671875, 4.314453125, 4.4921875, 4.669921875, 4.84765625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 14.0, 26.0, 33.0, 43.0, 60.0, 111.0, 139.0, 201.0, 337.0, 507.0, 794.0, 1308.0, 2183.0, 3978.0, 7812.0, 17794.0, 45869.0, 143948.0, 1074606.0, 609233.0, 117449.0, 39312.0, 15341.0, 7004.0, 3581.0, 2066.0, 1199.0, 751.0, 501.0, 277.0, 218.0, 137.0, 94.0, 46.0, 38.0, 34.0, 25.0, 13.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.478179931640625, -1.42706298828125, -1.375946044921875, -1.3248291015625, -1.273712158203125, -1.22259521484375, -1.171478271484375, -1.120361328125, -1.069244384765625, -1.01812744140625, -0.967010498046875, -0.9158935546875, -0.864776611328125, -0.81365966796875, -0.762542724609375, -0.71142578125, -0.660308837890625, -0.60919189453125, -0.558074951171875, -0.5069580078125, -0.455841064453125, -0.40472412109375, -0.353607177734375, -0.302490234375, -0.251373291015625, -0.20025634765625, -0.149139404296875, -0.0980224609375, -0.046905517578125, 0.00421142578125, 0.055328369140625, 0.1064453125, 0.157562255859375, 0.20867919921875, 0.259796142578125, 0.3109130859375, 0.362030029296875, 0.41314697265625, 0.464263916015625, 0.515380859375, 0.566497802734375, 0.61761474609375, 0.668731689453125, 0.7198486328125, 0.770965576171875, 0.82208251953125, 0.873199462890625, 0.92431640625, 0.975433349609375, 1.02655029296875, 1.077667236328125, 1.1287841796875, 1.179901123046875, 1.23101806640625, 1.282135009765625, 1.333251953125, 1.384368896484375, 1.43548583984375, 1.486602783203125, 1.5377197265625, 1.588836669921875, 1.63995361328125, 1.691070556640625, 1.7421875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 12.0, 23.0, 88.0, 423.0, 309.0, 75.0, 25.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7116012573242188, -0.6805267333984375, -0.6494522094726562, -0.618377685546875, -0.5873031616210938, -0.5562286376953125, -0.5251541137695312, -0.49407958984375, -0.46300506591796875, -0.4319305419921875, -0.40085601806640625, -0.369781494140625, -0.33870697021484375, -0.3076324462890625, -0.27655792236328125, -0.2454833984375, -0.21440887451171875, -0.1833343505859375, -0.15225982666015625, -0.121185302734375, -0.09011077880859375, -0.0590362548828125, -0.02796173095703125, 0.00311279296875, 0.03418731689453125, 0.0652618408203125, 0.09633636474609375, 0.127410888671875, 0.15848541259765625, 0.1895599365234375, 0.22063446044921875, 0.251708984375, 0.28278350830078125, 0.3138580322265625, 0.34493255615234375, 0.376007080078125, 0.40708160400390625, 0.4381561279296875, 0.46923065185546875, 0.50030517578125, 0.5313796997070312, 0.5624542236328125, 0.5935287475585938, 0.624603271484375, 0.6556777954101562, 0.6867523193359375, 0.7178268432617188, 0.7489013671875, 0.7799758911132812, 0.8110504150390625, 0.8421249389648438, 0.873199462890625, 0.9042739868164062, 0.9353485107421875, 0.9664230346679688, 0.99749755859375, 1.0285720825195312, 1.0596466064453125, 1.0907211303710938, 1.121795654296875, 1.1528701782226562, 1.1839447021484375, 1.2150192260742188, 1.24609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 1.0, 6.0, 11.0, 10.0, 14.0, 43.0, 84.0, 420.0, 7333.0, 1036801.0, 3373.0, 299.0, 71.0, 24.0, 13.0, 7.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.125, -22.5523681640625, -21.979736328125, -21.4071044921875, -20.83447265625, -20.2618408203125, -19.689208984375, -19.1165771484375, -18.5439453125, -17.9713134765625, -17.398681640625, -16.8260498046875, -16.25341796875, -15.6807861328125, -15.108154296875, -14.5355224609375, -13.962890625, -13.3902587890625, -12.817626953125, -12.2449951171875, -11.67236328125, -11.0997314453125, -10.527099609375, -9.9544677734375, -9.3818359375, -8.8092041015625, -8.236572265625, -7.6639404296875, -7.09130859375, -6.5186767578125, -5.946044921875, -5.3734130859375, -4.80078125, -4.2281494140625, -3.655517578125, -3.0828857421875, -2.51025390625, -1.9376220703125, -1.364990234375, -0.7923583984375, -0.2197265625, 0.3529052734375, 0.925537109375, 1.4981689453125, 2.07080078125, 2.6434326171875, 3.216064453125, 3.7886962890625, 4.361328125, 4.9339599609375, 5.506591796875, 6.0792236328125, 6.65185546875, 7.2244873046875, 7.797119140625, 8.3697509765625, 8.9423828125, 9.5150146484375, 10.087646484375, 10.6602783203125, 11.23291015625, 11.8055419921875, 12.378173828125, 12.9508056640625, 13.5234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 19.0, 45.0, 119.0, 325.0, 311.0, 128.0, 40.0, 15.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9082821607589722, -1.8553962707519531, -1.802510380744934, -1.749624490737915, -1.6967384815216064, -1.6438525915145874, -1.5909667015075684, -1.5380808115005493, -1.4851949214935303, -1.4323090314865112, -1.3794231414794922, -1.3265371322631836, -1.2736512422561646, -1.2207653522491455, -1.1678794622421265, -1.1149935722351074, -1.0621075630187988, -1.0092216730117798, -0.956335723400116, -0.9034498333930969, -0.8505638837814331, -0.7976779937744141, -0.744792103767395, -0.691906213760376, -0.6390202641487122, -0.5861343741416931, -0.5332484245300293, -0.48036253452301025, -0.4274766147136688, -0.3745906949043274, -0.32170480489730835, -0.2688188850879669, -0.21593284606933594, -0.1630469262599945, -0.11016102135181427, -0.05727511644363403, -0.0043891966342926025, 0.04849672317504883, 0.10138261318206787, 0.1542685329914093, 0.20715445280075073, 0.26004037261009216, 0.3129262924194336, 0.36581218242645264, 0.41869810223579407, 0.4715840220451355, 0.5244699120521545, 0.5773558616638184, 0.6302417516708374, 0.6831276416778564, 0.7360135912895203, 0.7888994812965393, 0.8417854309082031, 0.8946713209152222, 0.9475572109222412, 1.0004431009292603, 1.0533289909362793, 1.1062148809432983, 1.1591007709503174, 1.211986780166626, 1.264872670173645, 1.317758560180664, 1.370644450187683, 1.4235303401947021, 1.4764163494110107]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 7.0, 3.0, 5.0, 7.0, 14.0, 11.0, 9.0, 18.0, 14.0, 17.0, 15.0, 28.0, 28.0, 22.0, 28.0, 29.0, 36.0, 36.0, 38.0, 42.0, 32.0, 36.0, 48.0, 31.0, 36.0, 24.0, 31.0, 28.0, 38.0, 29.0, 25.0, 22.0, 27.0, 21.0, 27.0, 16.0, 15.0, 15.0, 9.0, 13.0, 13.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2979714274406433, -0.28837889432907104, -0.2787863612174988, -0.2691938281059265, -0.25960129499435425, -0.250008761882782, -0.24041621387004852, -0.23082368075847626, -0.221231147646904, -0.21163861453533173, -0.20204608142375946, -0.1924535483121872, -0.18286100029945374, -0.17326846718788147, -0.1636759340763092, -0.15408340096473694, -0.14449086785316467, -0.1348983347415924, -0.12530580163002014, -0.11571326106786728, -0.10612072795629501, -0.09652819484472275, -0.08693565428256989, -0.07734312117099762, -0.06775058805942535, -0.05815805494785309, -0.048565518110990524, -0.03897298127412796, -0.029380448162555695, -0.01978791505098343, -0.010195378214120865, -0.0006028413772583008, 0.008989691734313965, 0.01858222670853138, 0.028174761682748795, 0.03776729851961136, 0.047359831631183624, 0.05695236474275589, 0.06654490530490875, 0.07613743841648102, 0.08572997152805328, 0.09532250463962555, 0.10491503775119781, 0.11450757831335068, 0.12410011142492294, 0.1336926519870758, 0.14328518509864807, 0.15287771821022034, 0.1624702513217926, 0.17206278443336487, 0.18165531754493713, 0.1912478506565094, 0.20084038376808167, 0.21043291687965393, 0.2200254648923874, 0.22961799800395966, 0.23921053111553192, 0.2488030642271042, 0.25839561223983765, 0.2679881453514099, 0.2775806784629822, 0.28717321157455444, 0.2967657446861267, 0.306358277797699, 0.31595081090927124]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 1.0, 8.0, 6.0, 7.0, 19.0, 14.0, 21.0, 16.0, 16.0, 29.0, 29.0, 29.0, 37.0, 32.0, 33.0, 46.0, 47.0, 35.0, 57.0, 37.0, 41.0, 53.0, 46.0, 44.0, 30.0, 37.0, 39.0, 26.0, 15.0, 31.0, 16.0, 15.0, 8.0, 9.0, 8.0, 9.0, 7.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.90692138671875, -6.6771240234375, -6.44732666015625, -6.217529296875, -5.98773193359375, -5.7579345703125, -5.52813720703125, -5.29833984375, -5.06854248046875, -4.8387451171875, -4.60894775390625, -4.379150390625, -4.14935302734375, -3.9195556640625, -3.68975830078125, -3.4599609375, -3.23016357421875, -3.0003662109375, -2.77056884765625, -2.540771484375, -2.31097412109375, -2.0811767578125, -1.85137939453125, -1.62158203125, -1.39178466796875, -1.1619873046875, -0.93218994140625, -0.702392578125, -0.47259521484375, -0.2427978515625, -0.01300048828125, 0.216796875, 0.44659423828125, 0.6763916015625, 0.90618896484375, 1.135986328125, 1.36578369140625, 1.5955810546875, 1.82537841796875, 2.05517578125, 2.28497314453125, 2.5147705078125, 2.74456787109375, 2.974365234375, 3.20416259765625, 3.4339599609375, 3.66375732421875, 3.8935546875, 4.12335205078125, 4.3531494140625, 4.58294677734375, 4.812744140625, 5.04254150390625, 5.2723388671875, 5.50213623046875, 5.73193359375, 5.96173095703125, 6.1915283203125, 6.42132568359375, 6.651123046875, 6.88092041015625, 7.1107177734375, 7.34051513671875, 7.5703125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 11.0, 19.0, 17.0, 26.0, 30.0, 41.0, 52.0, 96.0, 102.0, 168.0, 278.0, 445.0, 724.0, 1356.0, 2749.0, 5697.0, 12637.0, 29003.0, 69201.0, 165482.0, 325345.0, 248244.0, 106743.0, 44413.0, 18820.0, 8457.0, 3865.0, 1930.0, 1017.0, 528.0, 332.0, 206.0, 126.0, 99.0, 67.0, 53.0, 34.0, 42.0, 15.0, 26.0, 12.0, 12.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.921875, -8.6219482421875, -8.322021484375, -8.0220947265625, -7.72216796875, -7.4222412109375, -7.122314453125, -6.8223876953125, -6.5224609375, -6.2225341796875, -5.922607421875, -5.6226806640625, -5.32275390625, -5.0228271484375, -4.722900390625, -4.4229736328125, -4.123046875, -3.8231201171875, -3.523193359375, -3.2232666015625, -2.92333984375, -2.6234130859375, -2.323486328125, -2.0235595703125, -1.7236328125, -1.4237060546875, -1.123779296875, -0.8238525390625, -0.52392578125, -0.2239990234375, 0.075927734375, 0.3758544921875, 0.67578125, 0.9757080078125, 1.275634765625, 1.5755615234375, 1.87548828125, 2.1754150390625, 2.475341796875, 2.7752685546875, 3.0751953125, 3.3751220703125, 3.675048828125, 3.9749755859375, 4.27490234375, 4.5748291015625, 4.874755859375, 5.1746826171875, 5.474609375, 5.7745361328125, 6.074462890625, 6.3743896484375, 6.67431640625, 6.9742431640625, 7.274169921875, 7.5740966796875, 7.8740234375, 8.1739501953125, 8.473876953125, 8.7738037109375, 9.07373046875, 9.3736572265625, 9.673583984375, 9.9735107421875, 10.2734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 9.0, 15.0, 24.0, 24.0, 39.0, 35.0, 48.0, 61.0, 92.0, 129.0, 212.0, 1397.0, 284.0, 185.0, 125.0, 77.0, 59.0, 55.0, 46.0, 25.0, 19.0, 9.0, 12.0, 10.0, 10.0, 7.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-24.484375, -23.7138671875, -22.943359375, -22.1728515625, -21.40234375, -20.6318359375, -19.861328125, -19.0908203125, -18.3203125, -17.5498046875, -16.779296875, -16.0087890625, -15.23828125, -14.4677734375, -13.697265625, -12.9267578125, -12.15625, -11.3857421875, -10.615234375, -9.8447265625, -9.07421875, -8.3037109375, -7.533203125, -6.7626953125, -5.9921875, -5.2216796875, -4.451171875, -3.6806640625, -2.91015625, -2.1396484375, -1.369140625, -0.5986328125, 0.171875, 0.9423828125, 1.712890625, 2.4833984375, 3.25390625, 4.0244140625, 4.794921875, 5.5654296875, 6.3359375, 7.1064453125, 7.876953125, 8.6474609375, 9.41796875, 10.1884765625, 10.958984375, 11.7294921875, 12.5, 13.2705078125, 14.041015625, 14.8115234375, 15.58203125, 16.3525390625, 17.123046875, 17.8935546875, 18.6640625, 19.4345703125, 20.205078125, 20.9755859375, 21.74609375, 22.5166015625, 23.287109375, 24.0576171875, 24.828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 4.0, 13.0, 16.0, 19.0, 34.0, 39.0, 69.0, 90.0, 140.0, 208.0, 320.0, 643.0, 1724.0, 16363.0, 3101583.0, 20993.0, 1765.0, 690.0, 333.0, 205.0, 141.0, 89.0, 52.0, 43.0, 34.0, 25.0, 17.0, 13.0, 13.0, 7.0, 3.0, 0.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.0, -79.5537109375, -77.107421875, -74.6611328125, -72.21484375, -69.7685546875, -67.322265625, -64.8759765625, -62.4296875, -59.9833984375, -57.537109375, -55.0908203125, -52.64453125, -50.1982421875, -47.751953125, -45.3056640625, -42.859375, -40.4130859375, -37.966796875, -35.5205078125, -33.07421875, -30.6279296875, -28.181640625, -25.7353515625, -23.2890625, -20.8427734375, -18.396484375, -15.9501953125, -13.50390625, -11.0576171875, -8.611328125, -6.1650390625, -3.71875, -1.2724609375, 1.173828125, 3.6201171875, 6.06640625, 8.5126953125, 10.958984375, 13.4052734375, 15.8515625, 18.2978515625, 20.744140625, 23.1904296875, 25.63671875, 28.0830078125, 30.529296875, 32.9755859375, 35.421875, 37.8681640625, 40.314453125, 42.7607421875, 45.20703125, 47.6533203125, 50.099609375, 52.5458984375, 54.9921875, 57.4384765625, 59.884765625, 62.3310546875, 64.77734375, 67.2236328125, 69.669921875, 72.1162109375, 74.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 27.0, 74.0, 184.0, 338.0, 247.0, 93.0, 24.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.49199676513672, -103.90157318115234, -98.31114196777344, -92.72071838378906, -87.13028717041016, -81.53986358642578, -75.94943237304688, -70.3590087890625, -64.76858520507812, -59.178157806396484, -53.587730407714844, -47.99730682373047, -42.40687561035156, -36.81645202636719, -31.226024627685547, -25.635597229003906, -20.045166015625, -14.45473861694336, -8.864312171936035, -3.273885726928711, 2.3165416717529297, 7.90696907043457, 13.497394561767578, 19.08782196044922, 24.67824935913086, 30.2686767578125, 35.85910415649414, 41.44953155517578, 47.039955139160156, 52.63038635253906, 58.22080993652344, 63.81123733520508, 69.40165710449219, 74.99208068847656, 80.58251190185547, 86.17293548583984, 91.76336669921875, 97.35379028320312, 102.9442138671875, 108.5346450805664, 114.12507629394531, 119.71549987792969, 125.3059310913086, 130.8963623046875, 136.48678588867188, 142.07720947265625, 147.66763305664062, 153.258056640625, 158.84848022460938, 164.43890380859375, 170.02932739257812, 175.61976623535156, 181.21018981933594, 186.8006134033203, 192.3910369873047, 197.98147583007812, 203.5718994140625, 209.16232299804688, 214.75274658203125, 220.3431854248047, 225.93360900878906, 231.52403259277344, 237.1144561767578, 242.70489501953125, 248.29531860351562]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 9.0, 8.0, 12.0, 19.0, 17.0, 21.0, 21.0, 25.0, 33.0, 16.0, 28.0, 25.0, 38.0, 37.0, 32.0, 36.0, 32.0, 39.0, 41.0, 37.0, 41.0, 42.0, 37.0, 36.0, 29.0, 33.0, 29.0, 29.0, 17.0, 24.0, 21.0, 14.0, 16.0, 16.0, 12.0, 8.0, 8.0, 8.0, 8.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0], "bins": [-60.11222839355469, -58.45820236206055, -56.804176330566406, -55.150150299072266, -53.496124267578125, -51.84209442138672, -50.18806838989258, -48.53404235839844, -46.8800163269043, -45.225990295410156, -43.571964263916016, -41.917938232421875, -40.26390838623047, -38.609886169433594, -36.95585632324219, -35.30183029174805, -33.647804260253906, -31.993778228759766, -30.339752197265625, -28.68572425842285, -27.03169822692871, -25.37767219543457, -23.723644256591797, -22.069618225097656, -20.415592193603516, -18.761566162109375, -17.107540130615234, -15.453512191772461, -13.79948616027832, -12.14546012878418, -10.491433143615723, -8.837406158447266, -7.183376312255859, -5.5293498039245605, -3.8753232955932617, -2.221296787261963, -0.5672702789306641, 1.0867557525634766, 2.7407827377319336, 4.394809722900391, 6.048835754394531, 7.70286226272583, 9.356888771057129, 11.010915756225586, 12.664941787719727, 14.318967819213867, 15.972994804382324, 17.62702178955078, 19.281047821044922, 20.935073852539062, 22.589099884033203, 24.243127822875977, 25.897153854370117, 27.551179885864258, 29.20520782470703, 30.859233856201172, 32.51325988769531, 34.16728591918945, 35.821311950683594, 37.475337982177734, 39.129364013671875, 40.78339385986328, 42.43741989135742, 44.09144592285156, 45.7454719543457]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 6.0, 13.0, 8.0, 12.0, 13.0, 19.0, 22.0, 19.0, 22.0, 37.0, 32.0, 38.0, 34.0, 38.0, 43.0, 45.0, 41.0, 36.0, 37.0, 34.0, 49.0, 40.0, 33.0, 35.0, 37.0, 26.0, 32.0, 20.0, 21.0, 30.0, 10.0, 11.0, 20.0, 8.0, 11.0, 10.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-7.26953125, -7.05224609375, -6.8349609375, -6.61767578125, -6.400390625, -6.18310546875, -5.9658203125, -5.74853515625, -5.53125, -5.31396484375, -5.0966796875, -4.87939453125, -4.662109375, -4.44482421875, -4.2275390625, -4.01025390625, -3.79296875, -3.57568359375, -3.3583984375, -3.14111328125, -2.923828125, -2.70654296875, -2.4892578125, -2.27197265625, -2.0546875, -1.83740234375, -1.6201171875, -1.40283203125, -1.185546875, -0.96826171875, -0.7509765625, -0.53369140625, -0.31640625, -0.09912109375, 0.1181640625, 0.33544921875, 0.552734375, 0.77001953125, 0.9873046875, 1.20458984375, 1.421875, 1.63916015625, 1.8564453125, 2.07373046875, 2.291015625, 2.50830078125, 2.7255859375, 2.94287109375, 3.16015625, 3.37744140625, 3.5947265625, 3.81201171875, 4.029296875, 4.24658203125, 4.4638671875, 4.68115234375, 4.8984375, 5.11572265625, 5.3330078125, 5.55029296875, 5.767578125, 5.98486328125, 6.2021484375, 6.41943359375, 6.63671875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 23.0, 19.0, 42.0, 94.0, 165.0, 340.0, 750.0, 1980.0, 6817.0, 49741.0, 2712747.0, 1381576.0, 31642.0, 5281.0, 1746.0, 656.0, 302.0, 149.0, 84.0, 37.0, 28.0, 18.0, 11.0, 10.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -38.00146484375, -36.8466796875, -35.69189453125, -34.537109375, -33.38232421875, -32.2275390625, -31.07275390625, -29.91796875, -28.76318359375, -27.6083984375, -26.45361328125, -25.298828125, -24.14404296875, -22.9892578125, -21.83447265625, -20.6796875, -19.52490234375, -18.3701171875, -17.21533203125, -16.060546875, -14.90576171875, -13.7509765625, -12.59619140625, -11.44140625, -10.28662109375, -9.1318359375, -7.97705078125, -6.822265625, -5.66748046875, -4.5126953125, -3.35791015625, -2.203125, -1.04833984375, 0.1064453125, 1.26123046875, 2.416015625, 3.57080078125, 4.7255859375, 5.88037109375, 7.03515625, 8.18994140625, 9.3447265625, 10.49951171875, 11.654296875, 12.80908203125, 13.9638671875, 15.11865234375, 16.2734375, 17.42822265625, 18.5830078125, 19.73779296875, 20.892578125, 22.04736328125, 23.2021484375, 24.35693359375, 25.51171875, 26.66650390625, 27.8212890625, 28.97607421875, 30.130859375, 31.28564453125, 32.4404296875, 33.59521484375, 34.75]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 8.0, 4.0, 8.0, 9.0, 15.0, 25.0, 25.0, 32.0, 47.0, 54.0, 84.0, 115.0, 145.0, 211.0, 288.0, 388.0, 518.0, 527.0, 424.0, 287.0, 223.0, 140.0, 134.0, 79.0, 72.0, 53.0, 37.0, 32.0, 25.0, 13.0, 12.0, 12.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.37744140625, -10.9970703125, -10.61669921875, -10.236328125, -9.85595703125, -9.4755859375, -9.09521484375, -8.71484375, -8.33447265625, -7.9541015625, -7.57373046875, -7.193359375, -6.81298828125, -6.4326171875, -6.05224609375, -5.671875, -5.29150390625, -4.9111328125, -4.53076171875, -4.150390625, -3.77001953125, -3.3896484375, -3.00927734375, -2.62890625, -2.24853515625, -1.8681640625, -1.48779296875, -1.107421875, -0.72705078125, -0.3466796875, 0.03369140625, 0.4140625, 0.79443359375, 1.1748046875, 1.55517578125, 1.935546875, 2.31591796875, 2.6962890625, 3.07666015625, 3.45703125, 3.83740234375, 4.2177734375, 4.59814453125, 4.978515625, 5.35888671875, 5.7392578125, 6.11962890625, 6.5, 6.88037109375, 7.2607421875, 7.64111328125, 8.021484375, 8.40185546875, 8.7822265625, 9.16259765625, 9.54296875, 9.92333984375, 10.3037109375, 10.68408203125, 11.064453125, 11.44482421875, 11.8251953125, 12.20556640625, 12.5859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 12.0, 17.0, 30.0, 30.0, 57.0, 70.0, 152.0, 218.0, 296.0, 493.0, 793.0, 1349.0, 2648.0, 6444.0, 25066.0, 186356.0, 2621848.0, 1225325.0, 97167.0, 16097.0, 4799.0, 2036.0, 1126.0, 640.0, 399.0, 284.0, 171.0, 94.0, 75.0, 57.0, 35.0, 26.0, 22.0, 14.0, 8.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -20.19091796875, -19.4912109375, -18.79150390625, -18.091796875, -17.39208984375, -16.6923828125, -15.99267578125, -15.29296875, -14.59326171875, -13.8935546875, -13.19384765625, -12.494140625, -11.79443359375, -11.0947265625, -10.39501953125, -9.6953125, -8.99560546875, -8.2958984375, -7.59619140625, -6.896484375, -6.19677734375, -5.4970703125, -4.79736328125, -4.09765625, -3.39794921875, -2.6982421875, -1.99853515625, -1.298828125, -0.59912109375, 0.1005859375, 0.80029296875, 1.5, 2.19970703125, 2.8994140625, 3.59912109375, 4.298828125, 4.99853515625, 5.6982421875, 6.39794921875, 7.09765625, 7.79736328125, 8.4970703125, 9.19677734375, 9.896484375, 10.59619140625, 11.2958984375, 11.99560546875, 12.6953125, 13.39501953125, 14.0947265625, 14.79443359375, 15.494140625, 16.19384765625, 16.8935546875, 17.59326171875, 18.29296875, 18.99267578125, 19.6923828125, 20.39208984375, 21.091796875, 21.79150390625, 22.4912109375, 23.19091796875, 23.890625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 46.0, 168.0, 358.0, 307.0, 103.0, 16.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.52845764160156, -113.49405670166016, -107.45966339111328, -101.42526245117188, -95.390869140625, -89.3564682006836, -83.32206726074219, -77.28767395019531, -71.2532730102539, -65.2188720703125, -59.184478759765625, -53.15007781982422, -47.11568069458008, -41.08128356933594, -35.04688262939453, -29.01248550415039, -22.97808837890625, -16.94369125366211, -10.909292221069336, -4.8748931884765625, 1.1595039367675781, 7.193901062011719, 13.228302001953125, 19.262699127197266, 25.297096252441406, 31.331493377685547, 37.36589050292969, 43.400291442871094, 49.434688568115234, 55.469085693359375, 61.50348663330078, 67.53788757324219, 73.57229614257812, 79.60669708251953, 85.6410903930664, 91.67549133300781, 97.70988464355469, 103.7442855834961, 109.7786865234375, 115.81307983398438, 121.84748077392578, 127.88188171386719, 133.91627502441406, 139.95068359375, 145.98507690429688, 152.01947021484375, 158.05386352539062, 164.08827209472656, 170.12266540527344, 176.1570587158203, 182.19146728515625, 188.22586059570312, 194.26025390625, 200.29464721679688, 206.3290557861328, 212.3634490966797, 218.39785766601562, 224.4322509765625, 230.46665954589844, 236.5010528564453, 242.5354461669922, 248.56985473632812, 254.604248046875, 260.6386413574219, 266.67303466796875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 17.0, 17.0, 25.0, 24.0, 28.0, 26.0, 30.0, 36.0, 33.0, 39.0, 42.0, 47.0, 46.0, 56.0, 50.0, 37.0, 32.0, 44.0, 47.0, 24.0, 40.0, 28.0, 26.0, 25.0, 27.0, 20.0, 17.0, 13.0, 8.0, 11.0, 13.0, 9.0, 5.0, 3.0, 1.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.992488861083984, -51.53632736206055, -50.080169677734375, -48.62400817871094, -47.1678466796875, -45.71168518066406, -44.25552749633789, -42.79936599731445, -41.34320831298828, -39.887046813964844, -38.43088912963867, -36.974727630615234, -35.5185661315918, -34.062408447265625, -32.60624694824219, -31.15008544921875, -29.693923950195312, -28.237764358520508, -26.78160285949707, -25.325443267822266, -23.869281768798828, -22.413122177124023, -20.95696258544922, -19.50080108642578, -18.044641494750977, -16.588481903076172, -15.132320404052734, -13.67616081237793, -12.220000267028809, -10.763839721679688, -9.307680130004883, -7.851519584655762, -6.395362854003906, -4.939202308654785, -3.4830422401428223, -2.0268821716308594, -0.5707216262817383, 0.8854389190673828, 2.3415985107421875, 3.7977590560913086, 5.25391960144043, 6.710080146789551, 8.166240692138672, 9.622400283813477, 11.078560829162598, 12.534721374511719, 13.990880966186523, 15.447041511535645, 16.903202056884766, 18.35936164855957, 19.815523147583008, 21.271682739257812, 22.72784423828125, 24.184003829956055, 25.64016342163086, 27.096324920654297, 28.5524845123291, 30.008644104003906, 31.464805603027344, 32.92096710205078, 34.37712478637695, 35.83328628540039, 37.28944396972656, 38.74560546875, 40.20176696777344]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 8.0, 11.0, 11.0, 14.0, 18.0, 16.0, 18.0, 39.0, 23.0, 26.0, 35.0, 33.0, 43.0, 34.0, 43.0, 40.0, 39.0, 39.0, 46.0, 45.0, 45.0, 42.0, 24.0, 32.0, 25.0, 36.0, 32.0, 29.0, 30.0, 18.0, 9.0, 9.0, 15.0, 10.0, 8.0, 11.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3671875, -6.16961669921875, -5.9720458984375, -5.77447509765625, -5.576904296875, -5.37933349609375, -5.1817626953125, -4.98419189453125, -4.78662109375, -4.58905029296875, -4.3914794921875, -4.19390869140625, -3.996337890625, -3.79876708984375, -3.6011962890625, -3.40362548828125, -3.2060546875, -3.00848388671875, -2.8109130859375, -2.61334228515625, -2.415771484375, -2.21820068359375, -2.0206298828125, -1.82305908203125, -1.62548828125, -1.42791748046875, -1.2303466796875, -1.03277587890625, -0.835205078125, -0.63763427734375, -0.4400634765625, -0.24249267578125, -0.044921875, 0.15264892578125, 0.3502197265625, 0.54779052734375, 0.745361328125, 0.94293212890625, 1.1405029296875, 1.33807373046875, 1.53564453125, 1.73321533203125, 1.9307861328125, 2.12835693359375, 2.325927734375, 2.52349853515625, 2.7210693359375, 2.91864013671875, 3.1162109375, 3.31378173828125, 3.5113525390625, 3.70892333984375, 3.906494140625, 4.10406494140625, 4.3016357421875, 4.49920654296875, 4.69677734375, 4.89434814453125, 5.0919189453125, 5.28948974609375, 5.487060546875, 5.68463134765625, 5.8822021484375, 6.07977294921875, 6.27734375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 6.0, 9.0, 16.0, 25.0, 34.0, 67.0, 98.0, 161.0, 230.0, 384.0, 611.0, 1034.0, 1678.0, 2696.0, 4568.0, 7986.0, 13672.0, 23964.0, 42787.0, 77219.0, 138741.0, 215579.0, 211537.0, 134235.0, 74769.0, 41367.0, 23106.0, 12997.0, 7557.0, 4493.0, 2689.0, 1547.0, 969.0, 673.0, 377.0, 242.0, 149.0, 91.0, 52.0, 43.0, 40.0, 9.0, 15.0, 9.0, 4.0, 1.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.9951171875, -0.964935302734375, -0.93475341796875, -0.904571533203125, -0.8743896484375, -0.844207763671875, -0.81402587890625, -0.783843994140625, -0.753662109375, -0.723480224609375, -0.69329833984375, -0.663116455078125, -0.6329345703125, -0.602752685546875, -0.57257080078125, -0.542388916015625, -0.51220703125, -0.482025146484375, -0.45184326171875, -0.421661376953125, -0.3914794921875, -0.361297607421875, -0.33111572265625, -0.300933837890625, -0.270751953125, -0.240570068359375, -0.21038818359375, -0.180206298828125, -0.1500244140625, -0.119842529296875, -0.08966064453125, -0.059478759765625, -0.029296875, 0.000885009765625, 0.03106689453125, 0.061248779296875, 0.0914306640625, 0.121612548828125, 0.15179443359375, 0.181976318359375, 0.212158203125, 0.242340087890625, 0.27252197265625, 0.302703857421875, 0.3328857421875, 0.363067626953125, 0.39324951171875, 0.423431396484375, 0.45361328125, 0.483795166015625, 0.51397705078125, 0.544158935546875, 0.5743408203125, 0.604522705078125, 0.63470458984375, 0.664886474609375, 0.695068359375, 0.725250244140625, 0.75543212890625, 0.785614013671875, 0.8157958984375, 0.845977783203125, 0.87615966796875, 0.906341552734375, 0.9365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 2.0, 7.0, 12.0, 11.0, 13.0, 20.0, 21.0, 15.0, 26.0, 34.0, 31.0, 32.0, 40.0, 36.0, 28.0, 32.0, 38.0, 36.0, 1072.0, 45.0, 48.0, 29.0, 32.0, 36.0, 28.0, 33.0, 32.0, 32.0, 23.0, 27.0, 31.0, 20.0, 12.0, 9.0, 13.0, 12.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.23046875, -4.10003662109375, -3.9696044921875, -3.83917236328125, -3.708740234375, -3.57830810546875, -3.4478759765625, -3.31744384765625, -3.18701171875, -3.05657958984375, -2.9261474609375, -2.79571533203125, -2.665283203125, -2.53485107421875, -2.4044189453125, -2.27398681640625, -2.1435546875, -2.01312255859375, -1.8826904296875, -1.75225830078125, -1.621826171875, -1.49139404296875, -1.3609619140625, -1.23052978515625, -1.10009765625, -0.96966552734375, -0.8392333984375, -0.70880126953125, -0.578369140625, -0.44793701171875, -0.3175048828125, -0.18707275390625, -0.056640625, 0.07379150390625, 0.2042236328125, 0.33465576171875, 0.465087890625, 0.59552001953125, 0.7259521484375, 0.85638427734375, 0.98681640625, 1.11724853515625, 1.2476806640625, 1.37811279296875, 1.508544921875, 1.63897705078125, 1.7694091796875, 1.89984130859375, 2.0302734375, 2.16070556640625, 2.2911376953125, 2.42156982421875, 2.552001953125, 2.68243408203125, 2.8128662109375, 2.94329833984375, 3.07373046875, 3.20416259765625, 3.3345947265625, 3.46502685546875, 3.595458984375, 3.72589111328125, 3.8563232421875, 3.98675537109375, 4.1171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 10.0, 10.0, 29.0, 27.0, 36.0, 65.0, 104.0, 173.0, 282.0, 498.0, 975.0, 1768.0, 3718.0, 7553.0, 16540.0, 37688.0, 88014.0, 229122.0, 1201425.0, 314063.0, 110076.0, 46416.0, 20151.0, 9354.0, 4383.0, 2161.0, 1069.0, 610.0, 347.0, 168.0, 106.0, 65.0, 41.0, 27.0, 20.0, 13.0, 11.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.7991943359375, -0.770263671875, -0.7413330078125, -0.71240234375, -0.6834716796875, -0.654541015625, -0.6256103515625, -0.5966796875, -0.5677490234375, -0.538818359375, -0.5098876953125, -0.48095703125, -0.4520263671875, -0.423095703125, -0.3941650390625, -0.365234375, -0.3363037109375, -0.307373046875, -0.2784423828125, -0.24951171875, -0.2205810546875, -0.191650390625, -0.1627197265625, -0.1337890625, -0.1048583984375, -0.075927734375, -0.0469970703125, -0.01806640625, 0.0108642578125, 0.039794921875, 0.0687255859375, 0.09765625, 0.1265869140625, 0.155517578125, 0.1844482421875, 0.21337890625, 0.2423095703125, 0.271240234375, 0.3001708984375, 0.3291015625, 0.3580322265625, 0.386962890625, 0.4158935546875, 0.44482421875, 0.4737548828125, 0.502685546875, 0.5316162109375, 0.560546875, 0.5894775390625, 0.618408203125, 0.6473388671875, 0.67626953125, 0.7052001953125, 0.734130859375, 0.7630615234375, 0.7919921875, 0.8209228515625, 0.849853515625, 0.8787841796875, 0.90771484375, 0.9366455078125, 0.965576171875, 0.9945068359375, 1.0234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 11.0, 5.0, 9.0, 23.0, 11.0, 10.0, 30.0, 38.0, 64.0, 99.0, 176.0, 183.0, 105.0, 72.0, 33.0, 15.0, 10.0, 17.0, 10.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.20067787170410156, -0.19322586059570312, -0.1857738494873047, -0.17832183837890625, -0.1708698272705078, -0.16341781616210938, -0.15596580505371094, -0.1485137939453125, -0.14106178283691406, -0.13360977172851562, -0.1261577606201172, -0.11870574951171875, -0.11125373840332031, -0.10380172729492188, -0.09634971618652344, -0.088897705078125, -0.08144569396972656, -0.07399368286132812, -0.06654167175292969, -0.05908966064453125, -0.05163764953613281, -0.044185638427734375, -0.03673362731933594, -0.0292816162109375, -0.021829605102539062, -0.014377593994140625, -0.0069255828857421875, 0.00052642822265625, 0.007978439331054688, 0.015430450439453125, 0.022882461547851562, 0.03033447265625, 0.03778648376464844, 0.045238494873046875, 0.05269050598144531, 0.06014251708984375, 0.06759452819824219, 0.07504653930664062, 0.08249855041503906, 0.0899505615234375, 0.09740257263183594, 0.10485458374023438, 0.11230659484863281, 0.11975860595703125, 0.1272106170654297, 0.13466262817382812, 0.14211463928222656, 0.149566650390625, 0.15701866149902344, 0.16447067260742188, 0.1719226837158203, 0.17937469482421875, 0.1868267059326172, 0.19427871704101562, 0.20173072814941406, 0.2091827392578125, 0.21663475036621094, 0.22408676147460938, 0.2315387725830078, 0.23899078369140625, 0.2464427947998047, 0.2538948059082031, 0.26134681701660156, 0.268798828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 8.0, 3.0, 4.0, 4.0, 10.0, 10.0, 14.0, 38.0, 34.0, 54.0, 83.0, 150.0, 356.0, 1603.0, 1007132.0, 37620.0, 724.0, 270.0, 132.0, 70.0, 71.0, 37.0, 32.0, 13.0, 10.0, 10.0, 9.0, 5.0, 7.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-5.8046875, -5.64697265625, -5.4892578125, -5.33154296875, -5.173828125, -5.01611328125, -4.8583984375, -4.70068359375, -4.54296875, -4.38525390625, -4.2275390625, -4.06982421875, -3.912109375, -3.75439453125, -3.5966796875, -3.43896484375, -3.28125, -3.12353515625, -2.9658203125, -2.80810546875, -2.650390625, -2.49267578125, -2.3349609375, -2.17724609375, -2.01953125, -1.86181640625, -1.7041015625, -1.54638671875, -1.388671875, -1.23095703125, -1.0732421875, -0.91552734375, -0.7578125, -0.60009765625, -0.4423828125, -0.28466796875, -0.126953125, 0.03076171875, 0.1884765625, 0.34619140625, 0.50390625, 0.66162109375, 0.8193359375, 0.97705078125, 1.134765625, 1.29248046875, 1.4501953125, 1.60791015625, 1.765625, 1.92333984375, 2.0810546875, 2.23876953125, 2.396484375, 2.55419921875, 2.7119140625, 2.86962890625, 3.02734375, 3.18505859375, 3.3427734375, 3.50048828125, 3.658203125, 3.81591796875, 3.9736328125, 4.13134765625, 4.2890625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 16.0, 46.0, 85.0, 157.0, 228.0, 194.0, 124.0, 70.0, 41.0, 24.0, 7.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5944207906723022, -0.5831496715545654, -0.5718786120414734, -0.5606074929237366, -0.5493364334106445, -0.5380653142929077, -0.5267942547798157, -0.5155231356620789, -0.5042520761489868, -0.4929809868335724, -0.48170989751815796, -0.47043880820274353, -0.4591677188873291, -0.4478965997695923, -0.43662554025650024, -0.4253544211387634, -0.4140833020210266, -0.4028122127056122, -0.39154112339019775, -0.3802700340747833, -0.3689989447593689, -0.3577278256416321, -0.34645676612854004, -0.3351856470108032, -0.3239145874977112, -0.31264349818229675, -0.3013724088668823, -0.2901013195514679, -0.27883023023605347, -0.26755911111831665, -0.2562880516052246, -0.2450169324874878, -0.23374585807323456, -0.22247476875782013, -0.2112036794424057, -0.19993257522583008, -0.18866148591041565, -0.17739039659500122, -0.1661193072795868, -0.15484821796417236, -0.14357712864875793, -0.1323060393333435, -0.12103494256734848, -0.10976385325193405, -0.09849275648593903, -0.0872216671705246, -0.07595057785511017, -0.06467948108911514, -0.05340838432312012, -0.04213729128241539, -0.030866200104355812, -0.019595108926296234, -0.008324015885591507, 0.00294707715511322, 0.014218166470527649, 0.025489263236522675, 0.0367603525519371, 0.04803144559264183, 0.05930253863334656, 0.07057362794876099, 0.08184471726417542, 0.09311581403017044, 0.10438690334558487, 0.1156580001115799, 0.12692908942699432]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 8.0, 8.0, 11.0, 14.0, 19.0, 15.0, 20.0, 32.0, 16.0, 26.0, 26.0, 29.0, 32.0, 40.0, 38.0, 45.0, 49.0, 43.0, 46.0, 41.0, 36.0, 26.0, 38.0, 22.0, 40.0, 42.0, 28.0, 25.0, 28.0, 24.0, 19.0, 18.0, 12.0, 11.0, 9.0, 14.0, 11.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2128503918647766, -0.20623408257961273, -0.19961777329444885, -0.19300146400928497, -0.1863851547241211, -0.17976884543895721, -0.17315253615379333, -0.16653621196746826, -0.15991991758346558, -0.1533036082983017, -0.14668729901313782, -0.14007098972797394, -0.13345468044281006, -0.12683837115764618, -0.1202220544219017, -0.11360574513673782, -0.10698942840099335, -0.10037311911582947, -0.09375680983066559, -0.08714050054550171, -0.08052419126033783, -0.07390788197517395, -0.06729156523942947, -0.060675255954265594, -0.054058946669101715, -0.047442637383937836, -0.040826328098773956, -0.03421001508831978, -0.0275937058031559, -0.02097739651799202, -0.014361083507537842, -0.007744774222373962, -0.001128464937210083, 0.005487845279276371, 0.012104155495762825, 0.018720466643571854, 0.025336775928735733, 0.03195308521389961, 0.03856939822435379, 0.04518570750951767, 0.05180201679468155, 0.05841832607984543, 0.06503463536500931, 0.07165095210075378, 0.07826726138591766, 0.08488357067108154, 0.09149987995624542, 0.0981161892414093, 0.10473249852657318, 0.11134880781173706, 0.11796511709690094, 0.12458142638206482, 0.1311977356672287, 0.13781404495239258, 0.14443036913871765, 0.15104666352272034, 0.1576629877090454, 0.1642792969942093, 0.17089560627937317, 0.17751191556453705, 0.18412822484970093, 0.1907445341348648, 0.1973608434200287, 0.20397716760635376, 0.21059346199035645]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 3.0, 3.0, 10.0, 13.0, 15.0, 11.0, 12.0, 23.0, 20.0, 31.0, 29.0, 32.0, 36.0, 44.0, 45.0, 38.0, 43.0, 55.0, 59.0, 50.0, 39.0, 45.0, 45.0, 33.0, 33.0, 34.0, 27.0, 26.0, 34.0, 19.0, 16.0, 10.0, 20.0, 9.0, 8.0, 3.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.69427490234375, -6.4744873046875, -6.25469970703125, -6.034912109375, -5.81512451171875, -5.5953369140625, -5.37554931640625, -5.15576171875, -4.93597412109375, -4.7161865234375, -4.49639892578125, -4.276611328125, -4.05682373046875, -3.8370361328125, -3.61724853515625, -3.3974609375, -3.17767333984375, -2.9578857421875, -2.73809814453125, -2.518310546875, -2.29852294921875, -2.0787353515625, -1.85894775390625, -1.63916015625, -1.41937255859375, -1.1995849609375, -0.97979736328125, -0.760009765625, -0.54022216796875, -0.3204345703125, -0.10064697265625, 0.119140625, 0.33892822265625, 0.5587158203125, 0.77850341796875, 0.998291015625, 1.21807861328125, 1.4378662109375, 1.65765380859375, 1.87744140625, 2.09722900390625, 2.3170166015625, 2.53680419921875, 2.756591796875, 2.97637939453125, 3.1961669921875, 3.41595458984375, 3.6357421875, 3.85552978515625, 4.0753173828125, 4.29510498046875, 4.514892578125, 4.73468017578125, 4.9544677734375, 5.17425537109375, 5.39404296875, 5.61383056640625, 5.8336181640625, 6.05340576171875, 6.273193359375, 6.49298095703125, 6.7127685546875, 6.93255615234375, 7.15234375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 10.0, 13.0, 10.0, 31.0, 38.0, 50.0, 73.0, 84.0, 135.0, 213.0, 276.0, 400.0, 690.0, 1110.0, 2070.0, 3920.0, 8509.0, 19021.0, 46472.0, 130425.0, 437748.0, 260383.0, 80439.0, 30559.0, 12936.0, 5844.0, 3000.0, 1536.0, 890.0, 573.0, 322.0, 210.0, 144.0, 102.0, 82.0, 56.0, 50.0, 27.0, 18.0, 25.0, 17.0, 12.0, 11.0, 11.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.765625, -10.4371337890625, -10.108642578125, -9.7801513671875, -9.45166015625, -9.1231689453125, -8.794677734375, -8.4661865234375, -8.1376953125, -7.8092041015625, -7.480712890625, -7.1522216796875, -6.82373046875, -6.4952392578125, -6.166748046875, -5.8382568359375, -5.509765625, -5.1812744140625, -4.852783203125, -4.5242919921875, -4.19580078125, -3.8673095703125, -3.538818359375, -3.2103271484375, -2.8818359375, -2.5533447265625, -2.224853515625, -1.8963623046875, -1.56787109375, -1.2393798828125, -0.910888671875, -0.5823974609375, -0.25390625, 0.0745849609375, 0.403076171875, 0.7315673828125, 1.06005859375, 1.3885498046875, 1.717041015625, 2.0455322265625, 2.3740234375, 2.7025146484375, 3.031005859375, 3.3594970703125, 3.68798828125, 4.0164794921875, 4.344970703125, 4.6734619140625, 5.001953125, 5.3304443359375, 5.658935546875, 5.9874267578125, 6.31591796875, 6.6444091796875, 6.972900390625, 7.3013916015625, 7.6298828125, 7.9583740234375, 8.286865234375, 8.6153564453125, 8.94384765625, 9.2723388671875, 9.600830078125, 9.9293212890625, 10.2578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 8.0, 2.0, 15.0, 16.0, 11.0, 24.0, 16.0, 36.0, 36.0, 40.0, 46.0, 66.0, 69.0, 122.0, 170.0, 1317.0, 303.0, 192.0, 118.0, 114.0, 60.0, 43.0, 29.0, 31.0, 26.0, 20.0, 17.0, 15.0, 18.0, 8.0, 14.0, 4.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.078125, -15.522216796875, -14.96630859375, -14.410400390625, -13.8544921875, -13.298583984375, -12.74267578125, -12.186767578125, -11.630859375, -11.074951171875, -10.51904296875, -9.963134765625, -9.4072265625, -8.851318359375, -8.29541015625, -7.739501953125, -7.18359375, -6.627685546875, -6.07177734375, -5.515869140625, -4.9599609375, -4.404052734375, -3.84814453125, -3.292236328125, -2.736328125, -2.180419921875, -1.62451171875, -1.068603515625, -0.5126953125, 0.043212890625, 0.59912109375, 1.155029296875, 1.7109375, 2.266845703125, 2.82275390625, 3.378662109375, 3.9345703125, 4.490478515625, 5.04638671875, 5.602294921875, 6.158203125, 6.714111328125, 7.27001953125, 7.825927734375, 8.3818359375, 8.937744140625, 9.49365234375, 10.049560546875, 10.60546875, 11.161376953125, 11.71728515625, 12.273193359375, 12.8291015625, 13.385009765625, 13.94091796875, 14.496826171875, 15.052734375, 15.608642578125, 16.16455078125, 16.720458984375, 17.2763671875, 17.832275390625, 18.38818359375, 18.944091796875, 19.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 17.0, 12.0, 21.0, 32.0, 43.0, 58.0, 80.0, 103.0, 174.0, 288.0, 478.0, 966.0, 2263.0, 8378.0, 306322.0, 2803186.0, 17152.0, 3285.0, 1199.0, 599.0, 312.0, 197.0, 160.0, 77.0, 75.0, 40.0, 34.0, 32.0, 18.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-59.875, -58.2197265625, -56.564453125, -54.9091796875, -53.25390625, -51.5986328125, -49.943359375, -48.2880859375, -46.6328125, -44.9775390625, -43.322265625, -41.6669921875, -40.01171875, -38.3564453125, -36.701171875, -35.0458984375, -33.390625, -31.7353515625, -30.080078125, -28.4248046875, -26.76953125, -25.1142578125, -23.458984375, -21.8037109375, -20.1484375, -18.4931640625, -16.837890625, -15.1826171875, -13.52734375, -11.8720703125, -10.216796875, -8.5615234375, -6.90625, -5.2509765625, -3.595703125, -1.9404296875, -0.28515625, 1.3701171875, 3.025390625, 4.6806640625, 6.3359375, 7.9912109375, 9.646484375, 11.3017578125, 12.95703125, 14.6123046875, 16.267578125, 17.9228515625, 19.578125, 21.2333984375, 22.888671875, 24.5439453125, 26.19921875, 27.8544921875, 29.509765625, 31.1650390625, 32.8203125, 34.4755859375, 36.130859375, 37.7861328125, 39.44140625, 41.0966796875, 42.751953125, 44.4072265625, 46.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 11.0, 12.0, 49.0, 89.0, 217.0, 302.0, 196.0, 83.0, 28.0, 15.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.4060516357422, -126.72715759277344, -119.04825592041016, -111.3693618774414, -103.69046020507812, -96.01156616210938, -88.33267211914062, -80.65377807617188, -72.9748764038086, -65.29598236083984, -57.61708068847656, -49.93818664550781, -42.2592887878418, -34.58039093017578, -26.90149688720703, -19.222599029541016, -11.543701171875, -3.864804267883301, 3.8140926361083984, 11.492988586425781, 19.171886444091797, 26.850784301757812, 34.52967834472656, 42.20857620239258, 49.887474060058594, 57.56637191772461, 65.24526977539062, 72.92416381835938, 80.60305786132812, 88.2819595336914, 95.96085357666016, 103.63975524902344, 111.31863403320312, 118.99752807617188, 126.67642974853516, 134.35531616210938, 142.0342254638672, 149.71311950683594, 157.3920135498047, 165.07090759277344, 172.74981689453125, 180.4287109375, 188.10760498046875, 195.7864990234375, 203.4654083251953, 211.14430236816406, 218.8231964111328, 226.50209045410156, 234.1809844970703, 241.85987854003906, 249.5387725830078, 257.2176818847656, 264.8965759277344, 272.5754699707031, 280.2543640136719, 287.9332580566406, 295.6121520996094, 303.2910461425781, 310.9699401855469, 318.6488342285156, 326.3277282714844, 334.00665283203125, 341.685546875, 349.36444091796875, 357.0433349609375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 7.0, 10.0, 8.0, 14.0, 13.0, 14.0, 20.0, 19.0, 22.0, 29.0, 28.0, 23.0, 39.0, 36.0, 35.0, 37.0, 46.0, 42.0, 35.0, 30.0, 47.0, 35.0, 40.0, 37.0, 26.0, 32.0, 35.0, 33.0, 31.0, 18.0, 21.0, 17.0, 12.0, 15.0, 19.0, 16.0, 12.0, 8.0, 2.0, 8.0, 10.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-58.33087158203125, -56.54862976074219, -54.766387939453125, -52.98414611816406, -51.201904296875, -49.41966247558594, -47.637420654296875, -45.85517883300781, -44.07293701171875, -42.29069519042969, -40.508453369140625, -38.72621154785156, -36.9439697265625, -35.16172790527344, -33.379486083984375, -31.597244262695312, -29.815004348754883, -28.03276252746582, -26.250520706176758, -24.468278884887695, -22.686037063598633, -20.903797149658203, -19.12155532836914, -17.339313507080078, -15.5570707321167, -13.774828910827637, -11.992587089538574, -10.210346221923828, -8.428104400634766, -6.645862579345703, -4.863620758056641, -3.081378936767578, -1.2991371154785156, 0.4831045866012573, 2.2653462886810303, 4.047587871551514, 5.829829692840576, 7.6120710372924805, 9.394312858581543, 11.176554679870605, 12.958796501159668, 14.74103832244873, 16.523279190063477, 18.30552101135254, 20.0877628326416, 21.870004653930664, 23.652246475219727, 25.43448829650879, 27.21673011779785, 28.998971939086914, 30.781213760375977, 32.563453674316406, 34.34569549560547, 36.12793731689453, 37.910179138183594, 39.692420959472656, 41.47466278076172, 43.25690460205078, 45.039146423339844, 46.821388244628906, 48.60363006591797, 50.38587188720703, 52.168113708496094, 53.950355529785156, 55.73259735107422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 10.0, 8.0, 16.0, 18.0, 19.0, 22.0, 19.0, 21.0, 35.0, 39.0, 47.0, 45.0, 38.0, 57.0, 47.0, 53.0, 49.0, 39.0, 47.0, 45.0, 43.0, 35.0, 40.0, 38.0, 18.0, 36.0, 24.0, 18.0, 17.0, 9.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.71832275390625, -7.4757080078125, -7.23309326171875, -6.990478515625, -6.74786376953125, -6.5052490234375, -6.26263427734375, -6.02001953125, -5.77740478515625, -5.5347900390625, -5.29217529296875, -5.049560546875, -4.80694580078125, -4.5643310546875, -4.32171630859375, -4.0791015625, -3.83648681640625, -3.5938720703125, -3.35125732421875, -3.108642578125, -2.86602783203125, -2.6234130859375, -2.38079833984375, -2.13818359375, -1.89556884765625, -1.6529541015625, -1.41033935546875, -1.167724609375, -0.92510986328125, -0.6824951171875, -0.43988037109375, -0.197265625, 0.04534912109375, 0.2879638671875, 0.53057861328125, 0.773193359375, 1.01580810546875, 1.2584228515625, 1.50103759765625, 1.74365234375, 1.98626708984375, 2.2288818359375, 2.47149658203125, 2.714111328125, 2.95672607421875, 3.1993408203125, 3.44195556640625, 3.6845703125, 3.92718505859375, 4.1697998046875, 4.41241455078125, 4.655029296875, 4.89764404296875, 5.1402587890625, 5.38287353515625, 5.62548828125, 5.86810302734375, 6.1107177734375, 6.35333251953125, 6.595947265625, 6.83856201171875, 7.0811767578125, 7.32379150390625, 7.56640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 16.0, 36.0, 50.0, 101.0, 213.0, 340.0, 625.0, 1265.0, 2800.0, 7883.0, 37499.0, 716910.0, 3191976.0, 205563.0, 19701.0, 5057.0, 2032.0, 994.0, 517.0, 307.0, 159.0, 97.0, 37.0, 32.0, 11.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-26.625, -25.80126953125, -24.9775390625, -24.15380859375, -23.330078125, -22.50634765625, -21.6826171875, -20.85888671875, -20.03515625, -19.21142578125, -18.3876953125, -17.56396484375, -16.740234375, -15.91650390625, -15.0927734375, -14.26904296875, -13.4453125, -12.62158203125, -11.7978515625, -10.97412109375, -10.150390625, -9.32666015625, -8.5029296875, -7.67919921875, -6.85546875, -6.03173828125, -5.2080078125, -4.38427734375, -3.560546875, -2.73681640625, -1.9130859375, -1.08935546875, -0.265625, 0.55810546875, 1.3818359375, 2.20556640625, 3.029296875, 3.85302734375, 4.6767578125, 5.50048828125, 6.32421875, 7.14794921875, 7.9716796875, 8.79541015625, 9.619140625, 10.44287109375, 11.2666015625, 12.09033203125, 12.9140625, 13.73779296875, 14.5615234375, 15.38525390625, 16.208984375, 17.03271484375, 17.8564453125, 18.68017578125, 19.50390625, 20.32763671875, 21.1513671875, 21.97509765625, 22.798828125, 23.62255859375, 24.4462890625, 25.27001953125, 26.09375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 9.0, 15.0, 16.0, 23.0, 31.0, 47.0, 56.0, 97.0, 112.0, 179.0, 235.0, 300.0, 422.0, 550.0, 528.0, 416.0, 294.0, 204.0, 165.0, 107.0, 80.0, 45.0, 37.0, 27.0, 21.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.203125, -11.7933349609375, -11.383544921875, -10.9737548828125, -10.56396484375, -10.1541748046875, -9.744384765625, -9.3345947265625, -8.9248046875, -8.5150146484375, -8.105224609375, -7.6954345703125, -7.28564453125, -6.8758544921875, -6.466064453125, -6.0562744140625, -5.646484375, -5.2366943359375, -4.826904296875, -4.4171142578125, -4.00732421875, -3.5975341796875, -3.187744140625, -2.7779541015625, -2.3681640625, -1.9583740234375, -1.548583984375, -1.1387939453125, -0.72900390625, -0.3192138671875, 0.090576171875, 0.5003662109375, 0.91015625, 1.3199462890625, 1.729736328125, 2.1395263671875, 2.54931640625, 2.9591064453125, 3.368896484375, 3.7786865234375, 4.1884765625, 4.5982666015625, 5.008056640625, 5.4178466796875, 5.82763671875, 6.2374267578125, 6.647216796875, 7.0570068359375, 7.466796875, 7.8765869140625, 8.286376953125, 8.6961669921875, 9.10595703125, 9.5157470703125, 9.925537109375, 10.3353271484375, 10.7451171875, 11.1549072265625, 11.564697265625, 11.9744873046875, 12.38427734375, 12.7940673828125, 13.203857421875, 13.6136474609375, 14.0234375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 5.0, 13.0, 12.0, 10.0, 21.0, 23.0, 26.0, 37.0, 52.0, 81.0, 107.0, 214.0, 306.0, 512.0, 991.0, 2107.0, 5296.0, 19933.0, 187283.0, 3434187.0, 497211.0, 32969.0, 7409.0, 2641.0, 1153.0, 646.0, 340.0, 215.0, 140.0, 102.0, 58.0, 43.0, 38.0, 28.0, 22.0, 13.0, 10.0, 8.0, 4.0, 8.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.369140625, -27.47265625, -26.576171875, -25.6796875, -24.783203125, -23.88671875, -22.990234375, -22.09375, -21.197265625, -20.30078125, -19.404296875, -18.5078125, -17.611328125, -16.71484375, -15.818359375, -14.921875, -14.025390625, -13.12890625, -12.232421875, -11.3359375, -10.439453125, -9.54296875, -8.646484375, -7.75, -6.853515625, -5.95703125, -5.060546875, -4.1640625, -3.267578125, -2.37109375, -1.474609375, -0.578125, 0.318359375, 1.21484375, 2.111328125, 3.0078125, 3.904296875, 4.80078125, 5.697265625, 6.59375, 7.490234375, 8.38671875, 9.283203125, 10.1796875, 11.076171875, 11.97265625, 12.869140625, 13.765625, 14.662109375, 15.55859375, 16.455078125, 17.3515625, 18.248046875, 19.14453125, 20.041015625, 20.9375, 21.833984375, 22.73046875, 23.626953125, 24.5234375, 25.419921875, 26.31640625, 27.212890625, 28.109375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 149.0, 743.0, 110.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-850.8346557617188, -834.6129760742188, -818.3912963867188, -802.169677734375, -785.947998046875, -769.726318359375, -753.504638671875, -737.282958984375, -721.0613403320312, -704.8396606445312, -688.6179809570312, -672.3963623046875, -656.1746826171875, -639.9530029296875, -623.7313232421875, -607.5096435546875, -591.2879638671875, -575.0662841796875, -558.8446044921875, -542.6229858398438, -526.4013061523438, -510.17962646484375, -493.95794677734375, -477.7362976074219, -461.5146484375, -445.29296875, -429.0713195800781, -412.8496398925781, -396.62799072265625, -380.40631103515625, -364.18463134765625, -347.9629821777344, -331.74139404296875, -315.51971435546875, -299.2980651855469, -283.0763854980469, -266.854736328125, -250.633056640625, -234.41139221191406, -218.18972778320312, -201.96804809570312, -185.7463836669922, -169.52471923828125, -153.30303955078125, -137.08139038085938, -120.8597183227539, -104.63804626464844, -88.4163818359375, -72.19471740722656, -55.973052978515625, -39.75138473510742, -23.52971649169922, -7.308052062988281, 8.913612365722656, 25.135284423828125, 41.35694885253906, 57.57861328125, 73.80027770996094, 90.02194213867188, 106.24361419677734, 122.46527862548828, 138.68695068359375, 154.9086151123047, 171.13027954101562, 187.35194396972656]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 7.0, 11.0, 14.0, 28.0, 27.0, 31.0, 43.0, 32.0, 29.0, 44.0, 43.0, 60.0, 45.0, 51.0, 54.0, 54.0, 57.0, 50.0, 50.0, 34.0, 49.0, 38.0, 30.0, 22.0, 26.0, 8.0, 11.0, 7.0, 8.0, 9.0, 2.0, 5.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.5804557800293, -61.82351303100586, -60.066566467285156, -58.30962371826172, -56.55268096923828, -54.795738220214844, -53.038795471191406, -51.2818489074707, -49.524906158447266, -47.76796340942383, -46.011016845703125, -44.25407409667969, -42.49713134765625, -40.74018859863281, -38.983245849609375, -37.22629928588867, -35.469356536865234, -33.7124137878418, -31.955469131469727, -30.198524475097656, -28.44158172607422, -26.68463897705078, -24.92769432067871, -23.17074966430664, -21.413806915283203, -19.656864166259766, -17.899919509887695, -16.142974853515625, -14.386032104492188, -12.629088401794434, -10.87214469909668, -9.115200996398926, -7.3582611083984375, -5.601317405700684, -3.8443737030029297, -2.087430000305176, -0.3304862976074219, 1.426457405090332, 3.183401107788086, 4.94034481048584, 6.697288513183594, 8.454232215881348, 10.211175918579102, 11.968119621276855, 13.72506332397461, 15.482007026672363, 17.238950729370117, 18.995895385742188, 20.752838134765625, 22.509780883789062, 24.266725540161133, 26.023670196533203, 27.78061294555664, 29.537555694580078, 31.29450035095215, 33.05144500732422, 34.808387756347656, 36.565330505371094, 38.32227325439453, 40.079219818115234, 41.83616256713867, 43.59310531616211, 45.35005187988281, 47.10699462890625, 48.86393737792969]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 8.0, 5.0, 10.0, 8.0, 6.0, 11.0, 13.0, 19.0, 17.0, 32.0, 28.0, 42.0, 35.0, 30.0, 31.0, 39.0, 27.0, 42.0, 38.0, 48.0, 42.0, 32.0, 41.0, 30.0, 37.0, 31.0, 31.0, 38.0, 25.0, 38.0, 20.0, 24.0, 22.0, 11.0, 11.0, 15.0, 12.0, 9.0, 7.0, 7.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4140625, -6.23529052734375, -6.0565185546875, -5.87774658203125, -5.698974609375, -5.52020263671875, -5.3414306640625, -5.16265869140625, -4.98388671875, -4.80511474609375, -4.6263427734375, -4.44757080078125, -4.268798828125, -4.09002685546875, -3.9112548828125, -3.73248291015625, -3.5537109375, -3.37493896484375, -3.1961669921875, -3.01739501953125, -2.838623046875, -2.65985107421875, -2.4810791015625, -2.30230712890625, -2.12353515625, -1.94476318359375, -1.7659912109375, -1.58721923828125, -1.408447265625, -1.22967529296875, -1.0509033203125, -0.87213134765625, -0.693359375, -0.51458740234375, -0.3358154296875, -0.15704345703125, 0.021728515625, 0.20050048828125, 0.3792724609375, 0.55804443359375, 0.73681640625, 0.91558837890625, 1.0943603515625, 1.27313232421875, 1.451904296875, 1.63067626953125, 1.8094482421875, 1.98822021484375, 2.1669921875, 2.34576416015625, 2.5245361328125, 2.70330810546875, 2.882080078125, 3.06085205078125, 3.2396240234375, 3.41839599609375, 3.59716796875, 3.77593994140625, 3.9547119140625, 4.13348388671875, 4.312255859375, 4.49102783203125, 4.6697998046875, 4.84857177734375, 5.02734375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 9.0, 9.0, 18.0, 22.0, 25.0, 43.0, 65.0, 81.0, 105.0, 184.0, 309.0, 519.0, 979.0, 1955.0, 4515.0, 13742.0, 62913.0, 571479.0, 334288.0, 39802.0, 10215.0, 3593.0, 1621.0, 858.0, 450.0, 261.0, 159.0, 105.0, 69.0, 42.0, 41.0, 15.0, 17.0, 16.0, 10.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.798828125, -3.671661376953125, -3.54449462890625, -3.417327880859375, -3.2901611328125, -3.162994384765625, -3.03582763671875, -2.908660888671875, -2.781494140625, -2.654327392578125, -2.52716064453125, -2.399993896484375, -2.2728271484375, -2.145660400390625, -2.01849365234375, -1.891326904296875, -1.76416015625, -1.636993408203125, -1.50982666015625, -1.382659912109375, -1.2554931640625, -1.128326416015625, -1.00115966796875, -0.873992919921875, -0.746826171875, -0.619659423828125, -0.49249267578125, -0.365325927734375, -0.2381591796875, -0.110992431640625, 0.01617431640625, 0.143341064453125, 0.2705078125, 0.397674560546875, 0.52484130859375, 0.652008056640625, 0.7791748046875, 0.906341552734375, 1.03350830078125, 1.160675048828125, 1.287841796875, 1.415008544921875, 1.54217529296875, 1.669342041015625, 1.7965087890625, 1.923675537109375, 2.05084228515625, 2.178009033203125, 2.30517578125, 2.432342529296875, 2.55950927734375, 2.686676025390625, 2.8138427734375, 2.941009521484375, 3.06817626953125, 3.195343017578125, 3.322509765625, 3.449676513671875, 3.57684326171875, 3.704010009765625, 3.8311767578125, 3.958343505859375, 4.08551025390625, 4.212677001953125, 4.33984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 12.0, 9.0, 18.0, 13.0, 20.0, 17.0, 22.0, 31.0, 32.0, 46.0, 37.0, 45.0, 36.0, 50.0, 37.0, 1064.0, 41.0, 53.0, 37.0, 41.0, 30.0, 35.0, 41.0, 31.0, 33.0, 17.0, 20.0, 25.0, 19.0, 17.0, 9.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.89453125, -3.7547607421875, -3.614990234375, -3.4752197265625, -3.33544921875, -3.1956787109375, -3.055908203125, -2.9161376953125, -2.7763671875, -2.6365966796875, -2.496826171875, -2.3570556640625, -2.21728515625, -2.0775146484375, -1.937744140625, -1.7979736328125, -1.658203125, -1.5184326171875, -1.378662109375, -1.2388916015625, -1.09912109375, -0.9593505859375, -0.819580078125, -0.6798095703125, -0.5400390625, -0.4002685546875, -0.260498046875, -0.1207275390625, 0.01904296875, 0.1588134765625, 0.298583984375, 0.4383544921875, 0.578125, 0.7178955078125, 0.857666015625, 0.9974365234375, 1.13720703125, 1.2769775390625, 1.416748046875, 1.5565185546875, 1.6962890625, 1.8360595703125, 1.975830078125, 2.1156005859375, 2.25537109375, 2.3951416015625, 2.534912109375, 2.6746826171875, 2.814453125, 2.9542236328125, 3.093994140625, 3.2337646484375, 3.37353515625, 3.5133056640625, 3.653076171875, 3.7928466796875, 3.9326171875, 4.0723876953125, 4.212158203125, 4.3519287109375, 4.49169921875, 4.6314697265625, 4.771240234375, 4.9110107421875, 5.05078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 12.0, 14.0, 18.0, 42.0, 34.0, 49.0, 62.0, 86.0, 155.0, 274.0, 432.0, 669.0, 1142.0, 2191.0, 4698.0, 12763.0, 57125.0, 888868.0, 1047063.0, 58280.0, 13099.0, 4781.0, 2225.0, 1190.0, 669.0, 427.0, 255.0, 167.0, 91.0, 64.0, 53.0, 32.0, 27.0, 23.0, 16.0, 12.0, 7.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.92578125, -2.839752197265625, -2.75372314453125, -2.667694091796875, -2.5816650390625, -2.495635986328125, -2.40960693359375, -2.323577880859375, -2.237548828125, -2.151519775390625, -2.06549072265625, -1.979461669921875, -1.8934326171875, -1.807403564453125, -1.72137451171875, -1.635345458984375, -1.54931640625, -1.463287353515625, -1.37725830078125, -1.291229248046875, -1.2052001953125, -1.119171142578125, -1.03314208984375, -0.947113037109375, -0.861083984375, -0.775054931640625, -0.68902587890625, -0.602996826171875, -0.5169677734375, -0.430938720703125, -0.34490966796875, -0.258880615234375, -0.1728515625, -0.086822509765625, -0.00079345703125, 0.085235595703125, 0.1712646484375, 0.257293701171875, 0.34332275390625, 0.429351806640625, 0.515380859375, 0.601409912109375, 0.68743896484375, 0.773468017578125, 0.8594970703125, 0.945526123046875, 1.03155517578125, 1.117584228515625, 1.20361328125, 1.289642333984375, 1.37567138671875, 1.461700439453125, 1.5477294921875, 1.633758544921875, 1.71978759765625, 1.805816650390625, 1.891845703125, 1.977874755859375, 2.06390380859375, 2.149932861328125, 2.2359619140625, 2.321990966796875, 2.40802001953125, 2.494049072265625, 2.580078125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 6.0, 6.0, 10.0, 47.0, 77.0, 179.0, 318.0, 146.0, 91.0, 39.0, 14.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3583984375, -0.34799957275390625, -0.3376007080078125, -0.32720184326171875, -0.316802978515625, -0.30640411376953125, -0.2960052490234375, -0.28560638427734375, -0.27520751953125, -0.26480865478515625, -0.2544097900390625, -0.24401092529296875, -0.233612060546875, -0.22321319580078125, -0.2128143310546875, -0.20241546630859375, -0.1920166015625, -0.18161773681640625, -0.1712188720703125, -0.16082000732421875, -0.150421142578125, -0.14002227783203125, -0.1296234130859375, -0.11922454833984375, -0.10882568359375, -0.09842681884765625, -0.0880279541015625, -0.07762908935546875, -0.067230224609375, -0.05683135986328125, -0.0464324951171875, -0.03603363037109375, -0.025634765625, -0.01523590087890625, -0.0048370361328125, 0.00556182861328125, 0.015960693359375, 0.02635955810546875, 0.0367584228515625, 0.04715728759765625, 0.05755615234375, 0.06795501708984375, 0.0783538818359375, 0.08875274658203125, 0.099151611328125, 0.10955047607421875, 0.1199493408203125, 0.13034820556640625, 0.1407470703125, 0.15114593505859375, 0.1615447998046875, 0.17194366455078125, 0.182342529296875, 0.19274139404296875, 0.2031402587890625, 0.21353912353515625, 0.22393798828125, 0.23433685302734375, 0.2447357177734375, 0.25513458251953125, 0.265533447265625, 0.27593231201171875, 0.2863311767578125, 0.29673004150390625, 0.30712890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 9.0, 7.0, 15.0, 11.0, 18.0, 16.0, 28.0, 43.0, 89.0, 215.0, 915.0, 6507.0, 1007919.0, 30116.0, 1938.0, 378.0, 111.0, 49.0, 30.0, 22.0, 16.0, 26.0, 21.0, 8.0, 2.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.75390625, -4.593994140625, -4.43408203125, -4.274169921875, -4.1142578125, -3.954345703125, -3.79443359375, -3.634521484375, -3.474609375, -3.314697265625, -3.15478515625, -2.994873046875, -2.8349609375, -2.675048828125, -2.51513671875, -2.355224609375, -2.1953125, -2.035400390625, -1.87548828125, -1.715576171875, -1.5556640625, -1.395751953125, -1.23583984375, -1.075927734375, -0.916015625, -0.756103515625, -0.59619140625, -0.436279296875, -0.2763671875, -0.116455078125, 0.04345703125, 0.203369140625, 0.36328125, 0.523193359375, 0.68310546875, 0.843017578125, 1.0029296875, 1.162841796875, 1.32275390625, 1.482666015625, 1.642578125, 1.802490234375, 1.96240234375, 2.122314453125, 2.2822265625, 2.442138671875, 2.60205078125, 2.761962890625, 2.921875, 3.081787109375, 3.24169921875, 3.401611328125, 3.5615234375, 3.721435546875, 3.88134765625, 4.041259765625, 4.201171875, 4.361083984375, 4.52099609375, 4.680908203125, 4.8408203125, 5.000732421875, 5.16064453125, 5.320556640625, 5.48046875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 12.0, 50.0, 181.0, 298.0, 274.0, 108.0, 50.0, 23.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1471014022827148, -1.1257257461547852, -1.1043500900268555, -1.0829743146896362, -1.0615986585617065, -1.0402230024337769, -1.0188473463058472, -0.9974716305732727, -0.9760959148406982, -0.9547202587127686, -0.9333445429801941, -0.9119688868522644, -0.8905931711196899, -0.8692175149917603, -0.8478418588638306, -0.8264661431312561, -0.8050904870033264, -0.7837148308753967, -0.7623391151428223, -0.7409634590148926, -0.7195877432823181, -0.6982120871543884, -0.676836371421814, -0.6554607152938843, -0.6340850591659546, -0.6127094030380249, -0.5913336873054504, -0.5699580311775208, -0.5485823154449463, -0.5272066593170166, -0.5058310031890869, -0.48445528745651245, -0.4630795121192932, -0.44170382618904114, -0.42032814025878906, -0.3989524841308594, -0.3775767683982849, -0.3562011122703552, -0.33482542634010315, -0.3134497404098511, -0.2920740842819214, -0.2706983983516693, -0.24932271242141724, -0.22794704139232635, -0.20657135546207428, -0.1851956695318222, -0.16381999850273132, -0.14244431257247925, -0.12106861174106598, -0.0996929258108139, -0.07831724733114243, -0.05694156885147095, -0.03556588292121887, -0.014190196990966797, 0.0071854740381240845, 0.02856115996837616, 0.049936845898628235, 0.07131253182888031, 0.09268821030855179, 0.11406388878822327, 0.13543957471847534, 0.15681526064872742, 0.1781909316778183, 0.19956661760807037, 0.22094230353832245]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 8.0, 8.0, 14.0, 9.0, 20.0, 28.0, 31.0, 34.0, 35.0, 32.0, 45.0, 57.0, 54.0, 55.0, 42.0, 45.0, 57.0, 54.0, 47.0, 42.0, 38.0, 31.0, 40.0, 24.0, 28.0, 29.0, 23.0, 12.0, 19.0, 8.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21800941228866577, -0.2108687162399292, -0.20372800529003143, -0.19658729434013367, -0.1894465982913971, -0.18230590224266052, -0.17516519129276276, -0.168024480342865, -0.16088378429412842, -0.15374308824539185, -0.14660237729549408, -0.1394616663455963, -0.13232097029685974, -0.12518027424812317, -0.1180395632982254, -0.11089885979890823, -0.10375815629959106, -0.0966174528002739, -0.08947674930095673, -0.08233604580163956, -0.07519534230232239, -0.06805463880300522, -0.06091393530368805, -0.05377323180437088, -0.04663252830505371, -0.03949182480573654, -0.03235112130641937, -0.025210417807102203, -0.018069714307785034, -0.010929010808467865, -0.003788307309150696, 0.0033523961901664734, 0.010493099689483643, 0.017633803188800812, 0.02477450668811798, 0.03191521018743515, 0.03905591368675232, 0.04619661718606949, 0.05333732068538666, 0.06047802418470383, 0.067618727684021, 0.07475943118333817, 0.08190013468265533, 0.0890408381819725, 0.09618154168128967, 0.10332224518060684, 0.11046294867992401, 0.11760365217924118, 0.12474435567855835, 0.13188505172729492, 0.1390257626771927, 0.14616647362709045, 0.15330716967582703, 0.1604478657245636, 0.16758857667446136, 0.17472928762435913, 0.1818699836730957, 0.18901067972183228, 0.19615139067173004, 0.2032921016216278, 0.21043279767036438, 0.21757349371910095, 0.22471420466899872, 0.23185491561889648, 0.23899561166763306]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 8.0, 4.0, 10.0, 10.0, 6.0, 13.0, 19.0, 13.0, 14.0, 24.0, 20.0, 29.0, 43.0, 30.0, 39.0, 33.0, 38.0, 54.0, 36.0, 28.0, 45.0, 35.0, 45.0, 35.0, 36.0, 42.0, 44.0, 32.0, 30.0, 18.0, 27.0, 25.0, 26.0, 17.0, 17.0, 10.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-7.23828125, -7.0443115234375, -6.850341796875, -6.6563720703125, -6.46240234375, -6.2684326171875, -6.074462890625, -5.8804931640625, -5.6865234375, -5.4925537109375, -5.298583984375, -5.1046142578125, -4.91064453125, -4.7166748046875, -4.522705078125, -4.3287353515625, -4.134765625, -3.9407958984375, -3.746826171875, -3.5528564453125, -3.35888671875, -3.1649169921875, -2.970947265625, -2.7769775390625, -2.5830078125, -2.3890380859375, -2.195068359375, -2.0010986328125, -1.80712890625, -1.6131591796875, -1.419189453125, -1.2252197265625, -1.03125, -0.8372802734375, -0.643310546875, -0.4493408203125, -0.25537109375, -0.0614013671875, 0.132568359375, 0.3265380859375, 0.5205078125, 0.7144775390625, 0.908447265625, 1.1024169921875, 1.29638671875, 1.4903564453125, 1.684326171875, 1.8782958984375, 2.072265625, 2.2662353515625, 2.460205078125, 2.6541748046875, 2.84814453125, 3.0421142578125, 3.236083984375, 3.4300537109375, 3.6240234375, 3.8179931640625, 4.011962890625, 4.2059326171875, 4.39990234375, 4.5938720703125, 4.787841796875, 4.9818115234375, 5.17578125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 10.0, 7.0, 16.0, 17.0, 21.0, 26.0, 31.0, 46.0, 55.0, 83.0, 127.0, 172.0, 224.0, 341.0, 426.0, 690.0, 1160.0, 2233.0, 4937.0, 12312.0, 37827.0, 151004.0, 500277.0, 248336.0, 57480.0, 17310.0, 6492.0, 2869.0, 1402.0, 792.0, 523.0, 389.0, 235.0, 183.0, 133.0, 116.0, 76.0, 42.0, 37.0, 24.0, 21.0, 15.0, 9.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.51904296875, -8.2412109375, -7.96337890625, -7.685546875, -7.40771484375, -7.1298828125, -6.85205078125, -6.57421875, -6.29638671875, -6.0185546875, -5.74072265625, -5.462890625, -5.18505859375, -4.9072265625, -4.62939453125, -4.3515625, -4.07373046875, -3.7958984375, -3.51806640625, -3.240234375, -2.96240234375, -2.6845703125, -2.40673828125, -2.12890625, -1.85107421875, -1.5732421875, -1.29541015625, -1.017578125, -0.73974609375, -0.4619140625, -0.18408203125, 0.09375, 0.37158203125, 0.6494140625, 0.92724609375, 1.205078125, 1.48291015625, 1.7607421875, 2.03857421875, 2.31640625, 2.59423828125, 2.8720703125, 3.14990234375, 3.427734375, 3.70556640625, 3.9833984375, 4.26123046875, 4.5390625, 4.81689453125, 5.0947265625, 5.37255859375, 5.650390625, 5.92822265625, 6.2060546875, 6.48388671875, 6.76171875, 7.03955078125, 7.3173828125, 7.59521484375, 7.873046875, 8.15087890625, 8.4287109375, 8.70654296875, 8.984375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 17.0, 7.0, 9.0, 19.0, 21.0, 24.0, 20.0, 22.0, 31.0, 51.0, 55.0, 64.0, 88.0, 153.0, 287.0, 1385.0, 208.0, 129.0, 76.0, 70.0, 59.0, 44.0, 35.0, 18.0, 22.0, 18.0, 21.0, 11.0, 15.0, 11.0, 7.0, 9.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.8125, -15.270751953125, -14.72900390625, -14.187255859375, -13.6455078125, -13.103759765625, -12.56201171875, -12.020263671875, -11.478515625, -10.936767578125, -10.39501953125, -9.853271484375, -9.3115234375, -8.769775390625, -8.22802734375, -7.686279296875, -7.14453125, -6.602783203125, -6.06103515625, -5.519287109375, -4.9775390625, -4.435791015625, -3.89404296875, -3.352294921875, -2.810546875, -2.268798828125, -1.72705078125, -1.185302734375, -0.6435546875, -0.101806640625, 0.43994140625, 0.981689453125, 1.5234375, 2.065185546875, 2.60693359375, 3.148681640625, 3.6904296875, 4.232177734375, 4.77392578125, 5.315673828125, 5.857421875, 6.399169921875, 6.94091796875, 7.482666015625, 8.0244140625, 8.566162109375, 9.10791015625, 9.649658203125, 10.19140625, 10.733154296875, 11.27490234375, 11.816650390625, 12.3583984375, 12.900146484375, 13.44189453125, 13.983642578125, 14.525390625, 15.067138671875, 15.60888671875, 16.150634765625, 16.6923828125, 17.234130859375, 17.77587890625, 18.317626953125, 18.859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 9.0, 8.0, 18.0, 13.0, 16.0, 21.0, 37.0, 35.0, 44.0, 67.0, 88.0, 143.0, 219.0, 358.0, 714.0, 1955.0, 13512.0, 2626871.0, 491878.0, 6731.0, 1460.0, 561.0, 301.0, 172.0, 111.0, 82.0, 62.0, 53.0, 42.0, 24.0, 23.0, 16.0, 12.0, 14.0, 6.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.71875, -31.752685546875, -30.78662109375, -29.820556640625, -28.8544921875, -27.888427734375, -26.92236328125, -25.956298828125, -24.990234375, -24.024169921875, -23.05810546875, -22.092041015625, -21.1259765625, -20.159912109375, -19.19384765625, -18.227783203125, -17.26171875, -16.295654296875, -15.32958984375, -14.363525390625, -13.3974609375, -12.431396484375, -11.46533203125, -10.499267578125, -9.533203125, -8.567138671875, -7.60107421875, -6.635009765625, -5.6689453125, -4.702880859375, -3.73681640625, -2.770751953125, -1.8046875, -0.838623046875, 0.12744140625, 1.093505859375, 2.0595703125, 3.025634765625, 3.99169921875, 4.957763671875, 5.923828125, 6.889892578125, 7.85595703125, 8.822021484375, 9.7880859375, 10.754150390625, 11.72021484375, 12.686279296875, 13.65234375, 14.618408203125, 15.58447265625, 16.550537109375, 17.5166015625, 18.482666015625, 19.44873046875, 20.414794921875, 21.380859375, 22.346923828125, 23.31298828125, 24.279052734375, 25.2451171875, 26.211181640625, 27.17724609375, 28.143310546875, 29.109375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 143.0, 849.0, 20.0, 0.0, 1.0, 0.0, 2.0], "bins": [-869.2963256835938, -854.3916625976562, -839.487060546875, -824.5823974609375, -809.677734375, -794.7730712890625, -779.8684692382812, -764.9638061523438, -750.0591430664062, -735.1544799804688, -720.2498779296875, -705.34521484375, -690.4405517578125, -675.535888671875, -660.6312866210938, -645.7266235351562, -630.8219604492188, -615.9172973632812, -601.0126953125, -586.1080322265625, -571.203369140625, -556.2987060546875, -541.3941040039062, -526.4894409179688, -511.5848083496094, -496.68017578125, -481.7755126953125, -466.8708801269531, -451.9662170410156, -437.06158447265625, -422.15692138671875, -407.2522888183594, -392.3476257324219, -377.4429931640625, -362.538330078125, -347.6336975097656, -332.7290344238281, -317.82440185546875, -302.91973876953125, -288.0151062011719, -273.1104736328125, -258.2058410644531, -243.30117797851562, -228.3965301513672, -213.49188232421875, -198.58724975585938, -183.68258666992188, -168.7779541015625, -153.873291015625, -138.96864318847656, -124.06399536132812, -109.15934753417969, -94.25469970703125, -79.35005950927734, -64.4454116821289, -49.54076385498047, -34.6361083984375, -19.731460571289062, -4.826814651489258, 10.077831268310547, 24.982479095458984, 39.887123107910156, 54.791770935058594, 69.69641876220703, 84.60106658935547]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 7.0, 4.0, 10.0, 8.0, 13.0, 21.0, 18.0, 19.0, 21.0, 23.0, 37.0, 25.0, 39.0, 28.0, 28.0, 44.0, 41.0, 41.0, 37.0, 35.0, 30.0, 41.0, 42.0, 39.0, 31.0, 35.0, 41.0, 32.0, 36.0, 19.0, 20.0, 16.0, 15.0, 17.0, 12.0, 13.0, 15.0, 12.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-56.94044876098633, -55.305442810058594, -53.670433044433594, -52.03542709350586, -50.40041732788086, -48.765411376953125, -47.130401611328125, -45.49539566040039, -43.860389709472656, -42.22538375854492, -40.59037399291992, -38.95536804199219, -37.32035827636719, -35.68535232543945, -34.05034637451172, -32.41533660888672, -30.78032684326172, -29.14531898498535, -27.510311126708984, -25.87530517578125, -24.24029541015625, -22.605289459228516, -20.97028160095215, -19.33527374267578, -17.700265884399414, -16.065258026123047, -14.43025016784668, -12.795243263244629, -11.160235404968262, -9.525227546691895, -7.890220642089844, -6.255212783813477, -4.620204925537109, -2.9851973056793213, -1.3501896858215332, 0.2848176956176758, 1.919825553894043, 3.55483341217041, 5.189840316772461, 6.824848175048828, 8.459856033325195, 10.094863891601562, 11.72987174987793, 13.36487865447998, 14.999886512756348, 16.63489532470703, 18.269901275634766, 19.904909133911133, 21.5399169921875, 23.174924850463867, 24.809932708740234, 26.44493865966797, 28.07994842529297, 29.714954376220703, 31.34996223449707, 32.98497009277344, 34.61997985839844, 36.25498580932617, 37.88999557495117, 39.525001525878906, 41.160011291503906, 42.79501724243164, 44.430023193359375, 46.065032958984375, 47.70003890991211]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 7.0, 9.0, 8.0, 10.0, 15.0, 28.0, 25.0, 25.0, 31.0, 30.0, 22.0, 36.0, 36.0, 38.0, 37.0, 46.0, 43.0, 56.0, 52.0, 45.0, 24.0, 46.0, 35.0, 43.0, 36.0, 27.0, 29.0, 24.0, 17.0, 19.0, 17.0, 15.0, 8.0, 4.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.9921875, -7.765869140625, -7.53955078125, -7.313232421875, -7.0869140625, -6.860595703125, -6.63427734375, -6.407958984375, -6.181640625, -5.955322265625, -5.72900390625, -5.502685546875, -5.2763671875, -5.050048828125, -4.82373046875, -4.597412109375, -4.37109375, -4.144775390625, -3.91845703125, -3.692138671875, -3.4658203125, -3.239501953125, -3.01318359375, -2.786865234375, -2.560546875, -2.334228515625, -2.10791015625, -1.881591796875, -1.6552734375, -1.428955078125, -1.20263671875, -0.976318359375, -0.75, -0.523681640625, -0.29736328125, -0.071044921875, 0.1552734375, 0.381591796875, 0.60791015625, 0.834228515625, 1.060546875, 1.286865234375, 1.51318359375, 1.739501953125, 1.9658203125, 2.192138671875, 2.41845703125, 2.644775390625, 2.87109375, 3.097412109375, 3.32373046875, 3.550048828125, 3.7763671875, 4.002685546875, 4.22900390625, 4.455322265625, 4.681640625, 4.907958984375, 5.13427734375, 5.360595703125, 5.5869140625, 5.813232421875, 6.03955078125, 6.265869140625, 6.4921875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 11.0, 13.0, 20.0, 34.0, 31.0, 61.0, 90.0, 121.0, 172.0, 252.0, 398.0, 581.0, 914.0, 1644.0, 3474.0, 11230.0, 60314.0, 884756.0, 2967052.0, 224850.0, 26462.0, 6170.0, 2277.0, 1173.0, 757.0, 456.0, 282.0, 204.0, 161.0, 91.0, 65.0, 46.0, 26.0, 12.0, 10.0, 10.0, 18.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.734375, -30.80859375, -29.8828125, -28.95703125, -28.03125, -27.10546875, -26.1796875, -25.25390625, -24.328125, -23.40234375, -22.4765625, -21.55078125, -20.625, -19.69921875, -18.7734375, -17.84765625, -16.921875, -15.99609375, -15.0703125, -14.14453125, -13.21875, -12.29296875, -11.3671875, -10.44140625, -9.515625, -8.58984375, -7.6640625, -6.73828125, -5.8125, -4.88671875, -3.9609375, -3.03515625, -2.109375, -1.18359375, -0.2578125, 0.66796875, 1.59375, 2.51953125, 3.4453125, 4.37109375, 5.296875, 6.22265625, 7.1484375, 8.07421875, 9.0, 9.92578125, 10.8515625, 11.77734375, 12.703125, 13.62890625, 14.5546875, 15.48046875, 16.40625, 17.33203125, 18.2578125, 19.18359375, 20.109375, 21.03515625, 21.9609375, 22.88671875, 23.8125, 24.73828125, 25.6640625, 26.58984375, 27.515625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 13.0, 25.0, 30.0, 40.0, 56.0, 66.0, 95.0, 117.0, 164.0, 216.0, 315.0, 375.0, 468.0, 402.0, 389.0, 328.0, 236.0, 187.0, 118.0, 113.0, 86.0, 68.0, 45.0, 22.0, 13.0, 20.0, 11.0, 8.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.1397705078125, -8.724853515625, -8.3099365234375, -7.89501953125, -7.4801025390625, -7.065185546875, -6.6502685546875, -6.2353515625, -5.8204345703125, -5.405517578125, -4.9906005859375, -4.57568359375, -4.1607666015625, -3.745849609375, -3.3309326171875, -2.916015625, -2.5010986328125, -2.086181640625, -1.6712646484375, -1.25634765625, -0.8414306640625, -0.426513671875, -0.0115966796875, 0.4033203125, 0.8182373046875, 1.233154296875, 1.6480712890625, 2.06298828125, 2.4779052734375, 2.892822265625, 3.3077392578125, 3.72265625, 4.1375732421875, 4.552490234375, 4.9674072265625, 5.38232421875, 5.7972412109375, 6.212158203125, 6.6270751953125, 7.0419921875, 7.4569091796875, 7.871826171875, 8.2867431640625, 8.70166015625, 9.1165771484375, 9.531494140625, 9.9464111328125, 10.361328125, 10.7762451171875, 11.191162109375, 11.6060791015625, 12.02099609375, 12.4359130859375, 12.850830078125, 13.2657470703125, 13.6806640625, 14.0955810546875, 14.510498046875, 14.9254150390625, 15.34033203125, 15.7552490234375, 16.170166015625, 16.5850830078125, 17.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 16.0, 22.0, 47.0, 92.0, 199.0, 419.0, 1123.0, 4895.0, 49074.0, 977336.0, 2974785.0, 170687.0, 12409.0, 1974.0, 645.0, 255.0, 138.0, 69.0, 34.0, 15.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.984375, -24.15771484375, -23.3310546875, -22.50439453125, -21.677734375, -20.85107421875, -20.0244140625, -19.19775390625, -18.37109375, -17.54443359375, -16.7177734375, -15.89111328125, -15.064453125, -14.23779296875, -13.4111328125, -12.58447265625, -11.7578125, -10.93115234375, -10.1044921875, -9.27783203125, -8.451171875, -7.62451171875, -6.7978515625, -5.97119140625, -5.14453125, -4.31787109375, -3.4912109375, -2.66455078125, -1.837890625, -1.01123046875, -0.1845703125, 0.64208984375, 1.46875, 2.29541015625, 3.1220703125, 3.94873046875, 4.775390625, 5.60205078125, 6.4287109375, 7.25537109375, 8.08203125, 8.90869140625, 9.7353515625, 10.56201171875, 11.388671875, 12.21533203125, 13.0419921875, 13.86865234375, 14.6953125, 15.52197265625, 16.3486328125, 17.17529296875, 18.001953125, 18.82861328125, 19.6552734375, 20.48193359375, 21.30859375, 22.13525390625, 22.9619140625, 23.78857421875, 24.615234375, 25.44189453125, 26.2685546875, 27.09521484375, 27.921875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 12.0, 17.0, 26.0, 40.0, 52.0, 71.0, 81.0, 119.0, 97.0, 103.0, 89.0, 68.0, 53.0, 41.0, 23.0, 29.0, 19.0, 13.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.03022003173828, -75.66656494140625, -72.30290985107422, -68.93925476074219, -65.57560729980469, -62.211952209472656, -58.848297119140625, -55.484642028808594, -52.12099075317383, -48.7573356628418, -45.39368438720703, -42.030029296875, -38.66637420654297, -35.3027229309082, -31.939067840576172, -28.575414657592773, -25.211761474609375, -21.848108291625977, -18.484455108642578, -15.120800018310547, -11.757146835327148, -8.39349365234375, -5.029838562011719, -1.6661853790283203, 1.6974678039550781, 5.061121463775635, 8.424775123596191, 11.788429260253906, 15.152082443237305, 18.515735626220703, 21.879390716552734, 25.243043899536133, 28.606704711914062, 31.97035789489746, 35.33401107788086, 38.69766616821289, 42.061317443847656, 45.42497253417969, 48.78862762451172, 52.15228271484375, 55.515933990478516, 58.87958908081055, 62.24324035644531, 65.60689544677734, 68.97055053710938, 72.33419799804688, 75.69786071777344, 79.06150817871094, 82.42516326904297, 85.788818359375, 89.15247344970703, 92.51612854003906, 95.87977600097656, 99.2434310913086, 102.60708618164062, 105.97074127197266, 109.33439636230469, 112.69805145263672, 116.06170654296875, 119.42535400390625, 122.78900909423828, 126.15266418457031, 129.51632690429688, 132.87997436523438, 136.24362182617188]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 4.0, 10.0, 14.0, 3.0, 17.0, 11.0, 16.0, 18.0, 21.0, 27.0, 30.0, 30.0, 28.0, 45.0, 30.0, 39.0, 41.0, 48.0, 41.0, 45.0, 47.0, 41.0, 43.0, 40.0, 32.0, 43.0, 40.0, 21.0, 24.0, 24.0, 18.0, 23.0, 20.0, 15.0, 6.0, 8.0, 4.0, 8.0, 6.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.854591369628906, -59.93022918701172, -58.00586700439453, -56.081504821777344, -54.15713882446289, -52.2327766418457, -50.308414459228516, -48.38405227661133, -46.459686279296875, -44.53532409667969, -42.6109619140625, -40.68659973144531, -38.76223373413086, -36.83787155151367, -34.913509368896484, -32.9891471862793, -31.06478500366211, -29.140422821044922, -27.2160587310791, -25.291696548461914, -23.367332458496094, -21.442970275878906, -19.51860809326172, -17.59424591064453, -15.669881820678711, -13.745518684387207, -11.821155548095703, -9.896793365478516, -7.972430229187012, -6.048067092895508, -4.12370491027832, -2.1993417739868164, -0.2749748229980469, 1.649388074874878, 3.5737509727478027, 5.498113632202148, 7.422476768493652, 9.346839904785156, 11.271202087402344, 13.195565223693848, 15.119928359985352, 17.04429054260254, 18.96865463256836, 20.893016815185547, 22.817378997802734, 24.741743087768555, 26.666105270385742, 28.590469360351562, 30.51483154296875, 32.43919372558594, 34.363555908203125, 36.28791809082031, 38.212284088134766, 40.13664627075195, 42.06100845336914, 43.98537063598633, 45.90973663330078, 47.83409881591797, 49.758460998535156, 51.682823181152344, 53.6071891784668, 55.531551361083984, 57.45591354370117, 59.38027572631836, 61.30463790893555]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 8.0, 7.0, 12.0, 14.0, 16.0, 13.0, 21.0, 26.0, 26.0, 34.0, 28.0, 34.0, 36.0, 23.0, 40.0, 36.0, 43.0, 45.0, 57.0, 33.0, 50.0, 50.0, 42.0, 40.0, 36.0, 23.0, 29.0, 29.0, 23.0, 22.0, 18.0, 21.0, 11.0, 8.0, 10.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-116.0625, -112.33203125, -108.6015625, -104.87109375, -101.140625, -97.41015625, -93.6796875, -89.94921875, -86.21875, -82.48828125, -78.7578125, -75.02734375, -71.296875, -67.56640625, -63.8359375, -60.10546875, -56.375, -52.64453125, -48.9140625, -45.18359375, -41.453125, -37.72265625, -33.9921875, -30.26171875, -26.53125, -22.80078125, -19.0703125, -15.33984375, -11.609375, -7.87890625, -4.1484375, -0.41796875, 3.3125, 7.04296875, 10.7734375, 14.50390625, 18.234375, 21.96484375, 25.6953125, 29.42578125, 33.15625, 36.88671875, 40.6171875, 44.34765625, 48.078125, 51.80859375, 55.5390625, 59.26953125, 63.0, 66.73046875, 70.4609375, 74.19140625, 77.921875, 81.65234375, 85.3828125, 89.11328125, 92.84375, 96.57421875, 100.3046875, 104.03515625, 107.765625, 111.49609375, 115.2265625, 118.95703125, 122.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 17.0, 21.0, 25.0, 45.0, 51.0, 112.0, 175.0, 244.0, 402.0, 687.0, 1112.0, 1820.0, 3046.0, 5066.0, 8562.0, 15048.0, 26916.0, 49722.0, 98912.0, 199028.0, 276697.0, 175071.0, 85675.0, 43800.0, 23652.0, 13341.0, 7748.0, 4598.0, 2683.0, 1646.0, 1010.0, 616.0, 365.0, 223.0, 146.0, 103.0, 68.0, 34.0, 28.0, 17.0, 9.0, 10.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.931640625, -7.65234375, -7.373046875, -7.09375, -6.814453125, -6.53515625, -6.255859375, -5.9765625, -5.697265625, -5.41796875, -5.138671875, -4.859375, -4.580078125, -4.30078125, -4.021484375, -3.7421875, -3.462890625, -3.18359375, -2.904296875, -2.625, -2.345703125, -2.06640625, -1.787109375, -1.5078125, -1.228515625, -0.94921875, -0.669921875, -0.390625, -0.111328125, 0.16796875, 0.447265625, 0.7265625, 1.005859375, 1.28515625, 1.564453125, 1.84375, 2.123046875, 2.40234375, 2.681640625, 2.9609375, 3.240234375, 3.51953125, 3.798828125, 4.078125, 4.357421875, 4.63671875, 4.916015625, 5.1953125, 5.474609375, 5.75390625, 6.033203125, 6.3125, 6.591796875, 6.87109375, 7.150390625, 7.4296875, 7.708984375, 7.98828125, 8.267578125, 8.546875, 8.826171875, 9.10546875, 9.384765625, 9.6640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 13.0, 15.0, 9.0, 24.0, 17.0, 25.0, 29.0, 25.0, 27.0, 39.0, 38.0, 43.0, 53.0, 56.0, 30.0, 40.0, 1076.0, 52.0, 43.0, 45.0, 35.0, 43.0, 45.0, 30.0, 15.0, 20.0, 18.0, 26.0, 18.0, 18.0, 12.0, 7.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5, -71.095703125, -68.69140625, -66.287109375, -63.8828125, -61.478515625, -59.07421875, -56.669921875, -54.265625, -51.861328125, -49.45703125, -47.052734375, -44.6484375, -42.244140625, -39.83984375, -37.435546875, -35.03125, -32.626953125, -30.22265625, -27.818359375, -25.4140625, -23.009765625, -20.60546875, -18.201171875, -15.796875, -13.392578125, -10.98828125, -8.583984375, -6.1796875, -3.775390625, -1.37109375, 1.033203125, 3.4375, 5.841796875, 8.24609375, 10.650390625, 13.0546875, 15.458984375, 17.86328125, 20.267578125, 22.671875, 25.076171875, 27.48046875, 29.884765625, 32.2890625, 34.693359375, 37.09765625, 39.501953125, 41.90625, 44.310546875, 46.71484375, 49.119140625, 51.5234375, 53.927734375, 56.33203125, 58.736328125, 61.140625, 63.544921875, 65.94921875, 68.353515625, 70.7578125, 73.162109375, 75.56640625, 77.970703125, 80.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 5.0, 6.0, 15.0, 18.0, 21.0, 34.0, 55.0, 87.0, 156.0, 226.0, 396.0, 542.0, 888.0, 1554.0, 2563.0, 4578.0, 7624.0, 13480.0, 24569.0, 44804.0, 85734.0, 177692.0, 1278300.0, 231857.0, 101778.0, 53328.0, 28559.0, 15890.0, 9200.0, 5366.0, 3058.0, 1869.0, 1153.0, 659.0, 373.0, 224.0, 174.0, 100.0, 70.0, 49.0, 31.0, 17.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.1922607421875, -7.915771484375, -7.6392822265625, -7.36279296875, -7.0863037109375, -6.809814453125, -6.5333251953125, -6.2568359375, -5.9803466796875, -5.703857421875, -5.4273681640625, -5.15087890625, -4.8743896484375, -4.597900390625, -4.3214111328125, -4.044921875, -3.7684326171875, -3.491943359375, -3.2154541015625, -2.93896484375, -2.6624755859375, -2.385986328125, -2.1094970703125, -1.8330078125, -1.5565185546875, -1.280029296875, -1.0035400390625, -0.72705078125, -0.4505615234375, -0.174072265625, 0.1024169921875, 0.37890625, 0.6553955078125, 0.931884765625, 1.2083740234375, 1.48486328125, 1.7613525390625, 2.037841796875, 2.3143310546875, 2.5908203125, 2.8673095703125, 3.143798828125, 3.4202880859375, 3.69677734375, 3.9732666015625, 4.249755859375, 4.5262451171875, 4.802734375, 5.0792236328125, 5.355712890625, 5.6322021484375, 5.90869140625, 6.1851806640625, 6.461669921875, 6.7381591796875, 7.0146484375, 7.2911376953125, 7.567626953125, 7.8441162109375, 8.12060546875, 8.3970947265625, 8.673583984375, 8.9500732421875, 9.2265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 16.0, 12.0, 20.0, 28.0, 50.0, 43.0, 45.0, 65.0, 90.0, 85.0, 96.0, 84.0, 58.0, 43.0, 42.0, 31.0, 24.0, 22.0, 19.0, 16.0, 14.0, 10.0, 11.0, 7.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.297607421875, -0.28797149658203125, -0.2783355712890625, -0.26869964599609375, -0.259063720703125, -0.24942779541015625, -0.2397918701171875, -0.23015594482421875, -0.22052001953125, -0.21088409423828125, -0.2012481689453125, -0.19161224365234375, -0.181976318359375, -0.17234039306640625, -0.1627044677734375, -0.15306854248046875, -0.1434326171875, -0.13379669189453125, -0.1241607666015625, -0.11452484130859375, -0.104888916015625, -0.09525299072265625, -0.0856170654296875, -0.07598114013671875, -0.06634521484375, -0.05670928955078125, -0.0470733642578125, -0.03743743896484375, -0.027801513671875, -0.01816558837890625, -0.0085296630859375, 0.00110626220703125, 0.0107421875, 0.02037811279296875, 0.0300140380859375, 0.03964996337890625, 0.049285888671875, 0.05892181396484375, 0.0685577392578125, 0.07819366455078125, 0.08782958984375, 0.09746551513671875, 0.1071014404296875, 0.11673736572265625, 0.126373291015625, 0.13600921630859375, 0.1456451416015625, 0.15528106689453125, 0.1649169921875, 0.17455291748046875, 0.1841888427734375, 0.19382476806640625, 0.203460693359375, 0.21309661865234375, 0.2227325439453125, 0.23236846923828125, 0.24200439453125, 0.25164031982421875, 0.2612762451171875, 0.27091217041015625, 0.280548095703125, 0.29018402099609375, 0.2998199462890625, 0.30945587158203125, 0.319091796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 7.0, 13.0, 17.0, 10.0, 37.0, 28.0, 63.0, 59.0, 97.0, 131.0, 187.0, 263.0, 364.0, 550.0, 735.0, 1098.0, 1652.0, 2877.0, 5781.0, 13370.0, 37853.0, 165446.0, 574028.0, 176506.0, 39258.0, 13737.0, 6046.0, 2896.0, 1739.0, 1096.0, 766.0, 564.0, 352.0, 264.0, 200.0, 136.0, 88.0, 58.0, 45.0, 48.0, 33.0, 20.0, 13.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.767578125, -1.71636962890625, -1.6651611328125, -1.61395263671875, -1.562744140625, -1.51153564453125, -1.4603271484375, -1.40911865234375, -1.35791015625, -1.30670166015625, -1.2554931640625, -1.20428466796875, -1.153076171875, -1.10186767578125, -1.0506591796875, -0.99945068359375, -0.9482421875, -0.89703369140625, -0.8458251953125, -0.79461669921875, -0.743408203125, -0.69219970703125, -0.6409912109375, -0.58978271484375, -0.53857421875, -0.48736572265625, -0.4361572265625, -0.38494873046875, -0.333740234375, -0.28253173828125, -0.2313232421875, -0.18011474609375, -0.12890625, -0.07769775390625, -0.0264892578125, 0.02471923828125, 0.075927734375, 0.12713623046875, 0.1783447265625, 0.22955322265625, 0.28076171875, 0.33197021484375, 0.3831787109375, 0.43438720703125, 0.485595703125, 0.53680419921875, 0.5880126953125, 0.63922119140625, 0.6904296875, 0.74163818359375, 0.7928466796875, 0.84405517578125, 0.895263671875, 0.94647216796875, 0.9976806640625, 1.04888916015625, 1.10009765625, 1.15130615234375, 1.2025146484375, 1.25372314453125, 1.304931640625, 1.35614013671875, 1.4073486328125, 1.45855712890625, 1.509765625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 2.0, 7.0, 9.0, 17.0, 24.0, 32.0, 51.0, 77.0, 100.0, 124.0, 131.0, 125.0, 122.0, 62.0, 39.0, 28.0, 22.0, 11.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8307793140411377, -0.8086284399032593, -0.7864775657653809, -0.7643266916275024, -0.742175817489624, -0.7200250029563904, -0.697874128818512, -0.6757232546806335, -0.6535723805427551, -0.6314215064048767, -0.6092706322669983, -0.5871197581291199, -0.5649689435958862, -0.5428180694580078, -0.5206671953201294, -0.498516321182251, -0.47636544704437256, -0.45421457290649414, -0.4320636987686157, -0.4099128544330597, -0.3877619802951813, -0.36561110615730286, -0.3434602618217468, -0.3213093876838684, -0.29915851354599, -0.2770076394081116, -0.25485676527023315, -0.23270592093467712, -0.2105550467967987, -0.1884041726589203, -0.16625331342220306, -0.14410245418548584, -0.12195158004760742, -0.0998007133603096, -0.07764984667301178, -0.05549897998571396, -0.03334811329841614, -0.011197246611118317, 0.010953620076179504, 0.03310447931289673, 0.055255353450775146, 0.07740622013807297, 0.09955708682537079, 0.12170795351266861, 0.14385882019996643, 0.16600969433784485, 0.18816055357456207, 0.2103114128112793, 0.23246228694915771, 0.25461316108703613, 0.27676403522491455, 0.2989148795604706, 0.321065753698349, 0.3432166278362274, 0.36536747217178345, 0.38751834630966187, 0.4096692204475403, 0.4318200945854187, 0.4539709687232971, 0.47612181305885315, 0.49827268719673157, 0.5204235315322876, 0.542574405670166, 0.5647252798080444, 0.5868761539459229]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 11.0, 8.0, 12.0, 17.0, 13.0, 30.0, 23.0, 26.0, 27.0, 27.0, 34.0, 35.0, 33.0, 38.0, 54.0, 38.0, 40.0, 36.0, 50.0, 38.0, 39.0, 40.0, 33.0, 36.0, 17.0, 29.0, 23.0, 24.0, 24.0, 17.0, 13.0, 17.0, 19.0, 11.0, 12.0, 2.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22672247886657715, -0.21937517821788788, -0.2120278775691986, -0.20468059182167053, -0.19733329117298126, -0.189985990524292, -0.18263868987560272, -0.17529138922691345, -0.16794410347938538, -0.1605968028306961, -0.15324950218200684, -0.14590221643447876, -0.1385549157857895, -0.13120761513710022, -0.12386031448841095, -0.11651301383972168, -0.10916571319103241, -0.10181841254234314, -0.09447111934423447, -0.0871238186955452, -0.07977652549743652, -0.07242922484874725, -0.06508192420005798, -0.05773462727665901, -0.05038733035326004, -0.04304003342986107, -0.0356927365064621, -0.028345435857772827, -0.020998138934373856, -0.013650842010974884, -0.006303541362285614, 0.0010437555611133575, 0.008391052484512329, 0.0157383494079113, 0.02308564819395542, 0.030432946979999542, 0.037780243903398514, 0.045127540826797485, 0.052474841475486755, 0.05982213839888573, 0.0671694353222847, 0.07451673597097397, 0.08186402916908264, 0.08921132981777191, 0.09655863046646118, 0.10390592366456985, 0.11125322431325912, 0.1186005175113678, 0.12594781816005707, 0.13329511880874634, 0.1406424194574356, 0.14798972010612488, 0.15533700585365295, 0.16268430650234222, 0.1700316071510315, 0.17737890779972076, 0.18472620844841003, 0.1920735090970993, 0.19942080974578857, 0.20676809549331665, 0.21411539614200592, 0.2214626967906952, 0.22880999743938446, 0.23615729808807373, 0.2435045838356018]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 14.0, 6.0, 11.0, 11.0, 11.0, 14.0, 11.0, 21.0, 24.0, 19.0, 35.0, 35.0, 39.0, 36.0, 42.0, 30.0, 45.0, 42.0, 51.0, 46.0, 35.0, 52.0, 41.0, 47.0, 32.0, 33.0, 28.0, 20.0, 31.0, 30.0, 17.0, 13.0, 14.0, 10.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.0625, -100.4365234375, -96.810546875, -93.1845703125, -89.55859375, -85.9326171875, -82.306640625, -78.6806640625, -75.0546875, -71.4287109375, -67.802734375, -64.1767578125, -60.55078125, -56.9248046875, -53.298828125, -49.6728515625, -46.046875, -42.4208984375, -38.794921875, -35.1689453125, -31.54296875, -27.9169921875, -24.291015625, -20.6650390625, -17.0390625, -13.4130859375, -9.787109375, -6.1611328125, -2.53515625, 1.0908203125, 4.716796875, 8.3427734375, 11.96875, 15.5947265625, 19.220703125, 22.8466796875, 26.47265625, 30.0986328125, 33.724609375, 37.3505859375, 40.9765625, 44.6025390625, 48.228515625, 51.8544921875, 55.48046875, 59.1064453125, 62.732421875, 66.3583984375, 69.984375, 73.6103515625, 77.236328125, 80.8623046875, 84.48828125, 88.1142578125, 91.740234375, 95.3662109375, 98.9921875, 102.6181640625, 106.244140625, 109.8701171875, 113.49609375, 117.1220703125, 120.748046875, 124.3740234375, 128.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 9.0, 11.0, 11.0, 8.0, 16.0, 16.0, 20.0, 36.0, 42.0, 55.0, 64.0, 94.0, 168.0, 264.0, 526.0, 1226.0, 4081.0, 21812.0, 208194.0, 683298.0, 109866.0, 13652.0, 2946.0, 979.0, 437.0, 214.0, 136.0, 91.0, 64.0, 55.0, 34.0, 25.0, 20.0, 20.0, 11.0, 8.0, 9.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.616455078125, -20.82666015625, -20.036865234375, -19.2470703125, -18.457275390625, -17.66748046875, -16.877685546875, -16.087890625, -15.298095703125, -14.50830078125, -13.718505859375, -12.9287109375, -12.138916015625, -11.34912109375, -10.559326171875, -9.76953125, -8.979736328125, -8.18994140625, -7.400146484375, -6.6103515625, -5.820556640625, -5.03076171875, -4.240966796875, -3.451171875, -2.661376953125, -1.87158203125, -1.081787109375, -0.2919921875, 0.497802734375, 1.28759765625, 2.077392578125, 2.8671875, 3.656982421875, 4.44677734375, 5.236572265625, 6.0263671875, 6.816162109375, 7.60595703125, 8.395751953125, 9.185546875, 9.975341796875, 10.76513671875, 11.554931640625, 12.3447265625, 13.134521484375, 13.92431640625, 14.714111328125, 15.50390625, 16.293701171875, 17.08349609375, 17.873291015625, 18.6630859375, 19.452880859375, 20.24267578125, 21.032470703125, 21.822265625, 22.612060546875, 23.40185546875, 24.191650390625, 24.9814453125, 25.771240234375, 26.56103515625, 27.350830078125, 28.140625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 13.0, 10.0, 14.0, 21.0, 21.0, 27.0, 25.0, 38.0, 51.0, 56.0, 69.0, 62.0, 79.0, 2089.0, 68.0, 61.0, 58.0, 47.0, 50.0, 40.0, 31.0, 24.0, 20.0, 13.0, 16.0, 17.0, 12.0, 5.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-177.5, -170.978515625, -164.45703125, -157.935546875, -151.4140625, -144.892578125, -138.37109375, -131.849609375, -125.328125, -118.806640625, -112.28515625, -105.763671875, -99.2421875, -92.720703125, -86.19921875, -79.677734375, -73.15625, -66.634765625, -60.11328125, -53.591796875, -47.0703125, -40.548828125, -34.02734375, -27.505859375, -20.984375, -14.462890625, -7.94140625, -1.419921875, 5.1015625, 11.623046875, 18.14453125, 24.666015625, 31.1875, 37.708984375, 44.23046875, 50.751953125, 57.2734375, 63.794921875, 70.31640625, 76.837890625, 83.359375, 89.880859375, 96.40234375, 102.923828125, 109.4453125, 115.966796875, 122.48828125, 129.009765625, 135.53125, 142.052734375, 148.57421875, 155.095703125, 161.6171875, 168.138671875, 174.66015625, 181.181640625, 187.703125, 194.224609375, 200.74609375, 207.267578125, 213.7890625, 220.310546875, 226.83203125, 233.353515625, 239.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 14.0, 16.0, 42.0, 45.0, 92.0, 125.0, 245.0, 445.0, 1147.0, 3703.0, 21451.0, 369963.0, 2701984.0, 38615.0, 5158.0, 1416.0, 586.0, 253.0, 146.0, 83.0, 57.0, 31.0, 25.0, 11.0, 8.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -23.943359375, -23.12109375, -22.298828125, -21.4765625, -20.654296875, -19.83203125, -19.009765625, -18.1875, -17.365234375, -16.54296875, -15.720703125, -14.8984375, -14.076171875, -13.25390625, -12.431640625, -11.609375, -10.787109375, -9.96484375, -9.142578125, -8.3203125, -7.498046875, -6.67578125, -5.853515625, -5.03125, -4.208984375, -3.38671875, -2.564453125, -1.7421875, -0.919921875, -0.09765625, 0.724609375, 1.546875, 2.369140625, 3.19140625, 4.013671875, 4.8359375, 5.658203125, 6.48046875, 7.302734375, 8.125, 8.947265625, 9.76953125, 10.591796875, 11.4140625, 12.236328125, 13.05859375, 13.880859375, 14.703125, 15.525390625, 16.34765625, 17.169921875, 17.9921875, 18.814453125, 19.63671875, 20.458984375, 21.28125, 22.103515625, 22.92578125, 23.748046875, 24.5703125, 25.392578125, 26.21484375, 27.037109375, 27.859375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 17.0, 30.0, 47.0, 61.0, 146.0, 197.0, 171.0, 129.0, 65.0, 40.0, 22.0, 14.0, 10.0, 9.0, 2.0, 5.0, 5.0, 3.0, 6.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-302.72509765625, -294.0524597167969, -285.3797912597656, -276.7071533203125, -268.03448486328125, -259.3618469238281, -250.68917846679688, -242.01654052734375, -233.3438720703125, -224.6712188720703, -215.99856567382812, -207.32591247558594, -198.65325927734375, -189.98060607910156, -181.30795288085938, -172.63531494140625, -163.96266174316406, -155.29000854492188, -146.6173553466797, -137.9447021484375, -129.2720489501953, -120.59939575195312, -111.92675018310547, -103.25409698486328, -94.5814437866211, -85.9087905883789, -77.23613739013672, -68.56349182128906, -59.89083480834961, -51.21818161010742, -42.5455322265625, -33.87287902832031, -25.200210571289062, -16.527557373046875, -7.85490608215332, 0.8177452087402344, 9.490398406982422, 18.16305160522461, 26.83570098876953, 35.50835418701172, 44.181007385253906, 52.853660583496094, 61.52631378173828, 70.19895935058594, 78.87161254882812, 87.54426574707031, 96.2169189453125, 104.88957214355469, 113.56222534179688, 122.23487854003906, 130.90753173828125, 139.58018493652344, 148.25283813476562, 156.9254913330078, 165.59814453125, 174.27078247070312, 182.94345092773438, 191.61610412597656, 200.28875732421875, 208.96141052246094, 217.63406372070312, 226.3067169189453, 234.9793701171875, 243.65200805664062, 252.3246612548828]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 6.0, 2.0, 8.0, 10.0, 16.0, 10.0, 10.0, 14.0, 17.0, 25.0, 23.0, 25.0, 35.0, 43.0, 36.0, 42.0, 41.0, 38.0, 43.0, 45.0, 47.0, 38.0, 49.0, 38.0, 54.0, 42.0, 32.0, 27.0, 28.0, 32.0, 19.0, 17.0, 18.0, 16.0, 11.0, 5.0, 7.0, 5.0, 12.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.72418212890625, -208.71995544433594, -201.71572875976562, -194.71148681640625, -187.70726013183594, -180.70303344726562, -173.69879150390625, -166.69456481933594, -159.69033813476562, -152.6861114501953, -145.681884765625, -138.67764282226562, -131.6734161376953, -124.669189453125, -117.66495513916016, -110.66072082519531, -103.656494140625, -96.65226745605469, -89.64803314208984, -82.643798828125, -75.63957214355469, -68.63534545898438, -61.63111114501953, -54.62688064575195, -47.622650146484375, -40.6184196472168, -33.61418914794922, -26.60995864868164, -19.605728149414062, -12.601497650146484, -5.597267150878906, 1.4069633483886719, 8.411209106445312, 15.41543960571289, 22.41967010498047, 29.423900604248047, 36.428131103515625, 43.4323616027832, 50.43659210205078, 57.44082260131836, 64.44505310058594, 71.44927978515625, 78.4535140991211, 85.45774841308594, 92.46197509765625, 99.46620178222656, 106.4704360961914, 113.47467041015625, 120.47889709472656, 127.48312377929688, 134.48736572265625, 141.49159240722656, 148.49581909179688, 155.5000457763672, 162.5042724609375, 169.50851440429688, 176.5127410888672, 183.5169677734375, 190.52120971679688, 197.5254364013672, 204.5296630859375, 211.5338897705078, 218.53811645507812, 225.5423583984375, 232.5465850830078]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 6.0, 8.0, 4.0, 16.0, 13.0, 16.0, 25.0, 34.0, 49.0, 49.0, 68.0, 80.0, 116.0, 155.0, 190.0, 279.0, 426.0, 607.0, 1162.0, 2007.0, 4191.0, 8921.0, 1015063.0, 7125.0, 3360.0, 1669.0, 935.0, 563.0, 354.0, 268.0, 188.0, 134.0, 88.0, 84.0, 70.0, 58.0, 31.0, 35.0, 24.0, 25.0, 21.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-49.940921783447266, -48.34784698486328, -46.75477600097656, -45.16170120239258, -43.568626403808594, -41.975555419921875, -40.38248062133789, -38.789405822753906, -37.19633483886719, -35.6032600402832, -34.010189056396484, -32.4171142578125, -30.82404136657715, -29.230968475341797, -27.637893676757812, -26.04482078552246, -24.45174789428711, -22.858675003051758, -21.265602111816406, -19.672527313232422, -18.07945442199707, -16.48638153076172, -14.89330768585205, -13.300233840942383, -11.707160949707031, -10.11408805847168, -8.521014213562012, -6.927940845489502, -5.334867477416992, -3.7417941093444824, -2.1487207412719727, -0.5556468963623047, 1.0374298095703125, 2.6305031776428223, 4.223576545715332, 5.816649913787842, 7.409723281860352, 9.002796173095703, 10.595870018005371, 12.188943862915039, 13.78201675415039, 15.375089645385742, 16.968162536621094, 18.561237335205078, 20.15431022644043, 21.74738311767578, 23.340457916259766, 24.933530807495117, 26.52660369873047, 28.11967658996582, 29.712749481201172, 31.305824279785156, 32.898895263671875, 34.49197006225586, 36.085044860839844, 37.67811584472656, 39.27119064331055, 40.86426544189453, 42.45733642578125, 44.050411224365234, 45.64348602294922, 47.23655700683594, 48.82963180541992, 50.422706604003906, 52.015777587890625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 4.0, 13.0, 14.0, 23.0, 29.0, 53.0, 180.0, 5312.0, 51455360.0, 1881.0, 131.0, 49.0, 33.0, 16.0, 12.0, 6.0, 5.0, 3.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-897.4190063476562, -872.0631103515625, -846.7071533203125, -821.3511962890625, -795.9953002929688, -770.639404296875, -745.283447265625, -719.927490234375, -694.5715942382812, -669.2156982421875, -643.8597412109375, -618.5037841796875, -593.1478881835938, -567.7919921875, -542.43603515625, -517.080078125, -491.72418212890625, -466.3682556152344, -441.0123291015625, -415.6564025878906, -390.30047607421875, -364.9445495605469, -339.588623046875, -314.2326965332031, -288.87677001953125, -263.5208435058594, -238.1649169921875, -212.80899047851562, -187.45306396484375, -162.09713745117188, -136.7412109375, -111.38528442382812, -86.02935791015625, -60.673431396484375, -35.3175048828125, -9.961578369140625, 15.39434814453125, 40.750274658203125, 66.106201171875, 91.46212768554688, 116.81805419921875, 142.17398071289062, 167.5299072265625, 192.88583374023438, 218.24176025390625, 243.59768676757812, 268.95361328125, 294.3095397949219, 319.66546630859375, 345.0213928222656, 370.3773193359375, 395.7332458496094, 421.08917236328125, 446.4450988769531, 471.801025390625, 497.1569519042969, 522.5128784179688, 547.8687744140625, 573.2247314453125, 598.5806884765625, 623.9365844726562, 649.29248046875, 674.6484375, 700.00439453125, 725.3602905273438]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 11.0, 13.0, 28.0, 51.0, 78.0, 87.0, 157.0, 237.0, 375.0, 577.0, 990.0, 1642.0, 2773.0, 4907.0, 8870.0, 16543.0, 32900.0, 69026.0, 159870.0, 420533.0, 1644468.0, 3003889.0, 551408.0, 202637.0, 85715.0, 39533.0, 19787.0, 10390.0, 5792.0, 3250.0, 1839.0, 1139.0, 684.0, 445.0, 277.0, 173.0, 113.0, 74.0, 39.0, 34.0, 25.0, 21.0, 7.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.875, -31.8828125, -30.890625, -29.8984375, -28.90625, -27.9140625, -26.921875, -25.9296875, -24.9375, -23.9453125, -22.953125, -21.9609375, -20.96875, -19.9765625, -18.984375, -17.9921875, -17.0, -16.0078125, -15.015625, -14.0234375, -13.03125, -12.0390625, -11.046875, -10.0546875, -9.0625, -8.0703125, -7.078125, -6.0859375, -5.09375, -4.1015625, -3.109375, -2.1171875, -1.125, -0.1328125, 0.859375, 1.8515625, 2.84375, 3.8359375, 4.828125, 5.8203125, 6.8125, 7.8046875, 8.796875, 9.7890625, 10.78125, 11.7734375, 12.765625, 13.7578125, 14.75, 15.7421875, 16.734375, 17.7265625, 18.71875, 19.7109375, 20.703125, 21.6953125, 22.6875, 23.6796875, 24.671875, 25.6640625, 26.65625, 27.6484375, 28.640625, 29.6328125, 30.625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 5.0, 11.0, 10.0, 11.0, 18.0, 16.0, 11.0, 25.0, 26.0, 23.0, 26.0, 27.0, 38.0, 33.0, 61.0, 54.0, 88.0, 133.0, 222.0, 364.0, 265.0, 102.0, 71.0, 36.0, 40.0, 37.0, 33.0, 34.0, 28.0, 21.0, 19.0, 21.0, 15.0, 17.0, 14.0, 11.0, 9.0, 8.0, 5.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-34.15625, -33.0751953125, -31.994140625, -30.9130859375, -29.83203125, -28.7509765625, -27.669921875, -26.5888671875, -25.5078125, -24.4267578125, -23.345703125, -22.2646484375, -21.18359375, -20.1025390625, -19.021484375, -17.9404296875, -16.859375, -15.7783203125, -14.697265625, -13.6162109375, -12.53515625, -11.4541015625, -10.373046875, -9.2919921875, -8.2109375, -7.1298828125, -6.048828125, -4.9677734375, -3.88671875, -2.8056640625, -1.724609375, -0.6435546875, 0.4375, 1.5185546875, 2.599609375, 3.6806640625, 4.76171875, 5.8427734375, 6.923828125, 8.0048828125, 9.0859375, 10.1669921875, 11.248046875, 12.3291015625, 13.41015625, 14.4912109375, 15.572265625, 16.6533203125, 17.734375, 18.8154296875, 19.896484375, 20.9775390625, 22.05859375, 23.1396484375, 24.220703125, 25.3017578125, 26.3828125, 27.4638671875, 28.544921875, 29.6259765625, 30.70703125, 31.7880859375, 32.869140625, 33.9501953125, 35.03125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 6.0, 7.0, 11.0, 23.0, 37.0, 59.0, 82.0, 108.0, 185.0, 253.0, 373.0, 493.0, 777.0, 1042.0, 1573.0, 2316.0, 3340.0, 4770.0, 7088.0, 10999.0, 17356.0, 26704.0, 42972.0, 69220.0, 111773.0, 182478.0, 294768.0, 523525.0, 2453482.0, 1427437.0, 428126.0, 257382.0, 159093.0, 97405.0, 59926.0, 37336.0, 23766.0, 14989.0, 9900.0, 6644.0, 4404.0, 2905.0, 1935.0, 1355.0, 901.0, 675.0, 445.0, 319.0, 219.0, 163.0, 102.0, 63.0, 55.0, 32.0, 15.0, 13.0, 5.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.453125, -9.136474609375, -8.81982421875, -8.503173828125, -8.1865234375, -7.869873046875, -7.55322265625, -7.236572265625, -6.919921875, -6.603271484375, -6.28662109375, -5.969970703125, -5.6533203125, -5.336669921875, -5.02001953125, -4.703369140625, -4.38671875, -4.070068359375, -3.75341796875, -3.436767578125, -3.1201171875, -2.803466796875, -2.48681640625, -2.170166015625, -1.853515625, -1.536865234375, -1.22021484375, -0.903564453125, -0.5869140625, -0.270263671875, 0.04638671875, 0.363037109375, 0.6796875, 0.996337890625, 1.31298828125, 1.629638671875, 1.9462890625, 2.262939453125, 2.57958984375, 2.896240234375, 3.212890625, 3.529541015625, 3.84619140625, 4.162841796875, 4.4794921875, 4.796142578125, 5.11279296875, 5.429443359375, 5.74609375, 6.062744140625, 6.37939453125, 6.696044921875, 7.0126953125, 7.329345703125, 7.64599609375, 7.962646484375, 8.279296875, 8.595947265625, 8.91259765625, 9.229248046875, 9.5458984375, 9.862548828125, 10.17919921875, 10.495849609375, 10.8125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 7.0, 12.0, 15.0, 11.0, 16.0, 21.0, 18.0, 30.0, 30.0, 36.0, 27.0, 42.0, 53.0, 56.0, 69.0, 115.0, 448.0, 452.0, 134.0, 52.0, 42.0, 38.0, 49.0, 28.0, 16.0, 30.0, 24.0, 17.0, 20.0, 17.0, 13.0, 12.0, 9.0, 8.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.9892578125, -48.322265625, -46.6552734375, -44.98828125, -43.3212890625, -41.654296875, -39.9873046875, -38.3203125, -36.6533203125, -34.986328125, -33.3193359375, -31.65234375, -29.9853515625, -28.318359375, -26.6513671875, -24.984375, -23.3173828125, -21.650390625, -19.9833984375, -18.31640625, -16.6494140625, -14.982421875, -13.3154296875, -11.6484375, -9.9814453125, -8.314453125, -6.6474609375, -4.98046875, -3.3134765625, -1.646484375, 0.0205078125, 1.6875, 3.3544921875, 5.021484375, 6.6884765625, 8.35546875, 10.0224609375, 11.689453125, 13.3564453125, 15.0234375, 16.6904296875, 18.357421875, 20.0244140625, 21.69140625, 23.3583984375, 25.025390625, 26.6923828125, 28.359375, 30.0263671875, 31.693359375, 33.3603515625, 35.02734375, 36.6943359375, 38.361328125, 40.0283203125, 41.6953125, 43.3623046875, 45.029296875, 46.6962890625, 48.36328125, 50.0302734375, 51.697265625, 53.3642578125, 55.03125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 0.0, 7.0, 10.0, 8.0, 6.0, 9.0, 20.0, 23.0, 27.0, 29.0, 58.0, 83.0, 113.0, 134.0, 161.0, 238.0, 315.0, 433.0, 618.0, 997.0, 1620.0, 2949.0, 5579.0, 12426.0, 31712.0, 91881.0, 5487559.0, 516704.0, 84390.0, 29232.0, 11628.0, 5113.0, 2715.0, 1518.0, 901.0, 629.0, 392.0, 271.0, 200.0, 173.0, 139.0, 107.0, 87.0, 69.0, 52.0, 31.0, 17.0, 11.0, 14.0, 12.0, 12.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-62.65625, -60.63232421875, -58.6083984375, -56.58447265625, -54.560546875, -52.53662109375, -50.5126953125, -48.48876953125, -46.46484375, -44.44091796875, -42.4169921875, -40.39306640625, -38.369140625, -36.34521484375, -34.3212890625, -32.29736328125, -30.2734375, -28.24951171875, -26.2255859375, -24.20166015625, -22.177734375, -20.15380859375, -18.1298828125, -16.10595703125, -14.08203125, -12.05810546875, -10.0341796875, -8.01025390625, -5.986328125, -3.96240234375, -1.9384765625, 0.08544921875, 2.109375, 4.13330078125, 6.1572265625, 8.18115234375, 10.205078125, 12.22900390625, 14.2529296875, 16.27685546875, 18.30078125, 20.32470703125, 22.3486328125, 24.37255859375, 26.396484375, 28.42041015625, 30.4443359375, 32.46826171875, 34.4921875, 36.51611328125, 38.5400390625, 40.56396484375, 42.587890625, 44.61181640625, 46.6357421875, 48.65966796875, 50.68359375, 52.70751953125, 54.7314453125, 56.75537109375, 58.779296875, 60.80322265625, 62.8271484375, 64.85107421875, 66.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 2.0, 6.0, 8.0, 11.0, 7.0, 14.0, 12.0, 17.0, 24.0, 19.0, 24.0, 27.0, 31.0, 25.0, 43.0, 33.0, 36.0, 46.0, 66.0, 279.0, 705.0, 130.0, 45.0, 37.0, 46.0, 44.0, 31.0, 32.0, 29.0, 34.0, 22.0, 24.0, 17.0, 16.0, 7.0, 17.0, 10.0, 10.0, 6.0, 7.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-99.0, -96.025390625, -93.05078125, -90.076171875, -87.1015625, -84.126953125, -81.15234375, -78.177734375, -75.203125, -72.228515625, -69.25390625, -66.279296875, -63.3046875, -60.330078125, -57.35546875, -54.380859375, -51.40625, -48.431640625, -45.45703125, -42.482421875, -39.5078125, -36.533203125, -33.55859375, -30.583984375, -27.609375, -24.634765625, -21.66015625, -18.685546875, -15.7109375, -12.736328125, -9.76171875, -6.787109375, -3.8125, -0.837890625, 2.13671875, 5.111328125, 8.0859375, 11.060546875, 14.03515625, 17.009765625, 19.984375, 22.958984375, 25.93359375, 28.908203125, 31.8828125, 34.857421875, 37.83203125, 40.806640625, 43.78125, 46.755859375, 49.73046875, 52.705078125, 55.6796875, 58.654296875, 61.62890625, 64.603515625, 67.578125, 70.552734375, 73.52734375, 76.501953125, 79.4765625, 82.451171875, 85.42578125, 88.400390625, 91.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 20.0, 109.0, 750.0, 83.0, 15.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1551.8057861328125, -1513.3818359375, -1474.957763671875, -1436.5338134765625, -1398.10986328125, -1359.6859130859375, -1321.261962890625, -1282.837890625, -1244.4139404296875, -1205.989990234375, -1167.56591796875, -1129.1419677734375, -1090.718017578125, -1052.2940673828125, -1013.8700561523438, -975.446044921875, -937.0220947265625, -898.59814453125, -860.1741333007812, -821.7501220703125, -783.326171875, -744.9022216796875, -706.4782104492188, -668.05419921875, -629.6302490234375, -591.206298828125, -552.7822875976562, -514.3582763671875, -475.934326171875, -437.5103454589844, -399.08636474609375, -360.6623840332031, -322.238525390625, -283.8145446777344, -245.39056396484375, -206.96658325195312, -168.5426025390625, -130.11862182617188, -91.69464111328125, -53.270660400390625, -14.8466796875, 23.577301025390625, 62.00128173828125, 100.42526245117188, 138.8492431640625, 177.27322387695312, 215.69720458984375, 254.12118530273438, 292.545166015625, 330.9691467285156, 369.39312744140625, 407.8171081542969, 446.2410888671875, 484.6650695800781, 523.0890502929688, 561.5130615234375, 599.93701171875, 638.3609619140625, 676.7849731445312, 715.208984375, 753.6329345703125, 792.056884765625, 830.4808959960938, 868.9049072265625, 907.328857421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 16.0, 17.0, 18.0, 26.0, 31.0, 76.0, 201.0, 243.0, 148.0, 72.0, 25.0, 19.0, 10.0, 13.0, 15.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-613.2197265625, -595.3973388671875, -577.574951171875, -559.7526245117188, -541.9302368164062, -524.1078491210938, -506.2854919433594, -488.463134765625, -470.6407470703125, -452.818359375, -434.9960021972656, -417.17364501953125, -399.35125732421875, -381.52886962890625, -363.7065124511719, -345.8841552734375, -328.061767578125, -310.2393798828125, -292.4170227050781, -274.59466552734375, -256.77227783203125, -238.9499053955078, -221.12753295898438, -203.30516052246094, -185.4827880859375, -167.66041564941406, -149.83804321289062, -132.0156707763672, -114.19329833984375, -96.37092590332031, -78.54855346679688, -60.72618103027344, -42.90380859375, -25.081436157226562, -7.259063720703125, 10.563308715820312, 28.38568115234375, 46.20805358886719, 64.03042602539062, 81.85279846191406, 99.6751708984375, 117.49754333496094, 135.31991577148438, 153.1422882080078, 170.96466064453125, 188.7870330810547, 206.60940551757812, 224.43177795410156, 242.254150390625, 260.0765380859375, 277.8988952636719, 295.72125244140625, 313.54364013671875, 331.36602783203125, 349.1883850097656, 367.0107421875, 384.8331298828125, 402.655517578125, 420.4778747558594, 438.30023193359375, 456.12261962890625, 473.94500732421875, 491.7673645019531, 509.5897216796875, 527.412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 16.0, 13.0, 14.0, 19.0, 34.0, 28.0, 53.0, 58.0, 98.0, 160.0, 182.0, 278.0, 415.0, 585.0, 904.0, 1510.0, 2471.0, 4378.0, 8911.0, 24156.0, 217378.0, 3872781.0, 36909.0, 11135.0, 5067.0, 2731.0, 1518.0, 889.0, 523.0, 337.0, 238.0, 172.0, 95.0, 71.0, 36.0, 27.0, 21.0, 12.0, 12.0, 14.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.3671875, -4.255645751953125, -4.14410400390625, -4.032562255859375, -3.9210205078125, -3.809478759765625, -3.69793701171875, -3.586395263671875, -3.474853515625, -3.363311767578125, -3.25177001953125, -3.140228271484375, -3.0286865234375, -2.917144775390625, -2.80560302734375, -2.694061279296875, -2.58251953125, -2.470977783203125, -2.35943603515625, -2.247894287109375, -2.1363525390625, -2.024810791015625, -1.91326904296875, -1.801727294921875, -1.690185546875, -1.578643798828125, -1.46710205078125, -1.355560302734375, -1.2440185546875, -1.132476806640625, -1.02093505859375, -0.909393310546875, -0.7978515625, -0.686309814453125, -0.57476806640625, -0.463226318359375, -0.3516845703125, -0.240142822265625, -0.12860107421875, -0.017059326171875, 0.094482421875, 0.206024169921875, 0.31756591796875, 0.429107666015625, 0.5406494140625, 0.652191162109375, 0.76373291015625, 0.875274658203125, 0.98681640625, 1.098358154296875, 1.20989990234375, 1.321441650390625, 1.4329833984375, 1.544525146484375, 1.65606689453125, 1.767608642578125, 1.879150390625, 1.990692138671875, 2.10223388671875, 2.213775634765625, 2.3253173828125, 2.436859130859375, 2.54840087890625, 2.659942626953125, 2.771484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 5.0, 4.0, 10.0, 13.0, 13.0, 7.0, 13.0, 359.0, 425.0, 14.0, 9.0, 13.0, 16.0, 6.0, 8.0, 7.0, 6.0, 2.0, 6.0, 2.0, 6.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59375, -1.5505523681640625, -1.507354736328125, -1.4641571044921875, -1.42095947265625, -1.3777618408203125, -1.334564208984375, -1.2913665771484375, -1.2481689453125, -1.2049713134765625, -1.161773681640625, -1.1185760498046875, -1.07537841796875, -1.0321807861328125, -0.988983154296875, -0.9457855224609375, -0.902587890625, -0.8593902587890625, -0.816192626953125, -0.7729949951171875, -0.72979736328125, -0.6865997314453125, -0.643402099609375, -0.6002044677734375, -0.5570068359375, -0.5138092041015625, -0.470611572265625, -0.4274139404296875, -0.38421630859375, -0.3410186767578125, -0.297821044921875, -0.2546234130859375, -0.21142578125, -0.1682281494140625, -0.125030517578125, -0.0818328857421875, -0.03863525390625, 0.0045623779296875, 0.047760009765625, 0.0909576416015625, 0.1341552734375, 0.1773529052734375, 0.220550537109375, 0.2637481689453125, 0.30694580078125, 0.3501434326171875, 0.393341064453125, 0.4365386962890625, 0.479736328125, 0.5229339599609375, 0.566131591796875, 0.6093292236328125, 0.65252685546875, 0.6957244873046875, 0.738922119140625, 0.7821197509765625, 0.8253173828125, 0.8685150146484375, 0.911712646484375, 0.9549102783203125, 0.99810791015625, 1.0413055419921875, 1.084503173828125, 1.1277008056640625, 1.1708984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 20.0, 25.0, 38.0, 71.0, 93.0, 173.0, 299.0, 547.0, 1139.0, 2731.0, 8497.0, 35099.0, 365108.0, 3658598.0, 95696.0, 17398.0, 5059.0, 1890.0, 825.0, 380.0, 220.0, 135.0, 83.0, 52.0, 33.0, 20.0, 10.0, 11.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-8.4375, -8.21099853515625, -7.9844970703125, -7.75799560546875, -7.531494140625, -7.30499267578125, -7.0784912109375, -6.85198974609375, -6.62548828125, -6.39898681640625, -6.1724853515625, -5.94598388671875, -5.719482421875, -5.49298095703125, -5.2664794921875, -5.03997802734375, -4.8134765625, -4.58697509765625, -4.3604736328125, -4.13397216796875, -3.907470703125, -3.68096923828125, -3.4544677734375, -3.22796630859375, -3.00146484375, -2.77496337890625, -2.5484619140625, -2.32196044921875, -2.095458984375, -1.86895751953125, -1.6424560546875, -1.41595458984375, -1.189453125, -0.96295166015625, -0.7364501953125, -0.50994873046875, -0.283447265625, -0.05694580078125, 0.1695556640625, 0.39605712890625, 0.62255859375, 0.84906005859375, 1.0755615234375, 1.30206298828125, 1.528564453125, 1.75506591796875, 1.9815673828125, 2.20806884765625, 2.4345703125, 2.66107177734375, 2.8875732421875, 3.11407470703125, 3.340576171875, 3.56707763671875, 3.7935791015625, 4.02008056640625, 4.24658203125, 4.47308349609375, 4.6995849609375, 4.92608642578125, 5.152587890625, 5.37908935546875, 5.6055908203125, 5.83209228515625, 6.05859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 12.0, 7.0, 14.0, 21.0, 30.0, 42.0, 69.0, 138.0, 308.0, 1779.0, 1027.0, 252.0, 119.0, 83.0, 56.0, 30.0, 19.0, 17.0, 9.0, 12.0, 7.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.584228515625, -2.51220703125, -2.440185546875, -2.3681640625, -2.296142578125, -2.22412109375, -2.152099609375, -2.080078125, -2.008056640625, -1.93603515625, -1.864013671875, -1.7919921875, -1.719970703125, -1.64794921875, -1.575927734375, -1.50390625, -1.431884765625, -1.35986328125, -1.287841796875, -1.2158203125, -1.143798828125, -1.07177734375, -0.999755859375, -0.927734375, -0.855712890625, -0.78369140625, -0.711669921875, -0.6396484375, -0.567626953125, -0.49560546875, -0.423583984375, -0.3515625, -0.279541015625, -0.20751953125, -0.135498046875, -0.0634765625, 0.008544921875, 0.08056640625, 0.152587890625, 0.224609375, 0.296630859375, 0.36865234375, 0.440673828125, 0.5126953125, 0.584716796875, 0.65673828125, 0.728759765625, 0.80078125, 0.872802734375, 0.94482421875, 1.016845703125, 1.0888671875, 1.160888671875, 1.23291015625, 1.304931640625, 1.376953125, 1.448974609375, 1.52099609375, 1.593017578125, 1.6650390625, 1.737060546875, 1.80908203125, 1.881103515625, 1.953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 18.0, 27.0, 51.0, 111.0, 225.0, 244.0, 161.0, 77.0, 33.0, 19.0, 10.0, 11.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.901721954345703, -11.459807395935059, -11.017892837524414, -10.575979232788086, -10.134064674377441, -9.692150115966797, -9.250235557556152, -8.808320999145508, -8.366406440734863, -7.924491882324219, -7.482577800750732, -7.040663242340088, -6.598748683929443, -6.156834602355957, -5.7149200439453125, -5.273005485534668, -4.831091403961182, -4.389176845550537, -3.9472625255584717, -3.5053482055664062, -3.0634336471557617, -2.6215193271636963, -2.179605007171631, -1.7376904487609863, -1.295776128768921, -0.8538616895675659, -0.4119473099708557, 0.029967069625854492, 0.4718815088272095, 0.9137959480285645, 1.3557102680206299, 1.7976248264312744, 2.23953914642334, 2.6814534664154053, 3.12336802482605, 3.5652823448181152, 4.00719690322876, 4.449110984802246, 4.891025543212891, 5.332940101623535, 5.77485466003418, 6.216769218444824, 6.6586833000183105, 7.100597858428955, 7.5425124168396, 7.984426498413086, 8.42634105682373, 8.868255615234375, 9.310169219970703, 9.752083778381348, 10.193998336791992, 10.63591194152832, 11.077826499938965, 11.51974105834961, 11.961655616760254, 12.403570175170898, 12.845484733581543, 13.287399291992188, 13.729313850402832, 14.171228408813477, 14.613142013549805, 15.05505657196045, 15.496971130371094, 15.938885688781738, 16.380800247192383]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 4.0, 9.0, 10.0, 11.0, 15.0, 19.0, 18.0, 26.0, 31.0, 48.0, 60.0, 53.0, 70.0, 56.0, 56.0, 68.0, 54.0, 50.0, 55.0, 45.0, 41.0, 42.0, 33.0, 26.0, 20.0, 18.0, 14.0, 14.0, 11.0, 9.0, 10.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.608412742614746, -5.394190311431885, -5.179967403411865, -4.965744972229004, -4.751522541046143, -4.537300109863281, -4.323077201843262, -4.1088547706604, -3.894632339477539, -3.6804096698760986, -3.4661872386932373, -3.251964569091797, -3.0377421379089355, -2.823519468307495, -2.6092967987060547, -2.3950743675231934, -2.180851697921753, -1.966629147529602, -1.7524065971374512, -1.5381839275360107, -1.3239614963531494, -1.109738826751709, -0.8955162763595581, -0.6812937259674072, -0.46707117557525635, -0.25284862518310547, -0.0386260449886322, 0.17559653520584106, 0.38981908559799194, 0.6040416955947876, 0.8182642459869385, 1.0324867963790894, 1.2467093467712402, 1.4609318971633911, 1.675154447555542, 1.8893771171569824, 2.1035995483398438, 2.317822217941284, 2.5320448875427246, 2.746267318725586, 2.9604897499084473, 3.1747124195098877, 3.388934850692749, 3.6031575202941895, 3.817379951477051, 4.03160285949707, 4.245825290679932, 4.460047721862793, 4.6742706298828125, 4.888493061065674, 5.102715969085693, 5.316938400268555, 5.531160831451416, 5.745383262634277, 5.959606170654297, 6.173828601837158, 6.3880510330200195, 6.602273464202881, 6.8164963722229, 7.030718803405762, 7.244941234588623, 7.459163665771484, 7.673386573791504, 7.887609004974365, 8.101831436157227]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 7.0, 5.0, 11.0, 9.0, 19.0, 37.0, 44.0, 69.0, 89.0, 139.0, 206.0, 277.0, 450.0, 642.0, 965.0, 1627.0, 2458.0, 3771.0, 6410.0, 10569.0, 18903.0, 38092.0, 822589.0, 80870.0, 25236.0, 13774.0, 7921.0, 4802.0, 3043.0, 1899.0, 1193.0, 829.0, 519.0, 312.0, 242.0, 171.0, 105.0, 68.0, 54.0, 41.0, 26.0, 22.0, 4.0, 9.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.091796875, -2.98779296875, -2.8837890625, -2.77978515625, -2.67578125, -2.57177734375, -2.4677734375, -2.36376953125, -2.259765625, -2.15576171875, -2.0517578125, -1.94775390625, -1.84375, -1.73974609375, -1.6357421875, -1.53173828125, -1.427734375, -1.32373046875, -1.2197265625, -1.11572265625, -1.01171875, -0.90771484375, -0.8037109375, -0.69970703125, -0.595703125, -0.49169921875, -0.3876953125, -0.28369140625, -0.1796875, -0.07568359375, 0.0283203125, 0.13232421875, 0.236328125, 0.34033203125, 0.4443359375, 0.54833984375, 0.65234375, 0.75634765625, 0.8603515625, 0.96435546875, 1.068359375, 1.17236328125, 1.2763671875, 1.38037109375, 1.484375, 1.58837890625, 1.6923828125, 1.79638671875, 1.900390625, 2.00439453125, 2.1083984375, 2.21240234375, 2.31640625, 2.42041015625, 2.5244140625, 2.62841796875, 2.732421875, 2.83642578125, 2.9404296875, 3.04443359375, 3.1484375, 3.25244140625, 3.3564453125, 3.46044921875, 3.564453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 1.0, 5.0, 8.0, 2.0, 5.0, 5.0, 8.0, 7.0, 10.0, 6.0, 13.0, 12.0, 20.0, 357.0, 407.0, 28.0, 13.0, 9.0, 11.0, 11.0, 10.0, 6.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7236328125, -1.67816162109375, -1.6326904296875, -1.58721923828125, -1.541748046875, -1.49627685546875, -1.4508056640625, -1.40533447265625, -1.35986328125, -1.31439208984375, -1.2689208984375, -1.22344970703125, -1.177978515625, -1.13250732421875, -1.0870361328125, -1.04156494140625, -0.99609375, -0.95062255859375, -0.9051513671875, -0.85968017578125, -0.814208984375, -0.76873779296875, -0.7232666015625, -0.67779541015625, -0.63232421875, -0.58685302734375, -0.5413818359375, -0.49591064453125, -0.450439453125, -0.40496826171875, -0.3594970703125, -0.31402587890625, -0.2685546875, -0.22308349609375, -0.1776123046875, -0.13214111328125, -0.086669921875, -0.04119873046875, 0.0042724609375, 0.04974365234375, 0.09521484375, 0.14068603515625, 0.1861572265625, 0.23162841796875, 0.277099609375, 0.32257080078125, 0.3680419921875, 0.41351318359375, 0.458984375, 0.50445556640625, 0.5499267578125, 0.59539794921875, 0.640869140625, 0.68634033203125, 0.7318115234375, 0.77728271484375, 0.82275390625, 0.86822509765625, 0.9136962890625, 0.95916748046875, 1.004638671875, 1.05010986328125, 1.0955810546875, 1.14105224609375, 1.1865234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 4.0, 9.0, 11.0, 11.0, 19.0, 20.0, 28.0, 24.0, 37.0, 62.0, 75.0, 107.0, 125.0, 187.0, 285.0, 512.0, 988.0, 1820.0, 4015.0, 9121.0, 24217.0, 76149.0, 319819.0, 449685.0, 107714.0, 31950.0, 11698.0, 4796.0, 2157.0, 1111.0, 641.0, 327.0, 220.0, 153.0, 87.0, 81.0, 70.0, 51.0, 34.0, 29.0, 39.0, 19.0, 12.0, 7.0, 9.0, 6.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.43359375, -3.32330322265625, -3.2130126953125, -3.10272216796875, -2.992431640625, -2.88214111328125, -2.7718505859375, -2.66156005859375, -2.55126953125, -2.44097900390625, -2.3306884765625, -2.22039794921875, -2.110107421875, -1.99981689453125, -1.8895263671875, -1.77923583984375, -1.6689453125, -1.55865478515625, -1.4483642578125, -1.33807373046875, -1.227783203125, -1.11749267578125, -1.0072021484375, -0.89691162109375, -0.78662109375, -0.67633056640625, -0.5660400390625, -0.45574951171875, -0.345458984375, -0.23516845703125, -0.1248779296875, -0.01458740234375, 0.095703125, 0.20599365234375, 0.3162841796875, 0.42657470703125, 0.536865234375, 0.64715576171875, 0.7574462890625, 0.86773681640625, 0.97802734375, 1.08831787109375, 1.1986083984375, 1.30889892578125, 1.419189453125, 1.52947998046875, 1.6397705078125, 1.75006103515625, 1.8603515625, 1.97064208984375, 2.0809326171875, 2.19122314453125, 2.301513671875, 2.41180419921875, 2.5220947265625, 2.63238525390625, 2.74267578125, 2.85296630859375, 2.9632568359375, 3.07354736328125, 3.183837890625, 3.29412841796875, 3.4044189453125, 3.51470947265625, 3.625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 6.0, 9.0, 11.0, 14.0, 13.0, 15.0, 14.0, 26.0, 26.0, 26.0, 22.0, 36.0, 27.0, 50.0, 40.0, 33.0, 39.0, 34.0, 51.0, 40.0, 40.0, 35.0, 46.0, 31.0, 36.0, 27.0, 29.0, 38.0, 31.0, 29.0, 18.0, 14.0, 21.0, 12.0, 10.0, 9.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.81610107421875, -5.6361083984375, -5.45611572265625, -5.276123046875, -5.09613037109375, -4.9161376953125, -4.73614501953125, -4.55615234375, -4.37615966796875, -4.1961669921875, -4.01617431640625, -3.836181640625, -3.65618896484375, -3.4761962890625, -3.29620361328125, -3.1162109375, -2.93621826171875, -2.7562255859375, -2.57623291015625, -2.396240234375, -2.21624755859375, -2.0362548828125, -1.85626220703125, -1.67626953125, -1.49627685546875, -1.3162841796875, -1.13629150390625, -0.956298828125, -0.77630615234375, -0.5963134765625, -0.41632080078125, -0.236328125, -0.05633544921875, 0.1236572265625, 0.30364990234375, 0.483642578125, 0.66363525390625, 0.8436279296875, 1.02362060546875, 1.20361328125, 1.38360595703125, 1.5635986328125, 1.74359130859375, 1.923583984375, 2.10357666015625, 2.2835693359375, 2.46356201171875, 2.6435546875, 2.82354736328125, 3.0035400390625, 3.18353271484375, 3.363525390625, 3.54351806640625, 3.7235107421875, 3.90350341796875, 4.08349609375, 4.26348876953125, 4.4434814453125, 4.62347412109375, 4.803466796875, 4.98345947265625, 5.1634521484375, 5.34344482421875, 5.5234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 5.0, 10.0, 12.0, 24.0, 34.0, 57.0, 78.0, 93.0, 143.0, 235.0, 394.0, 633.0, 1179.0, 2302.0, 5090.0, 13431.0, 48191.0, 270333.0, 565702.0, 102408.0, 23333.0, 7880.0, 3249.0, 1570.0, 789.0, 474.0, 295.0, 167.0, 134.0, 79.0, 51.0, 50.0, 33.0, 23.0, 13.0, 12.0, 3.0, 8.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.642578125, -3.525970458984375, -3.40936279296875, -3.292755126953125, -3.1761474609375, -3.059539794921875, -2.94293212890625, -2.826324462890625, -2.709716796875, -2.593109130859375, -2.47650146484375, -2.359893798828125, -2.2432861328125, -2.126678466796875, -2.01007080078125, -1.893463134765625, -1.77685546875, -1.660247802734375, -1.54364013671875, -1.427032470703125, -1.3104248046875, -1.193817138671875, -1.07720947265625, -0.960601806640625, -0.843994140625, -0.727386474609375, -0.61077880859375, -0.494171142578125, -0.3775634765625, -0.260955810546875, -0.14434814453125, -0.027740478515625, 0.0888671875, 0.205474853515625, 0.32208251953125, 0.438690185546875, 0.5552978515625, 0.671905517578125, 0.78851318359375, 0.905120849609375, 1.021728515625, 1.138336181640625, 1.25494384765625, 1.371551513671875, 1.4881591796875, 1.604766845703125, 1.72137451171875, 1.837982177734375, 1.95458984375, 2.071197509765625, 2.18780517578125, 2.304412841796875, 2.4210205078125, 2.537628173828125, 2.65423583984375, 2.770843505859375, 2.887451171875, 3.004058837890625, 3.12066650390625, 3.237274169921875, 3.3538818359375, 3.470489501953125, 3.58709716796875, 3.703704833984375, 3.8203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 14.0, 24.0, 38.0, 34.0, 56.0, 65.0, 85.0, 79.0, 100.0, 115.0, 79.0, 76.0, 54.0, 31.0, 34.0, 21.0, 13.0, 19.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002357959747314453, -0.00022902898490428925, -0.00022226199507713318, -0.0002154950052499771, -0.00020872801542282104, -0.00020196102559566498, -0.0001951940357685089, -0.00018842704594135284, -0.00018166005611419678, -0.0001748930662870407, -0.00016812607645988464, -0.00016135908663272858, -0.0001545920968055725, -0.00014782510697841644, -0.00014105811715126038, -0.0001342911273241043, -0.00012752413749694824, -0.00012075714766979218, -0.00011399015784263611, -0.00010722316801548004, -0.00010045617818832397, -9.368918836116791e-05, -8.692219853401184e-05, -8.015520870685577e-05, -7.338821887969971e-05, -6.662122905254364e-05, -5.985423922538757e-05, -5.3087249398231506e-05, -4.632025957107544e-05, -3.955326974391937e-05, -3.2786279916763306e-05, -2.601929008960724e-05, -1.9252300262451172e-05, -1.2485310435295105e-05, -5.718320608139038e-06, 1.0486692190170288e-06, 7.815659046173096e-06, 1.4582648873329163e-05, 2.134963870048523e-05, 2.8116628527641296e-05, 3.488361835479736e-05, 4.165060818195343e-05, 4.84175980091095e-05, 5.5184587836265564e-05, 6.195157766342163e-05, 6.87185674905777e-05, 7.548555731773376e-05, 8.225254714488983e-05, 8.90195369720459e-05, 9.578652679920197e-05, 0.00010255351662635803, 0.0001093205064535141, 0.00011608749628067017, 0.00012285448610782623, 0.0001296214759349823, 0.00013638846576213837, 0.00014315545558929443, 0.0001499224454164505, 0.00015668943524360657, 0.00016345642507076263, 0.0001702234148979187, 0.00017699040472507477, 0.00018375739455223083, 0.0001905243843793869, 0.00019729137420654297]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 18.0, 33.0, 26.0, 41.0, 71.0, 111.0, 141.0, 268.0, 458.0, 823.0, 1585.0, 3690.0, 9222.0, 30927.0, 151174.0, 615077.0, 181762.0, 35064.0, 10134.0, 3962.0, 1788.0, 932.0, 462.0, 263.0, 166.0, 110.0, 73.0, 43.0, 34.0, 14.0, 20.0, 9.0, 8.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-4.15234375, -4.01641845703125, -3.8804931640625, -3.74456787109375, -3.608642578125, -3.47271728515625, -3.3367919921875, -3.20086669921875, -3.06494140625, -2.92901611328125, -2.7930908203125, -2.65716552734375, -2.521240234375, -2.38531494140625, -2.2493896484375, -2.11346435546875, -1.9775390625, -1.84161376953125, -1.7056884765625, -1.56976318359375, -1.433837890625, -1.29791259765625, -1.1619873046875, -1.02606201171875, -0.89013671875, -0.75421142578125, -0.6182861328125, -0.48236083984375, -0.346435546875, -0.21051025390625, -0.0745849609375, 0.06134033203125, 0.197265625, 0.33319091796875, 0.4691162109375, 0.60504150390625, 0.740966796875, 0.87689208984375, 1.0128173828125, 1.14874267578125, 1.28466796875, 1.42059326171875, 1.5565185546875, 1.69244384765625, 1.828369140625, 1.96429443359375, 2.1002197265625, 2.23614501953125, 2.3720703125, 2.50799560546875, 2.6439208984375, 2.77984619140625, 2.915771484375, 3.05169677734375, 3.1876220703125, 3.32354736328125, 3.45947265625, 3.59539794921875, 3.7313232421875, 3.86724853515625, 4.003173828125, 4.13909912109375, 4.2750244140625, 4.41094970703125, 4.546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 7.0, 4.0, 2.0, 1.0, 6.0, 6.0, 9.0, 12.0, 13.0, 27.0, 20.0, 33.0, 38.0, 61.0, 55.0, 78.0, 57.0, 82.0, 86.0, 77.0, 53.0, 63.0, 41.0, 41.0, 28.0, 31.0, 16.0, 16.0, 7.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.377899169921875, -3.27142333984375, -3.164947509765625, -3.0584716796875, -2.951995849609375, -2.84552001953125, -2.739044189453125, -2.632568359375, -2.526092529296875, -2.41961669921875, -2.313140869140625, -2.2066650390625, -2.100189208984375, -1.99371337890625, -1.887237548828125, -1.78076171875, -1.674285888671875, -1.56781005859375, -1.461334228515625, -1.3548583984375, -1.248382568359375, -1.14190673828125, -1.035430908203125, -0.928955078125, -0.822479248046875, -0.71600341796875, -0.609527587890625, -0.5030517578125, -0.396575927734375, -0.29010009765625, -0.183624267578125, -0.0771484375, 0.029327392578125, 0.13580322265625, 0.242279052734375, 0.3487548828125, 0.455230712890625, 0.56170654296875, 0.668182373046875, 0.774658203125, 0.881134033203125, 0.98760986328125, 1.094085693359375, 1.2005615234375, 1.307037353515625, 1.41351318359375, 1.519989013671875, 1.62646484375, 1.732940673828125, 1.83941650390625, 1.945892333984375, 2.0523681640625, 2.158843994140625, 2.26531982421875, 2.371795654296875, 2.478271484375, 2.584747314453125, 2.69122314453125, 2.797698974609375, 2.9041748046875, 3.010650634765625, 3.11712646484375, 3.223602294921875, 3.330078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 26.0, 76.0, 264.0, 383.0, 137.0, 50.0, 20.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-108.98988342285156, -106.40969848632812, -103.82950592041016, -101.24932098388672, -98.66912841796875, -96.08894348144531, -93.50875091552734, -90.9285659790039, -88.34837341308594, -85.7681884765625, -83.18799591064453, -80.6078109741211, -78.02761840820312, -75.44743347167969, -72.86724090576172, -70.28705596923828, -67.70687103271484, -65.1266860961914, -62.54649353027344, -59.966304779052734, -57.38611602783203, -54.805931091308594, -52.22574234008789, -49.64555358886719, -47.065364837646484, -44.48517608642578, -41.90498733520508, -39.324798583984375, -36.74461364746094, -34.16442108154297, -31.58423614501953, -29.004047393798828, -26.423851013183594, -23.84366226196289, -21.263473510742188, -18.683286666870117, -16.103097915649414, -13.522909164428711, -10.942721366882324, -8.362533569335938, -5.782344818115234, -3.2021565437316895, -0.6219682693481445, 1.9582200050354004, 4.538408279418945, 7.118597030639648, 9.698784828186035, 12.278972625732422, 14.859161376953125, 17.439350128173828, 20.01953887939453, 22.5997257232666, 25.179914474487305, 27.760103225708008, 30.340290069580078, 32.92047882080078, 35.500667572021484, 38.08085632324219, 40.66104507446289, 43.241233825683594, 45.82141876220703, 48.401611328125, 50.98179626464844, 53.56198501586914, 56.142173767089844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 5.0, 7.0, 4.0, 13.0, 13.0, 14.0, 33.0, 61.0, 96.0, 111.0, 181.0, 151.0, 103.0, 49.0, 38.0, 27.0, 14.0, 13.0, 7.0, 7.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-117.9508285522461, -114.4417953491211, -110.93275451660156, -107.42372131347656, -103.91468811035156, -100.40565490722656, -96.89661407470703, -93.38758087158203, -89.8785400390625, -86.3695068359375, -82.86046600341797, -79.35143280029297, -75.84239959716797, -72.33335876464844, -68.82432556152344, -65.31529235839844, -61.80625915527344, -58.29722213745117, -54.78818893432617, -51.279151916503906, -47.770118713378906, -44.26108169555664, -40.752044677734375, -37.243011474609375, -33.73397445678711, -30.224939346313477, -26.715904235839844, -23.206867218017578, -19.697832107543945, -16.188796997070312, -12.679759979248047, -9.170724868774414, -5.66168212890625, -2.152646541595459, 1.356389045715332, 4.865425109863281, 8.374460220336914, 11.883495330810547, 15.392532348632812, 18.901567459106445, 22.410602569580078, 25.91963768005371, 29.428672790527344, 32.93770980834961, 36.446746826171875, 39.955780029296875, 43.46481704711914, 46.973854064941406, 50.482887268066406, 53.99192428588867, 57.50095748901367, 61.00999450683594, 64.51902770996094, 68.02806091308594, 71.53710174560547, 75.04613494873047, 78.55517578125, 82.064208984375, 85.57324981689453, 89.08228302001953, 92.59131622314453, 96.10035705566406, 99.60939025878906, 103.11842346191406, 106.62745666503906]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 14.0, 18.0, 18.0, 28.0, 32.0, 50.0, 92.0, 133.0, 205.0, 321.0, 459.0, 826.0, 1204.0, 2034.0, 3607.0, 6870.0, 15675.0, 53143.0, 3891423.0, 173213.0, 25340.0, 9229.0, 4451.0, 2299.0, 1317.0, 871.0, 501.0, 316.0, 196.0, 112.0, 79.0, 50.0, 41.0, 30.0, 17.0, 9.0, 7.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.2381591796875, -11.913818359375, -11.5894775390625, -11.26513671875, -10.9407958984375, -10.616455078125, -10.2921142578125, -9.9677734375, -9.6434326171875, -9.319091796875, -8.9947509765625, -8.67041015625, -8.3460693359375, -8.021728515625, -7.6973876953125, -7.373046875, -7.0487060546875, -6.724365234375, -6.4000244140625, -6.07568359375, -5.7513427734375, -5.427001953125, -5.1026611328125, -4.7783203125, -4.4539794921875, -4.129638671875, -3.8052978515625, -3.48095703125, -3.1566162109375, -2.832275390625, -2.5079345703125, -2.18359375, -1.8592529296875, -1.534912109375, -1.2105712890625, -0.88623046875, -0.5618896484375, -0.237548828125, 0.0867919921875, 0.4111328125, 0.7354736328125, 1.059814453125, 1.3841552734375, 1.70849609375, 2.0328369140625, 2.357177734375, 2.6815185546875, 3.005859375, 3.3302001953125, 3.654541015625, 3.9788818359375, 4.30322265625, 4.6275634765625, 4.951904296875, 5.2762451171875, 5.6005859375, 5.9249267578125, 6.249267578125, 6.5736083984375, 6.89794921875, 7.2222900390625, 7.546630859375, 7.8709716796875, 8.1953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 7.0, 1.0, 9.0, 10.0, 14.0, 15.0, 34.0, 118.0, 303.0, 268.0, 91.0, 30.0, 19.0, 18.0, 12.0, 10.0, 5.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.557342529296875, -1.51507568359375, -1.472808837890625, -1.4305419921875, -1.388275146484375, -1.34600830078125, -1.303741455078125, -1.261474609375, -1.219207763671875, -1.17694091796875, -1.134674072265625, -1.0924072265625, -1.050140380859375, -1.00787353515625, -0.965606689453125, -0.92333984375, -0.881072998046875, -0.83880615234375, -0.796539306640625, -0.7542724609375, -0.712005615234375, -0.66973876953125, -0.627471923828125, -0.585205078125, -0.542938232421875, -0.50067138671875, -0.458404541015625, -0.4161376953125, -0.373870849609375, -0.33160400390625, -0.289337158203125, -0.2470703125, -0.204803466796875, -0.16253662109375, -0.120269775390625, -0.0780029296875, -0.035736083984375, 0.00653076171875, 0.048797607421875, 0.091064453125, 0.133331298828125, 0.17559814453125, 0.217864990234375, 0.2601318359375, 0.302398681640625, 0.34466552734375, 0.386932373046875, 0.42919921875, 0.471466064453125, 0.51373291015625, 0.555999755859375, 0.5982666015625, 0.640533447265625, 0.68280029296875, 0.725067138671875, 0.767333984375, 0.809600830078125, 0.85186767578125, 0.894134521484375, 0.9364013671875, 0.978668212890625, 1.02093505859375, 1.063201904296875, 1.10546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 15.0, 19.0, 39.0, 59.0, 86.0, 134.0, 253.0, 448.0, 835.0, 1773.0, 3754.0, 8830.0, 23859.0, 88629.0, 2599404.0, 1346608.0, 81207.0, 22474.0, 8545.0, 3673.0, 1717.0, 805.0, 424.0, 238.0, 153.0, 108.0, 40.0, 34.0, 30.0, 16.0, 12.0, 7.0, 5.0, 6.0, 5.0, 3.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.2890625, -8.02978515625, -7.7705078125, -7.51123046875, -7.251953125, -6.99267578125, -6.7333984375, -6.47412109375, -6.21484375, -5.95556640625, -5.6962890625, -5.43701171875, -5.177734375, -4.91845703125, -4.6591796875, -4.39990234375, -4.140625, -3.88134765625, -3.6220703125, -3.36279296875, -3.103515625, -2.84423828125, -2.5849609375, -2.32568359375, -2.06640625, -1.80712890625, -1.5478515625, -1.28857421875, -1.029296875, -0.77001953125, -0.5107421875, -0.25146484375, 0.0078125, 0.26708984375, 0.5263671875, 0.78564453125, 1.044921875, 1.30419921875, 1.5634765625, 1.82275390625, 2.08203125, 2.34130859375, 2.6005859375, 2.85986328125, 3.119140625, 3.37841796875, 3.6376953125, 3.89697265625, 4.15625, 4.41552734375, 4.6748046875, 4.93408203125, 5.193359375, 5.45263671875, 5.7119140625, 5.97119140625, 6.23046875, 6.48974609375, 6.7490234375, 7.00830078125, 7.267578125, 7.52685546875, 7.7861328125, 8.04541015625, 8.3046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 7.0, 5.0, 8.0, 15.0, 13.0, 13.0, 21.0, 28.0, 34.0, 52.0, 95.0, 99.0, 161.0, 376.0, 1479.0, 789.0, 273.0, 181.0, 121.0, 69.0, 54.0, 35.0, 27.0, 29.0, 15.0, 10.0, 13.0, 10.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9731292724609375, -0.939422607421875, -0.9057159423828125, -0.87200927734375, -0.8383026123046875, -0.804595947265625, -0.7708892822265625, -0.7371826171875, -0.7034759521484375, -0.669769287109375, -0.6360626220703125, -0.60235595703125, -0.5686492919921875, -0.534942626953125, -0.5012359619140625, -0.467529296875, -0.4338226318359375, -0.400115966796875, -0.3664093017578125, -0.33270263671875, -0.2989959716796875, -0.265289306640625, -0.2315826416015625, -0.1978759765625, -0.1641693115234375, -0.130462646484375, -0.0967559814453125, -0.06304931640625, -0.0293426513671875, 0.004364013671875, 0.0380706787109375, 0.07177734375, 0.1054840087890625, 0.139190673828125, 0.1728973388671875, 0.20660400390625, 0.2403106689453125, 0.274017333984375, 0.3077239990234375, 0.3414306640625, 0.3751373291015625, 0.408843994140625, 0.4425506591796875, 0.47625732421875, 0.5099639892578125, 0.543670654296875, 0.5773773193359375, 0.611083984375, 0.6447906494140625, 0.678497314453125, 0.7122039794921875, 0.74591064453125, 0.7796173095703125, 0.813323974609375, 0.8470306396484375, 0.8807373046875, 0.9144439697265625, 0.948150634765625, 0.9818572998046875, 1.01556396484375, 1.0492706298828125, 1.082977294921875, 1.1166839599609375, 1.150390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 33.0, 123.0, 309.0, 333.0, 127.0, 34.0, 18.0, 10.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.074148178100586, -8.534034729003906, -7.993920803070068, -7.4538068771362305, -6.913693428039551, -6.373579978942871, -5.833466053009033, -5.293352127075195, -4.753238677978516, -4.213125228881836, -3.673011302947998, -3.1328976154327393, -2.5927839279174805, -2.0526702404022217, -1.512556552886963, -0.9724428653717041, -0.4323291778564453, 0.10778450965881348, 0.6478981971740723, 1.188011884689331, 1.7281255722045898, 2.2682392597198486, 2.8083529472351074, 3.348466634750366, 3.888580322265625, 4.428693771362305, 4.968807697296143, 5.5089216232299805, 6.04903507232666, 6.58914852142334, 7.129262447357178, 7.669376373291016, 8.209491729736328, 8.749605178833008, 9.289718627929688, 9.829833030700684, 10.369946479797363, 10.910059928894043, 11.450174331665039, 11.990287780761719, 12.530401229858398, 13.070514678955078, 13.610628128051758, 14.150742530822754, 14.690855979919434, 15.230969429016113, 15.77108383178711, 16.31119728088379, 16.85131072998047, 17.39142417907715, 17.931537628173828, 18.471651077270508, 19.011764526367188, 19.5518798828125, 20.09199333190918, 20.63210678100586, 21.17222023010254, 21.71233367919922, 22.2524471282959, 22.792560577392578, 23.33267593383789, 23.87278938293457, 24.41290283203125, 24.95301628112793, 25.49312973022461]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 17.0, 18.0, 14.0, 21.0, 16.0, 30.0, 36.0, 33.0, 52.0, 53.0, 62.0, 52.0, 76.0, 60.0, 56.0, 50.0, 45.0, 43.0, 43.0, 29.0, 39.0, 33.0, 19.0, 19.0, 17.0, 12.0, 8.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.030237197875977, -4.88551664352417, -4.7407965660095215, -4.596076011657715, -4.451355934143066, -4.30663537979126, -4.161914825439453, -4.017194747924805, -3.872474193572998, -3.7277538776397705, -3.583033561706543, -3.4383130073547363, -3.293592691421509, -3.1488723754882812, -3.0041518211364746, -2.859431505203247, -2.7147111892700195, -2.569990873336792, -2.4252705574035645, -2.280550003051758, -2.1358296871185303, -1.9911093711853027, -1.8463889360427856, -1.7016685009002686, -1.556948184967041, -1.4122278690338135, -1.2675074338912964, -1.1227869987487793, -0.9780666828155518, -0.8333463072776794, -0.6886259317398071, -0.54390549659729, -0.3991847038269043, -0.254464328289032, -0.10974395275115967, 0.034976422786712646, 0.17969679832458496, 0.3244171738624573, 0.4691375494003296, 0.6138579845428467, 0.7585783004760742, 0.9032986760139465, 1.0480190515518188, 1.192739486694336, 1.3374598026275635, 1.482180118560791, 1.626900553703308, 1.7716209888458252, 1.9163413047790527, 2.0610616207122803, 2.205781936645508, 2.3505024909973145, 2.495222806930542, 2.6399431228637695, 2.784663677215576, 2.9293839931488037, 3.0741043090820312, 3.218824625015259, 3.3635449409484863, 3.508265495300293, 3.6529858112335205, 3.797706127166748, 3.9424266815185547, 4.087146759033203, 4.23186731338501]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 13.0, 8.0, 12.0, 20.0, 36.0, 58.0, 84.0, 113.0, 173.0, 259.0, 477.0, 714.0, 1437.0, 2643.0, 5942.0, 15444.0, 59571.0, 825146.0, 102349.0, 19642.0, 7307.0, 3262.0, 1586.0, 838.0, 514.0, 292.0, 185.0, 136.0, 87.0, 60.0, 32.0, 38.0, 18.0, 13.0, 14.0, 3.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.5234375, -8.2620849609375, -8.000732421875, -7.7393798828125, -7.47802734375, -7.2166748046875, -6.955322265625, -6.6939697265625, -6.4326171875, -6.1712646484375, -5.909912109375, -5.6485595703125, -5.38720703125, -5.1258544921875, -4.864501953125, -4.6031494140625, -4.341796875, -4.0804443359375, -3.819091796875, -3.5577392578125, -3.29638671875, -3.0350341796875, -2.773681640625, -2.5123291015625, -2.2509765625, -1.9896240234375, -1.728271484375, -1.4669189453125, -1.20556640625, -0.9442138671875, -0.682861328125, -0.4215087890625, -0.16015625, 0.1011962890625, 0.362548828125, 0.6239013671875, 0.88525390625, 1.1466064453125, 1.407958984375, 1.6693115234375, 1.9306640625, 2.1920166015625, 2.453369140625, 2.7147216796875, 2.97607421875, 3.2374267578125, 3.498779296875, 3.7601318359375, 4.021484375, 4.2828369140625, 4.544189453125, 4.8055419921875, 5.06689453125, 5.3282470703125, 5.589599609375, 5.8509521484375, 6.1123046875, 6.3736572265625, 6.635009765625, 6.8963623046875, 7.15771484375, 7.4190673828125, 7.680419921875, 7.9417724609375, 8.203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 5.0, 5.0, 4.0, 8.0, 13.0, 8.0, 20.0, 31.0, 92.0, 221.0, 265.0, 145.0, 74.0, 24.0, 29.0, 10.0, 8.0, 7.0, 4.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5263671875, -1.4874725341796875, -1.448577880859375, -1.4096832275390625, -1.37078857421875, -1.3318939208984375, -1.292999267578125, -1.2541046142578125, -1.2152099609375, -1.1763153076171875, -1.137420654296875, -1.0985260009765625, -1.05963134765625, -1.0207366943359375, -0.981842041015625, -0.9429473876953125, -0.904052734375, -0.8651580810546875, -0.826263427734375, -0.7873687744140625, -0.74847412109375, -0.7095794677734375, -0.670684814453125, -0.6317901611328125, -0.5928955078125, -0.5540008544921875, -0.515106201171875, -0.4762115478515625, -0.43731689453125, -0.3984222412109375, -0.359527587890625, -0.3206329345703125, -0.28173828125, -0.2428436279296875, -0.203948974609375, -0.1650543212890625, -0.12615966796875, -0.0872650146484375, -0.048370361328125, -0.0094757080078125, 0.0294189453125, 0.0683135986328125, 0.107208251953125, 0.1461029052734375, 0.18499755859375, 0.2238922119140625, 0.262786865234375, 0.3016815185546875, 0.340576171875, 0.3794708251953125, 0.418365478515625, 0.4572601318359375, 0.49615478515625, 0.5350494384765625, 0.573944091796875, 0.6128387451171875, 0.6517333984375, 0.6906280517578125, 0.729522705078125, 0.7684173583984375, 0.80731201171875, 0.8462066650390625, 0.885101318359375, 0.9239959716796875, 0.962890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 8.0, 2.0, 8.0, 4.0, 11.0, 22.0, 27.0, 50.0, 78.0, 139.0, 247.0, 481.0, 1158.0, 3273.0, 12192.0, 88634.0, 783476.0, 135865.0, 16266.0, 3897.0, 1483.0, 601.0, 264.0, 137.0, 81.0, 54.0, 39.0, 23.0, 13.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.58245849609375, -6.3250732421875, -6.06768798828125, -5.810302734375, -5.55291748046875, -5.2955322265625, -5.03814697265625, -4.78076171875, -4.52337646484375, -4.2659912109375, -4.00860595703125, -3.751220703125, -3.49383544921875, -3.2364501953125, -2.97906494140625, -2.7216796875, -2.46429443359375, -2.2069091796875, -1.94952392578125, -1.692138671875, -1.43475341796875, -1.1773681640625, -0.91998291015625, -0.66259765625, -0.40521240234375, -0.1478271484375, 0.10955810546875, 0.366943359375, 0.62432861328125, 0.8817138671875, 1.13909912109375, 1.396484375, 1.65386962890625, 1.9112548828125, 2.16864013671875, 2.426025390625, 2.68341064453125, 2.9407958984375, 3.19818115234375, 3.45556640625, 3.71295166015625, 3.9703369140625, 4.22772216796875, 4.485107421875, 4.74249267578125, 4.9998779296875, 5.25726318359375, 5.5146484375, 5.77203369140625, 6.0294189453125, 6.28680419921875, 6.544189453125, 6.80157470703125, 7.0589599609375, 7.31634521484375, 7.57373046875, 7.83111572265625, 8.0885009765625, 8.34588623046875, 8.603271484375, 8.86065673828125, 9.1180419921875, 9.37542724609375, 9.6328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 12.0, 6.0, 15.0, 31.0, 28.0, 39.0, 33.0, 40.0, 48.0, 64.0, 68.0, 62.0, 65.0, 50.0, 75.0, 48.0, 56.0, 54.0, 48.0, 29.0, 23.0, 19.0, 23.0, 13.0, 11.0, 14.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.809234619140625, -3.67510986328125, -3.540985107421875, -3.4068603515625, -3.272735595703125, -3.13861083984375, -3.004486083984375, -2.870361328125, -2.736236572265625, -2.60211181640625, -2.467987060546875, -2.3338623046875, -2.199737548828125, -2.06561279296875, -1.931488037109375, -1.79736328125, -1.663238525390625, -1.52911376953125, -1.394989013671875, -1.2608642578125, -1.126739501953125, -0.99261474609375, -0.858489990234375, -0.724365234375, -0.590240478515625, -0.45611572265625, -0.321990966796875, -0.1878662109375, -0.053741455078125, 0.08038330078125, 0.214508056640625, 0.3486328125, 0.482757568359375, 0.61688232421875, 0.751007080078125, 0.8851318359375, 1.019256591796875, 1.15338134765625, 1.287506103515625, 1.421630859375, 1.555755615234375, 1.68988037109375, 1.824005126953125, 1.9581298828125, 2.092254638671875, 2.22637939453125, 2.360504150390625, 2.49462890625, 2.628753662109375, 2.76287841796875, 2.897003173828125, 3.0311279296875, 3.165252685546875, 3.29937744140625, 3.433502197265625, 3.567626953125, 3.701751708984375, 3.83587646484375, 3.970001220703125, 4.1041259765625, 4.238250732421875, 4.37237548828125, 4.506500244140625, 4.640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 2.0, 4.0, 12.0, 19.0, 33.0, 34.0, 77.0, 107.0, 195.0, 385.0, 727.0, 1527.0, 3769.0, 10591.0, 42710.0, 272366.0, 583087.0, 101689.0, 20491.0, 6094.0, 2402.0, 1039.0, 530.0, 269.0, 136.0, 99.0, 55.0, 30.0, 26.0, 17.0, 10.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.76953125, -5.59063720703125, -5.4117431640625, -5.23284912109375, -5.053955078125, -4.87506103515625, -4.6961669921875, -4.51727294921875, -4.33837890625, -4.15948486328125, -3.9805908203125, -3.80169677734375, -3.622802734375, -3.44390869140625, -3.2650146484375, -3.08612060546875, -2.9072265625, -2.72833251953125, -2.5494384765625, -2.37054443359375, -2.191650390625, -2.01275634765625, -1.8338623046875, -1.65496826171875, -1.47607421875, -1.29718017578125, -1.1182861328125, -0.93939208984375, -0.760498046875, -0.58160400390625, -0.4027099609375, -0.22381591796875, -0.044921875, 0.13397216796875, 0.3128662109375, 0.49176025390625, 0.670654296875, 0.84954833984375, 1.0284423828125, 1.20733642578125, 1.38623046875, 1.56512451171875, 1.7440185546875, 1.92291259765625, 2.101806640625, 2.28070068359375, 2.4595947265625, 2.63848876953125, 2.8173828125, 2.99627685546875, 3.1751708984375, 3.35406494140625, 3.532958984375, 3.71185302734375, 3.8907470703125, 4.06964111328125, 4.24853515625, 4.42742919921875, 4.6063232421875, 4.78521728515625, 4.964111328125, 5.14300537109375, 5.3218994140625, 5.50079345703125, 5.6796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 9.0, 20.0, 26.0, 33.0, 32.0, 66.0, 89.0, 97.0, 130.0, 109.0, 110.0, 66.0, 53.0, 38.0, 13.0, 18.0, 16.0, 6.0, 7.0, 4.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002789497375488281, -0.0002685077488422394, -0.00025806576013565063, -0.0002476237714290619, -0.00023718178272247314, -0.0002267397940158844, -0.00021629780530929565, -0.0002058558166027069, -0.00019541382789611816, -0.00018497183918952942, -0.00017452985048294067, -0.00016408786177635193, -0.00015364587306976318, -0.00014320388436317444, -0.0001327618956565857, -0.00012231990694999695, -0.0001118779182434082, -0.00010143592953681946, -9.099394083023071e-05, -8.055195212364197e-05, -7.010996341705322e-05, -5.966797471046448e-05, -4.922598600387573e-05, -3.878399729728699e-05, -2.8342008590698242e-05, -1.7900019884109497e-05, -7.458031177520752e-06, 2.983957529067993e-06, 1.3425946235656738e-05, 2.3867934942245483e-05, 3.430992364883423e-05, 4.4751912355422974e-05, 5.519390106201172e-05, 6.563588976860046e-05, 7.607787847518921e-05, 8.651986718177795e-05, 9.69618558883667e-05, 0.00010740384459495544, 0.00011784583330154419, 0.00012828782200813293, 0.00013872981071472168, 0.00014917179942131042, 0.00015961378812789917, 0.00017005577683448792, 0.00018049776554107666, 0.0001909397542476654, 0.00020138174295425415, 0.0002118237316608429, 0.00022226572036743164, 0.00023270770907402039, 0.00024314969778060913, 0.0002535916864871979, 0.0002640336751937866, 0.00027447566390037537, 0.0002849176526069641, 0.00029535964131355286, 0.0003058016300201416, 0.00031624361872673035, 0.0003266856074333191, 0.00033712759613990784, 0.0003475695848464966, 0.00035801157355308533, 0.00036845356225967407, 0.0003788955509662628, 0.00038933753967285156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 12.0, 7.0, 8.0, 17.0, 23.0, 42.0, 52.0, 86.0, 158.0, 262.0, 469.0, 868.0, 1783.0, 4409.0, 11566.0, 40547.0, 195024.0, 563822.0, 174199.0, 36377.0, 10949.0, 4114.0, 1784.0, 853.0, 456.0, 234.0, 131.0, 88.0, 59.0, 49.0, 29.0, 9.0, 16.0, 8.0, 9.0, 2.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.61328125, -5.450439453125, -5.28759765625, -5.124755859375, -4.9619140625, -4.799072265625, -4.63623046875, -4.473388671875, -4.310546875, -4.147705078125, -3.98486328125, -3.822021484375, -3.6591796875, -3.496337890625, -3.33349609375, -3.170654296875, -3.0078125, -2.844970703125, -2.68212890625, -2.519287109375, -2.3564453125, -2.193603515625, -2.03076171875, -1.867919921875, -1.705078125, -1.542236328125, -1.37939453125, -1.216552734375, -1.0537109375, -0.890869140625, -0.72802734375, -0.565185546875, -0.40234375, -0.239501953125, -0.07666015625, 0.086181640625, 0.2490234375, 0.411865234375, 0.57470703125, 0.737548828125, 0.900390625, 1.063232421875, 1.22607421875, 1.388916015625, 1.5517578125, 1.714599609375, 1.87744140625, 2.040283203125, 2.203125, 2.365966796875, 2.52880859375, 2.691650390625, 2.8544921875, 3.017333984375, 3.18017578125, 3.343017578125, 3.505859375, 3.668701171875, 3.83154296875, 3.994384765625, 4.1572265625, 4.320068359375, 4.48291015625, 4.645751953125, 4.80859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 12.0, 14.0, 10.0, 20.0, 17.0, 28.0, 28.0, 33.0, 47.0, 51.0, 68.0, 78.0, 84.0, 70.0, 74.0, 68.0, 48.0, 50.0, 40.0, 47.0, 17.0, 23.0, 13.0, 13.0, 4.0, 5.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.29840087890625, -2.2139892578125, -2.12957763671875, -2.045166015625, -1.96075439453125, -1.8763427734375, -1.79193115234375, -1.70751953125, -1.62310791015625, -1.5386962890625, -1.45428466796875, -1.369873046875, -1.28546142578125, -1.2010498046875, -1.11663818359375, -1.0322265625, -0.94781494140625, -0.8634033203125, -0.77899169921875, -0.694580078125, -0.61016845703125, -0.5257568359375, -0.44134521484375, -0.35693359375, -0.27252197265625, -0.1881103515625, -0.10369873046875, -0.019287109375, 0.06512451171875, 0.1495361328125, 0.23394775390625, 0.318359375, 0.40277099609375, 0.4871826171875, 0.57159423828125, 0.656005859375, 0.74041748046875, 0.8248291015625, 0.90924072265625, 0.99365234375, 1.07806396484375, 1.1624755859375, 1.24688720703125, 1.331298828125, 1.41571044921875, 1.5001220703125, 1.58453369140625, 1.6689453125, 1.75335693359375, 1.8377685546875, 1.92218017578125, 2.006591796875, 2.09100341796875, 2.1754150390625, 2.25982666015625, 2.34423828125, 2.42864990234375, 2.5130615234375, 2.59747314453125, 2.681884765625, 2.76629638671875, 2.8507080078125, 2.93511962890625, 3.01953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 17.0, 36.0, 325.0, 500.0, 105.0, 16.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.83599853515625, -166.70291137695312, -163.56983947753906, -160.43675231933594, -157.3036651611328, -154.17059326171875, -151.03750610351562, -147.9044189453125, -144.77133178710938, -141.63824462890625, -138.5051727294922, -135.37208557128906, -132.23899841308594, -129.10592651367188, -125.97283935546875, -122.83975219726562, -119.70668029785156, -116.57360076904297, -113.44051361083984, -110.30743408203125, -107.17434692382812, -104.04126739501953, -100.90818786621094, -97.77510070800781, -94.64201354980469, -91.5089340209961, -88.37584686279297, -85.24276733398438, -82.10968017578125, -78.97660064697266, -75.84352111816406, -72.71043395996094, -69.57735443115234, -66.44427490234375, -63.311187744140625, -60.17810821533203, -57.04502487182617, -53.91194152832031, -50.77885818481445, -47.645774841308594, -44.5126953125, -41.37961196899414, -38.24652862548828, -35.11344909667969, -31.980365753173828, -28.84728240966797, -25.71419906616211, -22.581117630004883, -19.448034286499023, -16.314950942993164, -13.181869506835938, -10.048786163330078, -6.915703773498535, -3.782621383666992, -0.6495380401611328, 2.4835433959960938, 5.616626739501953, 8.749709129333496, 11.882791519165039, 15.015874862670898, 18.148956298828125, 21.282039642333984, 24.415122985839844, 27.54820442199707, 30.68128776550293]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 12.0, 11.0, 25.0, 35.0, 38.0, 47.0, 56.0, 63.0, 85.0, 81.0, 92.0, 71.0, 58.0, 78.0, 51.0, 47.0, 35.0, 23.0, 16.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.666648864746094, -30.57804298400879, -29.489437103271484, -28.40083122253418, -27.312225341796875, -26.22361946105957, -25.135013580322266, -24.046405792236328, -22.957801818847656, -21.86919593811035, -20.780590057373047, -19.691984176635742, -18.603378295898438, -17.514772415161133, -16.426166534423828, -15.337559700012207, -14.248952865600586, -13.160346984863281, -12.071741104125977, -10.983135223388672, -9.894529342651367, -8.805923461914062, -7.717316627502441, -6.628710746765137, -5.540104866027832, -4.451498985290527, -3.3628928661346436, -2.2742867469787598, -1.185680866241455, -0.09707498550415039, 0.9915313720703125, 2.080137252807617, 3.168743133544922, 4.257349014282227, 5.345954895019531, 6.434561252593994, 7.523167133331299, 8.611772537231445, 9.700379371643066, 10.788985252380371, 11.877591133117676, 12.96619701385498, 14.054802894592285, 15.143409729003906, 16.23201560974121, 17.320621490478516, 18.40922737121582, 19.497833251953125, 20.58643913269043, 21.675045013427734, 22.76365089416504, 23.852256774902344, 24.94086265563965, 26.029468536376953, 27.11807632446289, 28.206680297851562, 29.2952880859375, 30.383893966674805, 31.47249984741211, 32.56110763549805, 33.64971160888672, 34.738319396972656, 35.82692337036133, 36.915531158447266, 38.00413513183594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 0.0, 4.0, 11.0, 6.0, 13.0, 9.0, 18.0, 16.0, 19.0, 26.0, 31.0, 30.0, 38.0, 45.0, 67.0, 94.0, 143.0, 203.0, 316.0, 474.0, 722.0, 1173.0, 2094.0, 4027.0, 9363.0, 31102.0, 489314.0, 3587874.0, 45418.0, 11666.0, 4644.0, 2206.0, 1163.0, 678.0, 407.0, 269.0, 158.0, 136.0, 81.0, 54.0, 45.0, 30.0, 29.0, 22.0, 11.0, 11.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-17.109375, -16.6353759765625, -16.161376953125, -15.6873779296875, -15.21337890625, -14.7393798828125, -14.265380859375, -13.7913818359375, -13.3173828125, -12.8433837890625, -12.369384765625, -11.8953857421875, -11.42138671875, -10.9473876953125, -10.473388671875, -9.9993896484375, -9.525390625, -9.0513916015625, -8.577392578125, -8.1033935546875, -7.62939453125, -7.1553955078125, -6.681396484375, -6.2073974609375, -5.7333984375, -5.2593994140625, -4.785400390625, -4.3114013671875, -3.83740234375, -3.3634033203125, -2.889404296875, -2.4154052734375, -1.94140625, -1.4674072265625, -0.993408203125, -0.5194091796875, -0.04541015625, 0.4285888671875, 0.902587890625, 1.3765869140625, 1.8505859375, 2.3245849609375, 2.798583984375, 3.2725830078125, 3.74658203125, 4.2205810546875, 4.694580078125, 5.1685791015625, 5.642578125, 6.1165771484375, 6.590576171875, 7.0645751953125, 7.53857421875, 8.0125732421875, 8.486572265625, 8.9605712890625, 9.4345703125, 9.9085693359375, 10.382568359375, 10.8565673828125, 11.33056640625, 11.8045654296875, 12.278564453125, 12.7525634765625, 13.2265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 9.0, 20.0, 40.0, 76.0, 138.0, 199.0, 219.0, 125.0, 56.0, 26.0, 19.0, 14.0, 14.0, 7.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3225021362304688, -1.2866058349609375, -1.2507095336914062, -1.214813232421875, -1.1789169311523438, -1.1430206298828125, -1.1071243286132812, -1.07122802734375, -1.0353317260742188, -0.9994354248046875, -0.9635391235351562, -0.927642822265625, -0.8917465209960938, -0.8558502197265625, -0.8199539184570312, -0.7840576171875, -0.7481613159179688, -0.7122650146484375, -0.6763687133789062, -0.640472412109375, -0.6045761108398438, -0.5686798095703125, -0.5327835083007812, -0.49688720703125, -0.46099090576171875, -0.4250946044921875, -0.38919830322265625, -0.353302001953125, -0.31740570068359375, -0.2815093994140625, -0.24561309814453125, -0.209716796875, -0.17382049560546875, -0.1379241943359375, -0.10202789306640625, -0.066131591796875, -0.03023529052734375, 0.0056610107421875, 0.04155731201171875, 0.07745361328125, 0.11334991455078125, 0.1492462158203125, 0.18514251708984375, 0.221038818359375, 0.25693511962890625, 0.2928314208984375, 0.32872772216796875, 0.3646240234375, 0.40052032470703125, 0.4364166259765625, 0.47231292724609375, 0.508209228515625, 0.5441055297851562, 0.5800018310546875, 0.6158981323242188, 0.65179443359375, 0.6876907348632812, 0.7235870361328125, 0.7594833374023438, 0.795379638671875, 0.8312759399414062, 0.8671722412109375, 0.9030685424804688, 0.93896484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 16.0, 34.0, 34.0, 42.0, 97.0, 183.0, 412.0, 810.0, 2034.0, 5979.0, 21926.0, 148376.0, 3757681.0, 218283.0, 27330.0, 6894.0, 2325.0, 883.0, 396.0, 202.0, 96.0, 68.0, 46.0, 16.0, 11.0, 18.0, 8.0, 10.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-14.34375, -13.87451171875, -13.4052734375, -12.93603515625, -12.466796875, -11.99755859375, -11.5283203125, -11.05908203125, -10.58984375, -10.12060546875, -9.6513671875, -9.18212890625, -8.712890625, -8.24365234375, -7.7744140625, -7.30517578125, -6.8359375, -6.36669921875, -5.8974609375, -5.42822265625, -4.958984375, -4.48974609375, -4.0205078125, -3.55126953125, -3.08203125, -2.61279296875, -2.1435546875, -1.67431640625, -1.205078125, -0.73583984375, -0.2666015625, 0.20263671875, 0.671875, 1.14111328125, 1.6103515625, 2.07958984375, 2.548828125, 3.01806640625, 3.4873046875, 3.95654296875, 4.42578125, 4.89501953125, 5.3642578125, 5.83349609375, 6.302734375, 6.77197265625, 7.2412109375, 7.71044921875, 8.1796875, 8.64892578125, 9.1181640625, 9.58740234375, 10.056640625, 10.52587890625, 10.9951171875, 11.46435546875, 11.93359375, 12.40283203125, 12.8720703125, 13.34130859375, 13.810546875, 14.27978515625, 14.7490234375, 15.21826171875, 15.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 8.0, 10.0, 17.0, 18.0, 38.0, 59.0, 89.0, 128.0, 228.0, 501.0, 1676.0, 510.0, 268.0, 137.0, 99.0, 70.0, 34.0, 32.0, 20.0, 16.0, 10.0, 10.0, 11.0, 8.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.595703125, -1.5519561767578125, -1.508209228515625, -1.4644622802734375, -1.42071533203125, -1.3769683837890625, -1.333221435546875, -1.2894744873046875, -1.2457275390625, -1.2019805908203125, -1.158233642578125, -1.1144866943359375, -1.07073974609375, -1.0269927978515625, -0.983245849609375, -0.9394989013671875, -0.895751953125, -0.8520050048828125, -0.808258056640625, -0.7645111083984375, -0.72076416015625, -0.6770172119140625, -0.633270263671875, -0.5895233154296875, -0.5457763671875, -0.5020294189453125, -0.458282470703125, -0.4145355224609375, -0.37078857421875, -0.3270416259765625, -0.283294677734375, -0.2395477294921875, -0.19580078125, -0.1520538330078125, -0.108306884765625, -0.0645599365234375, -0.02081298828125, 0.0229339599609375, 0.066680908203125, 0.1104278564453125, 0.1541748046875, 0.1979217529296875, 0.241668701171875, 0.2854156494140625, 0.32916259765625, 0.3729095458984375, 0.416656494140625, 0.4604034423828125, 0.504150390625, 0.5478973388671875, 0.591644287109375, 0.6353912353515625, 0.67913818359375, 0.7228851318359375, 0.766632080078125, 0.8103790283203125, 0.8541259765625, 0.8978729248046875, 0.941619873046875, 0.9853668212890625, 1.02911376953125, 1.0728607177734375, 1.116607666015625, 1.1603546142578125, 1.2041015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 14.0, 19.0, 40.0, 63.0, 126.0, 161.0, 202.0, 152.0, 92.0, 55.0, 32.0, 15.0, 10.0, 9.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.792753219604492, -14.404183387756348, -14.015613555908203, -13.627042770385742, -13.238472938537598, -12.849903106689453, -12.461333274841309, -12.072763442993164, -11.684192657470703, -11.295622825622559, -10.907052993774414, -10.518482208251953, -10.129912376403809, -9.741342544555664, -9.35277271270752, -8.964202880859375, -8.57563304901123, -8.187063217163086, -7.798492908477783, -7.409923076629639, -7.021352767944336, -6.632782936096191, -6.244213104248047, -5.855643272399902, -5.4670729637146, -5.078503131866455, -4.689932823181152, -4.301362991333008, -3.912792921066284, -3.5242228507995605, -3.135653018951416, -2.7470829486846924, -2.358513832092285, -1.9699437618255615, -1.5813738107681274, -1.1928038597106934, -0.8042337894439697, -0.4156637191772461, -0.027093887329101562, 0.36147618293762207, 0.7500462532043457, 1.1386163234710693, 1.5271862745285034, 1.9157562255859375, 2.304326295852661, 2.6928963661193848, 3.0814661979675293, 3.470036268234253, 3.8586063385009766, 4.247176170349121, 4.635746479034424, 5.024316310882568, 5.412886619567871, 5.801456451416016, 6.19002628326416, 6.578596115112305, 6.967166423797607, 7.355736255645752, 7.744306564331055, 8.1328763961792, 8.521446228027344, 8.910017013549805, 9.298585891723633, 9.687156677246094, 10.075726509094238]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 12.0, 9.0, 25.0, 24.0, 32.0, 35.0, 43.0, 48.0, 57.0, 49.0, 52.0, 60.0, 65.0, 63.0, 66.0, 66.0, 47.0, 41.0, 38.0, 32.0, 19.0, 23.0, 22.0, 16.0, 15.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.277908325195312, -8.062480926513672, -7.847053527832031, -7.631626129150391, -7.416199207305908, -7.200771808624268, -6.985344409942627, -6.769917011260986, -6.554490089416504, -6.339062690734863, -6.123635292053223, -5.908207893371582, -5.6927809715271, -5.477353572845459, -5.261926174163818, -5.046498775482178, -4.831071376800537, -4.6156439781188965, -4.400216579437256, -4.184789657592773, -3.969362258911133, -3.753934860229492, -3.5385074615478516, -3.323080062866211, -3.1076529026031494, -2.892225503921509, -2.6767983436584473, -2.4613709449768066, -2.245943546295166, -2.0305163860321045, -1.8150889873504639, -1.5996617078781128, -1.3842339515686035, -1.1688066720962524, -0.9533793330192566, -0.7379519939422607, -0.5225247144699097, -0.3070974349975586, -0.09167003631591797, 0.1237572431564331, 0.3391845226287842, 0.5546118021011353, 0.7700391411781311, 0.985466480255127, 1.200893759727478, 1.416321039199829, 1.6317484378814697, 1.8471757173538208, 2.062602996826172, 2.2780303955078125, 2.493457555770874, 2.7088849544525146, 2.924312114715576, 3.139739513397217, 3.3551669120788574, 3.570594310760498, 3.7860214710235596, 4.001448631286621, 4.216876029968262, 4.432303428649902, 4.647730827331543, 4.863158226013184, 5.078585624694824, 5.294012546539307, 5.509439945220947]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 5.0, 5.0, 9.0, 11.0, 26.0, 17.0, 33.0, 54.0, 68.0, 98.0, 130.0, 180.0, 247.0, 396.0, 626.0, 1033.0, 1729.0, 3397.0, 7715.0, 22325.0, 104477.0, 647832.0, 203899.0, 34006.0, 10396.0, 4371.0, 2132.0, 1187.0, 677.0, 454.0, 274.0, 225.0, 152.0, 89.0, 70.0, 53.0, 39.0, 23.0, 21.0, 16.0, 14.0, 5.0, 9.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-9.296875, -9.01220703125, -8.7275390625, -8.44287109375, -8.158203125, -7.87353515625, -7.5888671875, -7.30419921875, -7.01953125, -6.73486328125, -6.4501953125, -6.16552734375, -5.880859375, -5.59619140625, -5.3115234375, -5.02685546875, -4.7421875, -4.45751953125, -4.1728515625, -3.88818359375, -3.603515625, -3.31884765625, -3.0341796875, -2.74951171875, -2.46484375, -2.18017578125, -1.8955078125, -1.61083984375, -1.326171875, -1.04150390625, -0.7568359375, -0.47216796875, -0.1875, 0.09716796875, 0.3818359375, 0.66650390625, 0.951171875, 1.23583984375, 1.5205078125, 1.80517578125, 2.08984375, 2.37451171875, 2.6591796875, 2.94384765625, 3.228515625, 3.51318359375, 3.7978515625, 4.08251953125, 4.3671875, 4.65185546875, 4.9365234375, 5.22119140625, 5.505859375, 5.79052734375, 6.0751953125, 6.35986328125, 6.64453125, 6.92919921875, 7.2138671875, 7.49853515625, 7.783203125, 8.06787109375, 8.3525390625, 8.63720703125, 8.921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 15.0, 22.0, 45.0, 72.0, 134.0, 166.0, 200.0, 137.0, 76.0, 52.0, 27.0, 17.0, 12.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.310394287109375, -1.27410888671875, -1.237823486328125, -1.2015380859375, -1.165252685546875, -1.12896728515625, -1.092681884765625, -1.056396484375, -1.020111083984375, -0.98382568359375, -0.947540283203125, -0.9112548828125, -0.874969482421875, -0.83868408203125, -0.802398681640625, -0.76611328125, -0.729827880859375, -0.69354248046875, -0.657257080078125, -0.6209716796875, -0.584686279296875, -0.54840087890625, -0.512115478515625, -0.475830078125, -0.439544677734375, -0.40325927734375, -0.366973876953125, -0.3306884765625, -0.294403076171875, -0.25811767578125, -0.221832275390625, -0.185546875, -0.149261474609375, -0.11297607421875, -0.076690673828125, -0.0404052734375, -0.004119873046875, 0.03216552734375, 0.068450927734375, 0.104736328125, 0.141021728515625, 0.17730712890625, 0.213592529296875, 0.2498779296875, 0.286163330078125, 0.32244873046875, 0.358734130859375, 0.39501953125, 0.431304931640625, 0.46759033203125, 0.503875732421875, 0.5401611328125, 0.576446533203125, 0.61273193359375, 0.649017333984375, 0.685302734375, 0.721588134765625, 0.75787353515625, 0.794158935546875, 0.8304443359375, 0.866729736328125, 0.90301513671875, 0.939300537109375, 0.9755859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 12.0, 9.0, 22.0, 18.0, 27.0, 36.0, 52.0, 52.0, 72.0, 125.0, 152.0, 241.0, 312.0, 565.0, 956.0, 1928.0, 3796.0, 9406.0, 28042.0, 113378.0, 491614.0, 305284.0, 62064.0, 17507.0, 6447.0, 2792.0, 1465.0, 743.0, 464.0, 284.0, 189.0, 144.0, 95.0, 62.0, 61.0, 37.0, 31.0, 17.0, 11.0, 14.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-9.0078125, -8.7413330078125, -8.474853515625, -8.2083740234375, -7.94189453125, -7.6754150390625, -7.408935546875, -7.1424560546875, -6.8759765625, -6.6094970703125, -6.343017578125, -6.0765380859375, -5.81005859375, -5.5435791015625, -5.277099609375, -5.0106201171875, -4.744140625, -4.4776611328125, -4.211181640625, -3.9447021484375, -3.67822265625, -3.4117431640625, -3.145263671875, -2.8787841796875, -2.6123046875, -2.3458251953125, -2.079345703125, -1.8128662109375, -1.54638671875, -1.2799072265625, -1.013427734375, -0.7469482421875, -0.48046875, -0.2139892578125, 0.052490234375, 0.3189697265625, 0.58544921875, 0.8519287109375, 1.118408203125, 1.3848876953125, 1.6513671875, 1.9178466796875, 2.184326171875, 2.4508056640625, 2.71728515625, 2.9837646484375, 3.250244140625, 3.5167236328125, 3.783203125, 4.0496826171875, 4.316162109375, 4.5826416015625, 4.84912109375, 5.1156005859375, 5.382080078125, 5.6485595703125, 5.9150390625, 6.1815185546875, 6.447998046875, 6.7144775390625, 6.98095703125, 7.2474365234375, 7.513916015625, 7.7803955078125, 8.046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 9.0, 11.0, 10.0, 9.0, 15.0, 20.0, 18.0, 26.0, 36.0, 33.0, 42.0, 42.0, 36.0, 44.0, 36.0, 53.0, 67.0, 58.0, 72.0, 51.0, 50.0, 31.0, 35.0, 28.0, 38.0, 30.0, 16.0, 16.0, 14.0, 20.0, 12.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.515350341796875, -3.39593505859375, -3.276519775390625, -3.1571044921875, -3.037689208984375, -2.91827392578125, -2.798858642578125, -2.679443359375, -2.560028076171875, -2.44061279296875, -2.321197509765625, -2.2017822265625, -2.082366943359375, -1.96295166015625, -1.843536376953125, -1.72412109375, -1.604705810546875, -1.48529052734375, -1.365875244140625, -1.2464599609375, -1.127044677734375, -1.00762939453125, -0.888214111328125, -0.768798828125, -0.649383544921875, -0.52996826171875, -0.410552978515625, -0.2911376953125, -0.171722412109375, -0.05230712890625, 0.067108154296875, 0.1865234375, 0.305938720703125, 0.42535400390625, 0.544769287109375, 0.6641845703125, 0.783599853515625, 0.90301513671875, 1.022430419921875, 1.141845703125, 1.261260986328125, 1.38067626953125, 1.500091552734375, 1.6195068359375, 1.738922119140625, 1.85833740234375, 1.977752685546875, 2.09716796875, 2.216583251953125, 2.33599853515625, 2.455413818359375, 2.5748291015625, 2.694244384765625, 2.81365966796875, 2.933074951171875, 3.052490234375, 3.171905517578125, 3.29132080078125, 3.410736083984375, 3.5301513671875, 3.649566650390625, 3.76898193359375, 3.888397216796875, 4.0078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 8.0, 13.0, 21.0, 23.0, 25.0, 25.0, 55.0, 66.0, 93.0, 184.0, 251.0, 417.0, 756.0, 1392.0, 2643.0, 5254.0, 12061.0, 30314.0, 89660.0, 298200.0, 398890.0, 134160.0, 43619.0, 16192.0, 6952.0, 3209.0, 1652.0, 911.0, 569.0, 336.0, 209.0, 122.0, 76.0, 67.0, 26.0, 26.0, 28.0, 11.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.95513916015625, -3.8282470703125, -3.70135498046875, -3.574462890625, -3.44757080078125, -3.3206787109375, -3.19378662109375, -3.06689453125, -2.94000244140625, -2.8131103515625, -2.68621826171875, -2.559326171875, -2.43243408203125, -2.3055419921875, -2.17864990234375, -2.0517578125, -1.92486572265625, -1.7979736328125, -1.67108154296875, -1.544189453125, -1.41729736328125, -1.2904052734375, -1.16351318359375, -1.03662109375, -0.90972900390625, -0.7828369140625, -0.65594482421875, -0.529052734375, -0.40216064453125, -0.2752685546875, -0.14837646484375, -0.021484375, 0.10540771484375, 0.2322998046875, 0.35919189453125, 0.486083984375, 0.61297607421875, 0.7398681640625, 0.86676025390625, 0.99365234375, 1.12054443359375, 1.2474365234375, 1.37432861328125, 1.501220703125, 1.62811279296875, 1.7550048828125, 1.88189697265625, 2.0087890625, 2.13568115234375, 2.2625732421875, 2.38946533203125, 2.516357421875, 2.64324951171875, 2.7701416015625, 2.89703369140625, 3.02392578125, 3.15081787109375, 3.2777099609375, 3.40460205078125, 3.531494140625, 3.65838623046875, 3.7852783203125, 3.91217041015625, 4.0390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 6.0, 9.0, 8.0, 13.0, 13.0, 22.0, 26.0, 32.0, 50.0, 82.0, 93.0, 98.0, 114.0, 90.0, 83.0, 71.0, 47.0, 28.0, 28.0, 17.0, 11.0, 8.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007767677307128906, -0.0007540881633758545, -0.0007314085960388184, -0.0007087290287017822, -0.0006860494613647461, -0.00066336989402771, -0.0006406903266906738, -0.0006180107593536377, -0.0005953311920166016, -0.0005726516246795654, -0.0005499720573425293, -0.0005272924900054932, -0.000504612922668457, -0.0004819333553314209, -0.00045925378799438477, -0.00043657422065734863, -0.0004138946533203125, -0.00039121508598327637, -0.00036853551864624023, -0.0003458559513092041, -0.00032317638397216797, -0.00030049681663513184, -0.0002778172492980957, -0.00025513768196105957, -0.00023245811462402344, -0.0002097785472869873, -0.00018709897994995117, -0.00016441941261291504, -0.0001417398452758789, -0.00011906027793884277, -9.638071060180664e-05, -7.370114326477051e-05, -5.1021575927734375e-05, -2.8342008590698242e-05, -5.662441253662109e-06, 1.7017126083374023e-05, 3.9696693420410156e-05, 6.237626075744629e-05, 8.505582809448242e-05, 0.00010773539543151855, 0.0001304149627685547, 0.00015309453010559082, 0.00017577409744262695, 0.00019845366477966309, 0.00022113323211669922, 0.00024381279945373535, 0.0002664923667907715, 0.0002891719341278076, 0.00031185150146484375, 0.0003345310688018799, 0.000357210636138916, 0.00037989020347595215, 0.0004025697708129883, 0.0004252493381500244, 0.00044792890548706055, 0.0004706084728240967, 0.0004932880401611328, 0.0005159676074981689, 0.0005386471748352051, 0.0005613267421722412, 0.0005840063095092773, 0.0006066858768463135, 0.0006293654441833496, 0.0006520450115203857, 0.0006747245788574219]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 13.0, 16.0, 29.0, 39.0, 39.0, 49.0, 104.0, 144.0, 258.0, 390.0, 644.0, 1154.0, 2246.0, 4887.0, 11629.0, 36183.0, 153370.0, 550359.0, 213792.0, 46761.0, 14639.0, 5868.0, 2639.0, 1350.0, 730.0, 399.0, 263.0, 165.0, 115.0, 64.0, 49.0, 33.0, 23.0, 9.0, 18.0, 10.0, 3.0, 9.0, 5.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.26171875, -5.09521484375, -4.9287109375, -4.76220703125, -4.595703125, -4.42919921875, -4.2626953125, -4.09619140625, -3.9296875, -3.76318359375, -3.5966796875, -3.43017578125, -3.263671875, -3.09716796875, -2.9306640625, -2.76416015625, -2.59765625, -2.43115234375, -2.2646484375, -2.09814453125, -1.931640625, -1.76513671875, -1.5986328125, -1.43212890625, -1.265625, -1.09912109375, -0.9326171875, -0.76611328125, -0.599609375, -0.43310546875, -0.2666015625, -0.10009765625, 0.06640625, 0.23291015625, 0.3994140625, 0.56591796875, 0.732421875, 0.89892578125, 1.0654296875, 1.23193359375, 1.3984375, 1.56494140625, 1.7314453125, 1.89794921875, 2.064453125, 2.23095703125, 2.3974609375, 2.56396484375, 2.73046875, 2.89697265625, 3.0634765625, 3.22998046875, 3.396484375, 3.56298828125, 3.7294921875, 3.89599609375, 4.0625, 4.22900390625, 4.3955078125, 4.56201171875, 4.728515625, 4.89501953125, 5.0615234375, 5.22802734375, 5.39453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 11.0, 19.0, 20.0, 22.0, 38.0, 34.0, 53.0, 52.0, 60.0, 68.0, 80.0, 76.0, 70.0, 70.0, 58.0, 51.0, 36.0, 30.0, 22.0, 19.0, 13.0, 14.0, 13.0, 4.0, 9.0, 10.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.498046875, -2.4229736328125, -2.347900390625, -2.2728271484375, -2.19775390625, -2.1226806640625, -2.047607421875, -1.9725341796875, -1.8974609375, -1.8223876953125, -1.747314453125, -1.6722412109375, -1.59716796875, -1.5220947265625, -1.447021484375, -1.3719482421875, -1.296875, -1.2218017578125, -1.146728515625, -1.0716552734375, -0.99658203125, -0.9215087890625, -0.846435546875, -0.7713623046875, -0.6962890625, -0.6212158203125, -0.546142578125, -0.4710693359375, -0.39599609375, -0.3209228515625, -0.245849609375, -0.1707763671875, -0.095703125, -0.0206298828125, 0.054443359375, 0.1295166015625, 0.20458984375, 0.2796630859375, 0.354736328125, 0.4298095703125, 0.5048828125, 0.5799560546875, 0.655029296875, 0.7301025390625, 0.80517578125, 0.8802490234375, 0.955322265625, 1.0303955078125, 1.10546875, 1.1805419921875, 1.255615234375, 1.3306884765625, 1.40576171875, 1.4808349609375, 1.555908203125, 1.6309814453125, 1.7060546875, 1.7811279296875, 1.856201171875, 1.9312744140625, 2.00634765625, 2.0814208984375, 2.156494140625, 2.2315673828125, 2.306640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 15.0, 55.0, 221.0, 386.0, 231.0, 63.0, 16.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.46278381347656, -139.41738891601562, -135.37200927734375, -131.3266143798828, -127.28123474121094, -123.23583984375, -119.1904525756836, -115.14506530761719, -111.09967803955078, -107.05429077148438, -103.00890350341797, -98.96351623535156, -94.91812133789062, -90.87274169921875, -86.82734680175781, -82.7819595336914, -78.736572265625, -74.6911849975586, -70.64579772949219, -66.60041046142578, -62.55501937866211, -58.5096321105957, -54.46424102783203, -50.418853759765625, -46.37346649169922, -42.32807922363281, -38.282691955566406, -34.237300872802734, -30.191913604736328, -26.146526336669922, -22.101137161254883, -18.055747985839844, -14.010353088378906, -9.964964866638184, -5.919576644897461, -1.8741884231567383, 2.1711997985839844, 6.216587066650391, 10.26197624206543, 14.307365417480469, 18.352752685546875, 22.39813995361328, 26.44352912902832, 30.48891830444336, 34.534305572509766, 38.57969284057617, 42.625083923339844, 46.67047119140625, 50.715858459472656, 54.76124572753906, 58.80663299560547, 62.85202407836914, 66.89741516113281, 70.94279479980469, 74.98818969726562, 79.03357696533203, 83.07896423339844, 87.12435150146484, 91.16973876953125, 95.21512603759766, 99.26051330566406, 103.305908203125, 107.3512954711914, 111.39668273925781, 115.44207000732422]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 12.0, 9.0, 20.0, 29.0, 20.0, 36.0, 38.0, 51.0, 47.0, 58.0, 75.0, 65.0, 67.0, 65.0, 61.0, 61.0, 61.0, 61.0, 32.0, 36.0, 20.0, 22.0, 14.0, 6.0, 5.0, 4.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.85041809082031, -40.723182678222656, -39.595951080322266, -38.46871566772461, -37.34148406982422, -36.21424865722656, -35.08701705932617, -33.959781646728516, -32.832550048828125, -31.7053165435791, -30.578083038330078, -29.450849533081055, -28.32361602783203, -27.196380615234375, -26.06914710998535, -24.941913604736328, -23.814678192138672, -22.68744468688965, -21.560211181640625, -20.4329776763916, -19.305744171142578, -18.178508758544922, -17.0512752532959, -15.924041748046875, -14.796808242797852, -13.669574737548828, -12.542341232299805, -11.415106773376465, -10.287873268127441, -9.160639762878418, -8.033405303955078, -6.906171798706055, -5.778934478759766, -4.651700973510742, -3.5244669914245605, -2.397233247756958, -1.2699995040893555, -0.14276599884033203, 0.9844679832458496, 2.1117019653320312, 3.2389354705810547, 4.366168975830078, 5.49340295791626, 6.620636940002441, 7.747870445251465, 8.875103950500488, 10.002338409423828, 11.129571914672852, 12.256805419921875, 13.384038925170898, 14.511272430419922, 15.638506889343262, 16.76573944091797, 17.892974853515625, 19.02020835876465, 20.147441864013672, 21.274675369262695, 22.40190887451172, 23.529142379760742, 24.656375885009766, 25.783611297607422, 26.910842895507812, 28.03807830810547, 29.165311813354492, 30.292545318603516]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 6.0, 14.0, 9.0, 16.0, 36.0, 51.0, 90.0, 191.0, 328.0, 712.0, 2380.0, 13634.0, 3698185.0, 466129.0, 9915.0, 1734.0, 475.0, 200.0, 83.0, 47.0, 22.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.28125, -42.169189453125, -41.05712890625, -39.945068359375, -38.8330078125, -37.720947265625, -36.60888671875, -35.496826171875, -34.384765625, -33.272705078125, -32.16064453125, -31.048583984375, -29.9365234375, -28.824462890625, -27.71240234375, -26.600341796875, -25.48828125, -24.376220703125, -23.26416015625, -22.152099609375, -21.0400390625, -19.927978515625, -18.81591796875, -17.703857421875, -16.591796875, -15.479736328125, -14.36767578125, -13.255615234375, -12.1435546875, -11.031494140625, -9.91943359375, -8.807373046875, -7.6953125, -6.583251953125, -5.47119140625, -4.359130859375, -3.2470703125, -2.135009765625, -1.02294921875, 0.089111328125, 1.201171875, 2.313232421875, 3.42529296875, 4.537353515625, 5.6494140625, 6.761474609375, 7.87353515625, 8.985595703125, 10.09765625, 11.209716796875, 12.32177734375, 13.433837890625, 14.5458984375, 15.657958984375, 16.77001953125, 17.882080078125, 18.994140625, 20.106201171875, 21.21826171875, 22.330322265625, 23.4423828125, 24.554443359375, 25.66650390625, 26.778564453125, 27.890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 8.0, 4.0, 6.0, 18.0, 27.0, 46.0, 89.0, 148.0, 180.0, 148.0, 114.0, 83.0, 57.0, 32.0, 11.0, 6.0, 11.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.736328125, -1.692779541015625, -1.64923095703125, -1.605682373046875, -1.5621337890625, -1.518585205078125, -1.47503662109375, -1.431488037109375, -1.387939453125, -1.344390869140625, -1.30084228515625, -1.257293701171875, -1.2137451171875, -1.170196533203125, -1.12664794921875, -1.083099365234375, -1.03955078125, -0.996002197265625, -0.95245361328125, -0.908905029296875, -0.8653564453125, -0.821807861328125, -0.77825927734375, -0.734710693359375, -0.691162109375, -0.647613525390625, -0.60406494140625, -0.560516357421875, -0.5169677734375, -0.473419189453125, -0.42987060546875, -0.386322021484375, -0.3427734375, -0.299224853515625, -0.25567626953125, -0.212127685546875, -0.1685791015625, -0.125030517578125, -0.08148193359375, -0.037933349609375, 0.005615234375, 0.049163818359375, 0.09271240234375, 0.136260986328125, 0.1798095703125, 0.223358154296875, 0.26690673828125, 0.310455322265625, 0.35400390625, 0.397552490234375, 0.44110107421875, 0.484649658203125, 0.5281982421875, 0.571746826171875, 0.61529541015625, 0.658843994140625, 0.702392578125, 0.745941162109375, 0.78948974609375, 0.833038330078125, 0.8765869140625, 0.920135498046875, 0.96368408203125, 1.007232666015625, 1.05078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 12.0, 13.0, 8.0, 28.0, 48.0, 59.0, 91.0, 160.0, 215.0, 407.0, 731.0, 1399.0, 2944.0, 7627.0, 29298.0, 208603.0, 3649902.0, 245126.0, 33148.0, 8385.0, 3047.0, 1364.0, 677.0, 390.0, 237.0, 113.0, 81.0, 53.0, 32.0, 22.0, 17.0, 13.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.625, -13.1787109375, -12.732421875, -12.2861328125, -11.83984375, -11.3935546875, -10.947265625, -10.5009765625, -10.0546875, -9.6083984375, -9.162109375, -8.7158203125, -8.26953125, -7.8232421875, -7.376953125, -6.9306640625, -6.484375, -6.0380859375, -5.591796875, -5.1455078125, -4.69921875, -4.2529296875, -3.806640625, -3.3603515625, -2.9140625, -2.4677734375, -2.021484375, -1.5751953125, -1.12890625, -0.6826171875, -0.236328125, 0.2099609375, 0.65625, 1.1025390625, 1.548828125, 1.9951171875, 2.44140625, 2.8876953125, 3.333984375, 3.7802734375, 4.2265625, 4.6728515625, 5.119140625, 5.5654296875, 6.01171875, 6.4580078125, 6.904296875, 7.3505859375, 7.796875, 8.2431640625, 8.689453125, 9.1357421875, 9.58203125, 10.0283203125, 10.474609375, 10.9208984375, 11.3671875, 11.8134765625, 12.259765625, 12.7060546875, 13.15234375, 13.5986328125, 14.044921875, 14.4912109375, 14.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 9.0, 9.0, 16.0, 31.0, 49.0, 66.0, 134.0, 214.0, 540.0, 1770.0, 662.0, 203.0, 107.0, 68.0, 46.0, 46.0, 27.0, 25.0, 13.0, 5.0, 2.0, 7.0, 2.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.955078125, -2.8719482421875, -2.788818359375, -2.7056884765625, -2.62255859375, -2.5394287109375, -2.456298828125, -2.3731689453125, -2.2900390625, -2.2069091796875, -2.123779296875, -2.0406494140625, -1.95751953125, -1.8743896484375, -1.791259765625, -1.7081298828125, -1.625, -1.5418701171875, -1.458740234375, -1.3756103515625, -1.29248046875, -1.2093505859375, -1.126220703125, -1.0430908203125, -0.9599609375, -0.8768310546875, -0.793701171875, -0.7105712890625, -0.62744140625, -0.5443115234375, -0.461181640625, -0.3780517578125, -0.294921875, -0.2117919921875, -0.128662109375, -0.0455322265625, 0.03759765625, 0.1207275390625, 0.203857421875, 0.2869873046875, 0.3701171875, 0.4532470703125, 0.536376953125, 0.6195068359375, 0.70263671875, 0.7857666015625, 0.868896484375, 0.9520263671875, 1.03515625, 1.1182861328125, 1.201416015625, 1.2845458984375, 1.36767578125, 1.4508056640625, 1.533935546875, 1.6170654296875, 1.7001953125, 1.7833251953125, 1.866455078125, 1.9495849609375, 2.03271484375, 2.1158447265625, 2.198974609375, 2.2821044921875, 2.365234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 15.0, 36.0, 70.0, 130.0, 201.0, 208.0, 168.0, 88.0, 39.0, 16.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.06146240234375, -26.35172462463379, -25.641986846923828, -24.932249069213867, -24.222511291503906, -23.512775421142578, -22.803035736083984, -22.093299865722656, -21.383562088012695, -20.673824310302734, -19.964086532592773, -19.254348754882812, -18.54461097717285, -17.83487319946289, -17.125137329101562, -16.4153995513916, -15.705660820007324, -14.995923042297363, -14.286185264587402, -13.576448440551758, -12.866710662841797, -12.156972885131836, -11.447235107421875, -10.737497329711914, -10.027759552001953, -9.318021774291992, -8.608283996582031, -7.8985466957092285, -7.188809394836426, -6.479071617126465, -5.769333839416504, -5.059596538543701, -4.349859237670898, -3.6401216983795166, -2.9303841590881348, -2.220646381378174, -1.510908842086792, -0.8011713027954102, -0.09143352508544922, 0.6183037757873535, 1.3280415534973145, 2.0377790927886963, 2.747516632080078, 3.457254409790039, 4.1669921875, 4.876729488372803, 5.586467266082764, 6.296204566955566, 7.005942344665527, 7.715680122375488, 8.42541790008545, 9.135154724121094, 9.844892501831055, 10.554630279541016, 11.264368057250977, 11.974105834960938, 12.683843612670898, 13.39358139038086, 14.10331916809082, 14.813056945800781, 15.522793769836426, 16.232532501220703, 16.94226837158203, 17.652006149291992, 18.361743927001953]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 9.0, 15.0, 12.0, 11.0, 15.0, 23.0, 16.0, 25.0, 29.0, 35.0, 39.0, 27.0, 41.0, 37.0, 39.0, 44.0, 48.0, 49.0, 50.0, 39.0, 36.0, 52.0, 34.0, 37.0, 27.0, 26.0, 27.0, 22.0, 27.0, 18.0, 14.0, 9.0, 7.0, 7.0, 7.0, 7.0, 7.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-8.621857643127441, -8.376824378967285, -8.131792068481445, -7.886758804321289, -7.641725540161133, -7.396692752838135, -7.151659965515137, -6.9066267013549805, -6.661593914031982, -6.416561126708984, -6.171527862548828, -5.92649507522583, -5.681462287902832, -5.436429023742676, -5.191396236419678, -4.94636344909668, -4.701330184936523, -4.456297397613525, -4.211264133453369, -3.966231346130371, -3.721198320388794, -3.476165294647217, -3.2311325073242188, -2.9860994815826416, -2.7410664558410645, -2.4960334300994873, -2.25100040435791, -2.005967617034912, -1.760934591293335, -1.5159015655517578, -1.2708686590194702, -1.0258357524871826, -0.7808027267456055, -0.5357697606086731, -0.2907367944717407, -0.04570382833480835, 0.19932913780212402, 0.44436216354370117, 0.6893950700759888, 0.9344279766082764, 1.1794610023498535, 1.4244940280914307, 1.6695269346237183, 1.9145598411560059, 2.159592866897583, 2.40462589263916, 2.649658679962158, 2.8946917057037354, 3.1397247314453125, 3.3847577571868896, 3.629790782928467, 3.874823570251465, 4.119856834411621, 4.364889621734619, 4.609922409057617, 4.854955673217773, 5.0999884605407715, 5.3450212478637695, 5.590054512023926, 5.835087299346924, 6.080120086669922, 6.325153350830078, 6.570186138153076, 6.815218925476074, 7.0602521896362305]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 14.0, 5.0, 21.0, 17.0, 25.0, 28.0, 48.0, 57.0, 78.0, 111.0, 203.0, 273.0, 432.0, 645.0, 1132.0, 2098.0, 4243.0, 9720.0, 28407.0, 118142.0, 507203.0, 286289.0, 58897.0, 16959.0, 6454.0, 3050.0, 1520.0, 889.0, 516.0, 328.0, 224.0, 117.0, 108.0, 82.0, 48.0, 50.0, 34.0, 22.0, 14.0, 16.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-8.3046875, -8.05126953125, -7.7978515625, -7.54443359375, -7.291015625, -7.03759765625, -6.7841796875, -6.53076171875, -6.27734375, -6.02392578125, -5.7705078125, -5.51708984375, -5.263671875, -5.01025390625, -4.7568359375, -4.50341796875, -4.25, -3.99658203125, -3.7431640625, -3.48974609375, -3.236328125, -2.98291015625, -2.7294921875, -2.47607421875, -2.22265625, -1.96923828125, -1.7158203125, -1.46240234375, -1.208984375, -0.95556640625, -0.7021484375, -0.44873046875, -0.1953125, 0.05810546875, 0.3115234375, 0.56494140625, 0.818359375, 1.07177734375, 1.3251953125, 1.57861328125, 1.83203125, 2.08544921875, 2.3388671875, 2.59228515625, 2.845703125, 3.09912109375, 3.3525390625, 3.60595703125, 3.859375, 4.11279296875, 4.3662109375, 4.61962890625, 4.873046875, 5.12646484375, 5.3798828125, 5.63330078125, 5.88671875, 6.14013671875, 6.3935546875, 6.64697265625, 6.900390625, 7.15380859375, 7.4072265625, 7.66064453125, 7.9140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 23.0, 31.0, 51.0, 59.0, 104.0, 119.0, 143.0, 108.0, 107.0, 78.0, 59.0, 45.0, 15.0, 17.0, 12.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.7158203125, -1.6736526489257812, -1.6314849853515625, -1.5893173217773438, -1.547149658203125, -1.5049819946289062, -1.4628143310546875, -1.4206466674804688, -1.37847900390625, -1.3363113403320312, -1.2941436767578125, -1.2519760131835938, -1.209808349609375, -1.1676406860351562, -1.1254730224609375, -1.0833053588867188, -1.0411376953125, -0.9989700317382812, -0.9568023681640625, -0.9146347045898438, -0.872467041015625, -0.8302993774414062, -0.7881317138671875, -0.7459640502929688, -0.70379638671875, -0.6616287231445312, -0.6194610595703125, -0.5772933959960938, -0.535125732421875, -0.49295806884765625, -0.4507904052734375, -0.40862274169921875, -0.366455078125, -0.32428741455078125, -0.2821197509765625, -0.23995208740234375, -0.197784423828125, -0.15561676025390625, -0.1134490966796875, -0.07128143310546875, -0.02911376953125, 0.01305389404296875, 0.0552215576171875, 0.09738922119140625, 0.139556884765625, 0.18172454833984375, 0.2238922119140625, 0.26605987548828125, 0.3082275390625, 0.35039520263671875, 0.3925628662109375, 0.43473052978515625, 0.476898193359375, 0.5190658569335938, 0.5612335205078125, 0.6034011840820312, 0.64556884765625, 0.6877365112304688, 0.7299041748046875, 0.7720718383789062, 0.814239501953125, 0.8564071655273438, 0.8985748291015625, 0.9407424926757812, 0.98291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 6.0, 10.0, 17.0, 16.0, 30.0, 39.0, 53.0, 66.0, 96.0, 115.0, 171.0, 217.0, 324.0, 494.0, 825.0, 1394.0, 2634.0, 5356.0, 12699.0, 34510.0, 117190.0, 440508.0, 308330.0, 79078.0, 25108.0, 9559.0, 4283.0, 2027.0, 1155.0, 688.0, 459.0, 291.0, 200.0, 157.0, 111.0, 74.0, 62.0, 45.0, 37.0, 37.0, 16.0, 14.0, 13.0, 9.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.779052734375, -7.52685546875, -7.274658203125, -7.0224609375, -6.770263671875, -6.51806640625, -6.265869140625, -6.013671875, -5.761474609375, -5.50927734375, -5.257080078125, -5.0048828125, -4.752685546875, -4.50048828125, -4.248291015625, -3.99609375, -3.743896484375, -3.49169921875, -3.239501953125, -2.9873046875, -2.735107421875, -2.48291015625, -2.230712890625, -1.978515625, -1.726318359375, -1.47412109375, -1.221923828125, -0.9697265625, -0.717529296875, -0.46533203125, -0.213134765625, 0.0390625, 0.291259765625, 0.54345703125, 0.795654296875, 1.0478515625, 1.300048828125, 1.55224609375, 1.804443359375, 2.056640625, 2.308837890625, 2.56103515625, 2.813232421875, 3.0654296875, 3.317626953125, 3.56982421875, 3.822021484375, 4.07421875, 4.326416015625, 4.57861328125, 4.830810546875, 5.0830078125, 5.335205078125, 5.58740234375, 5.839599609375, 6.091796875, 6.343994140625, 6.59619140625, 6.848388671875, 7.1005859375, 7.352783203125, 7.60498046875, 7.857177734375, 8.109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 8.0, 3.0, 7.0, 12.0, 4.0, 13.0, 14.0, 8.0, 15.0, 22.0, 22.0, 28.0, 34.0, 37.0, 28.0, 40.0, 38.0, 55.0, 41.0, 43.0, 41.0, 48.0, 35.0, 43.0, 40.0, 40.0, 37.0, 36.0, 26.0, 33.0, 22.0, 19.0, 12.0, 21.0, 12.0, 10.0, 9.0, 9.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.46270751953125, -4.3277587890625, -4.19281005859375, -4.057861328125, -3.92291259765625, -3.7879638671875, -3.65301513671875, -3.51806640625, -3.38311767578125, -3.2481689453125, -3.11322021484375, -2.978271484375, -2.84332275390625, -2.7083740234375, -2.57342529296875, -2.4384765625, -2.30352783203125, -2.1685791015625, -2.03363037109375, -1.898681640625, -1.76373291015625, -1.6287841796875, -1.49383544921875, -1.35888671875, -1.22393798828125, -1.0889892578125, -0.95404052734375, -0.819091796875, -0.68414306640625, -0.5491943359375, -0.41424560546875, -0.279296875, -0.14434814453125, -0.0093994140625, 0.12554931640625, 0.260498046875, 0.39544677734375, 0.5303955078125, 0.66534423828125, 0.80029296875, 0.93524169921875, 1.0701904296875, 1.20513916015625, 1.340087890625, 1.47503662109375, 1.6099853515625, 1.74493408203125, 1.8798828125, 2.01483154296875, 2.1497802734375, 2.28472900390625, 2.419677734375, 2.55462646484375, 2.6895751953125, 2.82452392578125, 2.95947265625, 3.09442138671875, 3.2293701171875, 3.36431884765625, 3.499267578125, 3.63421630859375, 3.7691650390625, 3.90411376953125, 4.0390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 4.0, 9.0, 11.0, 14.0, 15.0, 24.0, 35.0, 45.0, 87.0, 113.0, 195.0, 276.0, 432.0, 696.0, 1195.0, 2048.0, 3699.0, 7318.0, 16296.0, 41805.0, 129415.0, 444299.0, 272792.0, 76531.0, 27376.0, 11431.0, 5435.0, 2822.0, 1521.0, 995.0, 561.0, 363.0, 211.0, 144.0, 117.0, 64.0, 54.0, 27.0, 25.0, 19.0, 14.0, 6.0, 10.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.99609375, -4.860260009765625, -4.72442626953125, -4.588592529296875, -4.4527587890625, -4.316925048828125, -4.18109130859375, -4.045257568359375, -3.909423828125, -3.773590087890625, -3.63775634765625, -3.501922607421875, -3.3660888671875, -3.230255126953125, -3.09442138671875, -2.958587646484375, -2.82275390625, -2.686920166015625, -2.55108642578125, -2.415252685546875, -2.2794189453125, -2.143585205078125, -2.00775146484375, -1.871917724609375, -1.736083984375, -1.600250244140625, -1.46441650390625, -1.328582763671875, -1.1927490234375, -1.056915283203125, -0.92108154296875, -0.785247802734375, -0.6494140625, -0.513580322265625, -0.37774658203125, -0.241912841796875, -0.1060791015625, 0.029754638671875, 0.16558837890625, 0.301422119140625, 0.437255859375, 0.573089599609375, 0.70892333984375, 0.844757080078125, 0.9805908203125, 1.116424560546875, 1.25225830078125, 1.388092041015625, 1.52392578125, 1.659759521484375, 1.79559326171875, 1.931427001953125, 2.0672607421875, 2.203094482421875, 2.33892822265625, 2.474761962890625, 2.610595703125, 2.746429443359375, 2.88226318359375, 3.018096923828125, 3.1539306640625, 3.289764404296875, 3.42559814453125, 3.561431884765625, 3.697265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 9.0, 10.0, 16.0, 16.0, 28.0, 27.0, 27.0, 48.0, 44.0, 70.0, 103.0, 134.0, 109.0, 89.0, 55.0, 47.0, 26.0, 27.0, 18.0, 11.0, 14.0, 13.0, 15.0, 6.0, 5.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0007486343383789062, -0.0007256194949150085, -0.0007026046514511108, -0.0006795898079872131, -0.0006565749645233154, -0.0006335601210594177, -0.00061054527759552, -0.0005875304341316223, -0.0005645155906677246, -0.0005415007472038269, -0.0005184859037399292, -0.0004954710602760315, -0.0004724562168121338, -0.0004494413733482361, -0.0004264265298843384, -0.0004034116864204407, -0.00038039684295654297, -0.00035738199949264526, -0.00033436715602874756, -0.00031135231256484985, -0.00028833746910095215, -0.00026532262563705444, -0.00024230778217315674, -0.00021929293870925903, -0.00019627809524536133, -0.00017326325178146362, -0.00015024840831756592, -0.0001272335648536682, -0.00010421872138977051, -8.12038779258728e-05, -5.81890344619751e-05, -3.517419099807739e-05, -1.2159347534179688e-05, 1.0855495929718018e-05, 3.387033939361572e-05, 5.688518285751343e-05, 7.990002632141113e-05, 0.00010291486978530884, 0.00012592971324920654, 0.00014894455671310425, 0.00017195940017700195, 0.00019497424364089966, 0.00021798908710479736, 0.00024100393056869507, 0.0002640187740325928, 0.0002870336174964905, 0.0003100484609603882, 0.0003330633044242859, 0.0003560781478881836, 0.0003790929913520813, 0.000402107834815979, 0.0004251226782798767, 0.0004481375217437744, 0.0004711523652076721, 0.0004941672086715698, 0.0005171820521354675, 0.0005401968955993652, 0.0005632117390632629, 0.0005862265825271606, 0.0006092414259910583, 0.0006322562694549561, 0.0006552711129188538, 0.0006782859563827515, 0.0007013007998466492, 0.0007243156433105469]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 10.0, 16.0, 18.0, 28.0, 44.0, 56.0, 90.0, 113.0, 238.0, 315.0, 620.0, 1166.0, 2493.0, 6210.0, 20075.0, 88619.0, 583678.0, 277204.0, 47051.0, 12197.0, 4333.0, 1844.0, 885.0, 472.0, 271.0, 163.0, 110.0, 80.0, 40.0, 34.0, 30.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.59375, -7.36907958984375, -7.1444091796875, -6.91973876953125, -6.695068359375, -6.47039794921875, -6.2457275390625, -6.02105712890625, -5.79638671875, -5.57171630859375, -5.3470458984375, -5.12237548828125, -4.897705078125, -4.67303466796875, -4.4483642578125, -4.22369384765625, -3.9990234375, -3.77435302734375, -3.5496826171875, -3.32501220703125, -3.100341796875, -2.87567138671875, -2.6510009765625, -2.42633056640625, -2.20166015625, -1.97698974609375, -1.7523193359375, -1.52764892578125, -1.302978515625, -1.07830810546875, -0.8536376953125, -0.62896728515625, -0.404296875, -0.17962646484375, 0.0450439453125, 0.26971435546875, 0.494384765625, 0.71905517578125, 0.9437255859375, 1.16839599609375, 1.39306640625, 1.61773681640625, 1.8424072265625, 2.06707763671875, 2.291748046875, 2.51641845703125, 2.7410888671875, 2.96575927734375, 3.1904296875, 3.41510009765625, 3.6397705078125, 3.86444091796875, 4.089111328125, 4.31378173828125, 4.5384521484375, 4.76312255859375, 4.98779296875, 5.21246337890625, 5.4371337890625, 5.66180419921875, 5.886474609375, 6.11114501953125, 6.3358154296875, 6.56048583984375, 6.78515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 7.0, 11.0, 16.0, 17.0, 18.0, 24.0, 31.0, 40.0, 41.0, 72.0, 97.0, 124.0, 96.0, 85.0, 62.0, 47.0, 36.0, 29.0, 25.0, 30.0, 16.0, 15.0, 8.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.4114990234375, -3.301513671875, -3.1915283203125, -3.08154296875, -2.9715576171875, -2.861572265625, -2.7515869140625, -2.6416015625, -2.5316162109375, -2.421630859375, -2.3116455078125, -2.20166015625, -2.0916748046875, -1.981689453125, -1.8717041015625, -1.76171875, -1.6517333984375, -1.541748046875, -1.4317626953125, -1.32177734375, -1.2117919921875, -1.101806640625, -0.9918212890625, -0.8818359375, -0.7718505859375, -0.661865234375, -0.5518798828125, -0.44189453125, -0.3319091796875, -0.221923828125, -0.1119384765625, -0.001953125, 0.1080322265625, 0.218017578125, 0.3280029296875, 0.43798828125, 0.5479736328125, 0.657958984375, 0.7679443359375, 0.8779296875, 0.9879150390625, 1.097900390625, 1.2078857421875, 1.31787109375, 1.4278564453125, 1.537841796875, 1.6478271484375, 1.7578125, 1.8677978515625, 1.977783203125, 2.0877685546875, 2.19775390625, 2.3077392578125, 2.417724609375, 2.5277099609375, 2.6376953125, 2.7476806640625, 2.857666015625, 2.9676513671875, 3.07763671875, 3.1876220703125, 3.297607421875, 3.4075927734375, 3.517578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 23.0, 30.0, 58.0, 87.0, 163.0, 195.0, 142.0, 109.0, 58.0, 46.0, 22.0, 18.0, 10.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.97011184692383, -50.0161247253418, -48.06214141845703, -46.108154296875, -44.15416717529297, -42.20018005371094, -40.24619674682617, -38.29220962524414, -36.338226318359375, -34.384239196777344, -32.43025588989258, -30.476268768310547, -28.522281646728516, -26.568296432495117, -24.61431121826172, -22.660324096679688, -20.706336975097656, -18.752351760864258, -16.798364639282227, -14.844379425048828, -12.890393257141113, -10.936407089233398, -8.982421875, -7.028435707092285, -5.07444953918457, -3.1204636096954346, -1.1664776802062988, 0.7875080108642578, 2.7414941787719727, 4.6954803466796875, 6.649465560913086, 8.6034517288208, 10.557441711425781, 12.511427879333496, 14.465414047241211, 16.41939926147461, 18.37338638305664, 20.32737159729004, 22.281356811523438, 24.23534393310547, 26.189329147338867, 28.143314361572266, 30.097301483154297, 32.05128479003906, 34.005271911621094, 35.959259033203125, 37.913246154785156, 39.86722946166992, 41.82121658325195, 43.775203704833984, 45.72918701171875, 47.68317413330078, 49.63716125488281, 51.591148376464844, 53.54513168334961, 55.49911880493164, 57.453102111816406, 59.40708923339844, 61.3610725402832, 63.315059661865234, 65.26904296875, 67.22303009033203, 69.17701721191406, 71.1310043334961, 73.08499145507812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 7.0, 8.0, 6.0, 8.0, 19.0, 24.0, 16.0, 16.0, 17.0, 26.0, 30.0, 24.0, 28.0, 52.0, 55.0, 38.0, 46.0, 51.0, 47.0, 35.0, 41.0, 34.0, 40.0, 29.0, 34.0, 26.0, 35.0, 35.0, 22.0, 31.0, 18.0, 23.0, 13.0, 14.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.17507553100586, -28.222301483154297, -27.269527435302734, -26.316753387451172, -25.363981246948242, -24.41120719909668, -23.458433151245117, -22.505659103393555, -21.552885055541992, -20.60011100769043, -19.647336959838867, -18.694564819335938, -17.741790771484375, -16.789016723632812, -15.83624267578125, -14.883468627929688, -13.930695533752441, -12.977921485900879, -12.025148391723633, -11.07237434387207, -10.119600296020508, -9.166826248168945, -8.2140531539917, -7.261279106140137, -6.308505535125732, -5.355731964111328, -4.402957916259766, -3.4501843452453613, -2.497410535812378, -1.5446367263793945, -0.5918631553649902, 0.36091089248657227, 1.3136844635009766, 2.26645827293396, 3.2192320823669434, 4.172005653381348, 5.12477970123291, 6.0775532722473145, 7.030326843261719, 7.983100891113281, 8.935874938964844, 9.888648986816406, 10.841422080993652, 11.794196128845215, 12.746970176696777, 13.699743270874023, 14.652517318725586, 15.605291366577148, 16.558063507080078, 17.51083755493164, 18.463611602783203, 19.416385650634766, 20.369157791137695, 21.321931838989258, 22.27470588684082, 23.227479934692383, 24.180253982543945, 25.133028030395508, 26.08580207824707, 27.03857421875, 27.991348266601562, 28.944122314453125, 29.896896362304688, 30.84967041015625, 31.802444458007812]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 5.0, 7.0, 9.0, 14.0, 11.0, 12.0, 18.0, 33.0, 39.0, 52.0, 106.0, 116.0, 160.0, 260.0, 421.0, 616.0, 1204.0, 2449.0, 5741.0, 17776.0, 98953.0, 3834051.0, 192741.0, 25806.0, 7664.0, 2956.0, 1357.0, 714.0, 370.0, 202.0, 134.0, 96.0, 48.0, 40.0, 20.0, 19.0, 8.0, 8.0, 8.0, 11.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-14.21875, -13.8505859375, -13.482421875, -13.1142578125, -12.74609375, -12.3779296875, -12.009765625, -11.6416015625, -11.2734375, -10.9052734375, -10.537109375, -10.1689453125, -9.80078125, -9.4326171875, -9.064453125, -8.6962890625, -8.328125, -7.9599609375, -7.591796875, -7.2236328125, -6.85546875, -6.4873046875, -6.119140625, -5.7509765625, -5.3828125, -5.0146484375, -4.646484375, -4.2783203125, -3.91015625, -3.5419921875, -3.173828125, -2.8056640625, -2.4375, -2.0693359375, -1.701171875, -1.3330078125, -0.96484375, -0.5966796875, -0.228515625, 0.1396484375, 0.5078125, 0.8759765625, 1.244140625, 1.6123046875, 1.98046875, 2.3486328125, 2.716796875, 3.0849609375, 3.453125, 3.8212890625, 4.189453125, 4.5576171875, 4.92578125, 5.2939453125, 5.662109375, 6.0302734375, 6.3984375, 6.7666015625, 7.134765625, 7.5029296875, 7.87109375, 8.2392578125, 8.607421875, 8.9755859375, 9.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 13.0, 19.0, 24.0, 53.0, 72.0, 86.0, 95.0, 101.0, 93.0, 83.0, 73.0, 88.0, 56.0, 46.0, 30.0, 9.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.765625, -1.7216796875, -1.677734375, -1.6337890625, -1.58984375, -1.5458984375, -1.501953125, -1.4580078125, -1.4140625, -1.3701171875, -1.326171875, -1.2822265625, -1.23828125, -1.1943359375, -1.150390625, -1.1064453125, -1.0625, -1.0185546875, -0.974609375, -0.9306640625, -0.88671875, -0.8427734375, -0.798828125, -0.7548828125, -0.7109375, -0.6669921875, -0.623046875, -0.5791015625, -0.53515625, -0.4912109375, -0.447265625, -0.4033203125, -0.359375, -0.3154296875, -0.271484375, -0.2275390625, -0.18359375, -0.1396484375, -0.095703125, -0.0517578125, -0.0078125, 0.0361328125, 0.080078125, 0.1240234375, 0.16796875, 0.2119140625, 0.255859375, 0.2998046875, 0.34375, 0.3876953125, 0.431640625, 0.4755859375, 0.51953125, 0.5634765625, 0.607421875, 0.6513671875, 0.6953125, 0.7392578125, 0.783203125, 0.8271484375, 0.87109375, 0.9150390625, 0.958984375, 1.0029296875, 1.046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 11.0, 15.0, 20.0, 28.0, 61.0, 68.0, 109.0, 153.0, 260.0, 473.0, 732.0, 1274.0, 2446.0, 5119.0, 12774.0, 38913.0, 188046.0, 3380090.0, 466223.0, 64358.0, 18913.0, 7123.0, 3219.0, 1615.0, 925.0, 487.0, 281.0, 173.0, 112.0, 83.0, 58.0, 29.0, 20.0, 20.0, 9.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.796875, -8.54327392578125, -8.2896728515625, -8.03607177734375, -7.782470703125, -7.52886962890625, -7.2752685546875, -7.02166748046875, -6.76806640625, -6.51446533203125, -6.2608642578125, -6.00726318359375, -5.753662109375, -5.50006103515625, -5.2464599609375, -4.99285888671875, -4.7392578125, -4.48565673828125, -4.2320556640625, -3.97845458984375, -3.724853515625, -3.47125244140625, -3.2176513671875, -2.96405029296875, -2.71044921875, -2.45684814453125, -2.2032470703125, -1.94964599609375, -1.696044921875, -1.44244384765625, -1.1888427734375, -0.93524169921875, -0.681640625, -0.42803955078125, -0.1744384765625, 0.07916259765625, 0.332763671875, 0.58636474609375, 0.8399658203125, 1.09356689453125, 1.34716796875, 1.60076904296875, 1.8543701171875, 2.10797119140625, 2.361572265625, 2.61517333984375, 2.8687744140625, 3.12237548828125, 3.3759765625, 3.62957763671875, 3.8831787109375, 4.13677978515625, 4.390380859375, 4.64398193359375, 4.8975830078125, 5.15118408203125, 5.40478515625, 5.65838623046875, 5.9119873046875, 6.16558837890625, 6.419189453125, 6.67279052734375, 6.9263916015625, 7.17999267578125, 7.43359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 10.0, 6.0, 16.0, 20.0, 30.0, 33.0, 55.0, 89.0, 114.0, 224.0, 548.0, 1644.0, 624.0, 252.0, 120.0, 82.0, 48.0, 36.0, 25.0, 20.0, 18.0, 9.0, 13.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.326171875, -2.262542724609375, -2.19891357421875, -2.135284423828125, -2.0716552734375, -2.008026123046875, -1.94439697265625, -1.880767822265625, -1.817138671875, -1.753509521484375, -1.68988037109375, -1.626251220703125, -1.5626220703125, -1.498992919921875, -1.43536376953125, -1.371734619140625, -1.30810546875, -1.244476318359375, -1.18084716796875, -1.117218017578125, -1.0535888671875, -0.989959716796875, -0.92633056640625, -0.862701416015625, -0.799072265625, -0.735443115234375, -0.67181396484375, -0.608184814453125, -0.5445556640625, -0.480926513671875, -0.41729736328125, -0.353668212890625, -0.2900390625, -0.226409912109375, -0.16278076171875, -0.099151611328125, -0.0355224609375, 0.028106689453125, 0.09173583984375, 0.155364990234375, 0.218994140625, 0.282623291015625, 0.34625244140625, 0.409881591796875, 0.4735107421875, 0.537139892578125, 0.60076904296875, 0.664398193359375, 0.72802734375, 0.791656494140625, 0.85528564453125, 0.918914794921875, 0.9825439453125, 1.046173095703125, 1.10980224609375, 1.173431396484375, 1.237060546875, 1.300689697265625, 1.36431884765625, 1.427947998046875, 1.4915771484375, 1.555206298828125, 1.61883544921875, 1.682464599609375, 1.74609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 10.0, 24.0, 91.0, 210.0, 323.0, 209.0, 86.0, 32.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.86993408203125, -24.92953109741211, -23.989126205444336, -23.048723220825195, -22.108318328857422, -21.16791534423828, -20.227510452270508, -19.287107467651367, -18.346702575683594, -17.406299591064453, -16.46589469909668, -15.525490760803223, -14.585086822509766, -13.644683837890625, -12.704278945922852, -11.763875961303711, -10.823472023010254, -9.883068084716797, -8.94266414642334, -8.002260208129883, -7.061856269836426, -6.121452808380127, -5.18104887008667, -4.240644931793213, -3.300240993499756, -2.359837055206299, -1.4194332361221313, -0.47902941703796387, 0.46137452125549316, 1.401778221130371, 2.342182159423828, 3.282586097717285, 4.222990036010742, 5.163393974304199, 6.103797912597656, 7.044201850891113, 7.98460578918457, 8.925008773803711, 9.865413665771484, 10.805816650390625, 11.746221542358398, 12.686625480651855, 13.627029418945312, 14.56743335723877, 15.507837295532227, 16.448240280151367, 17.38864517211914, 18.32904815673828, 19.269451141357422, 20.209854125976562, 21.150259017944336, 22.090662002563477, 23.03106689453125, 23.97146987915039, 24.911874771118164, 25.852277755737305, 26.792682647705078, 27.73308563232422, 28.673490524291992, 29.613893508911133, 30.554298400878906, 31.494701385498047, 32.43510437011719, 33.375511169433594, 34.315914154052734]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 15.0, 13.0, 16.0, 24.0, 32.0, 21.0, 26.0, 30.0, 38.0, 40.0, 53.0, 47.0, 43.0, 59.0, 57.0, 48.0, 45.0, 56.0, 53.0, 39.0, 33.0, 33.0, 20.0, 31.0, 18.0, 19.0, 15.0, 8.0, 9.0, 5.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.428889274597168, -7.2026143074035645, -6.976339817047119, -6.750064849853516, -6.52379035949707, -6.297515392303467, -6.0712409019470215, -5.844965934753418, -5.618691444396973, -5.392416477203369, -5.166141986846924, -4.93986701965332, -4.713592529296875, -4.4873175621032715, -4.261043071746826, -4.034768104553223, -3.8084933757781982, -3.582218647003174, -3.3559439182281494, -3.129669189453125, -2.9033944606781006, -2.677119731903076, -2.4508447647094727, -2.2245702743530273, -1.9982954263687134, -1.772020697593689, -1.5457459688186646, -1.3194711208343506, -1.0931963920593262, -0.8669216632843018, -0.6406469345092773, -0.41437220573425293, -0.18809747695922852, 0.03817726671695709, 0.2644520103931427, 0.4907267689704895, 0.7170014977455139, 0.9432762861251831, 1.1695510149002075, 1.395825743675232, 1.6221004724502563, 1.8483752012252808, 2.0746500492095947, 2.300924777984619, 2.5271995067596436, 2.753474235534668, 2.9797489643096924, 3.206023693084717, 3.432298421859741, 3.6585731506347656, 3.88484787940979, 4.1111226081848145, 4.337397575378418, 4.563672065734863, 4.789947032928467, 5.016221523284912, 5.242496490478516, 5.468771457672119, 5.6950459480285645, 5.921320915222168, 6.147595405578613, 6.373870372772217, 6.600144863128662, 6.826419830322266, 7.052694320678711]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 12.0, 9.0, 15.0, 18.0, 22.0, 18.0, 29.0, 43.0, 54.0, 68.0, 83.0, 97.0, 167.0, 286.0, 393.0, 709.0, 1067.0, 1922.0, 3557.0, 7408.0, 17448.0, 47829.0, 158336.0, 440516.0, 250044.0, 73208.0, 24670.0, 10009.0, 4560.0, 2344.0, 1258.0, 792.0, 489.0, 312.0, 212.0, 141.0, 85.0, 70.0, 50.0, 53.0, 27.0, 22.0, 22.0, 20.0, 11.0, 20.0, 7.0, 4.0, 1.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.8951416015625, -5.696533203125, -5.4979248046875, -5.29931640625, -5.1007080078125, -4.902099609375, -4.7034912109375, -4.5048828125, -4.3062744140625, -4.107666015625, -3.9090576171875, -3.71044921875, -3.5118408203125, -3.313232421875, -3.1146240234375, -2.916015625, -2.7174072265625, -2.518798828125, -2.3201904296875, -2.12158203125, -1.9229736328125, -1.724365234375, -1.5257568359375, -1.3271484375, -1.1285400390625, -0.929931640625, -0.7313232421875, -0.53271484375, -0.3341064453125, -0.135498046875, 0.0631103515625, 0.26171875, 0.4603271484375, 0.658935546875, 0.8575439453125, 1.05615234375, 1.2547607421875, 1.453369140625, 1.6519775390625, 1.8505859375, 2.0491943359375, 2.247802734375, 2.4464111328125, 2.64501953125, 2.8436279296875, 3.042236328125, 3.2408447265625, 3.439453125, 3.6380615234375, 3.836669921875, 4.0352783203125, 4.23388671875, 4.4324951171875, 4.631103515625, 4.8297119140625, 5.0283203125, 5.2269287109375, 5.425537109375, 5.6241455078125, 5.82275390625, 6.0213623046875, 6.219970703125, 6.4185791015625, 6.6171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 3.0, 5.0, 16.0, 24.0, 38.0, 47.0, 51.0, 66.0, 97.0, 85.0, 97.0, 87.0, 99.0, 75.0, 56.0, 41.0, 34.0, 27.0, 16.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.66796875, -1.625762939453125, -1.58355712890625, -1.541351318359375, -1.4991455078125, -1.456939697265625, -1.41473388671875, -1.372528076171875, -1.330322265625, -1.288116455078125, -1.24591064453125, -1.203704833984375, -1.1614990234375, -1.119293212890625, -1.07708740234375, -1.034881591796875, -0.99267578125, -0.950469970703125, -0.90826416015625, -0.866058349609375, -0.8238525390625, -0.781646728515625, -0.73944091796875, -0.697235107421875, -0.655029296875, -0.612823486328125, -0.57061767578125, -0.528411865234375, -0.4862060546875, -0.444000244140625, -0.40179443359375, -0.359588623046875, -0.3173828125, -0.275177001953125, -0.23297119140625, -0.190765380859375, -0.1485595703125, -0.106353759765625, -0.06414794921875, -0.021942138671875, 0.020263671875, 0.062469482421875, 0.10467529296875, 0.146881103515625, 0.1890869140625, 0.231292724609375, 0.27349853515625, 0.315704345703125, 0.35791015625, 0.400115966796875, 0.44232177734375, 0.484527587890625, 0.5267333984375, 0.568939208984375, 0.61114501953125, 0.653350830078125, 0.695556640625, 0.737762451171875, 0.77996826171875, 0.822174072265625, 0.8643798828125, 0.906585693359375, 0.94879150390625, 0.990997314453125, 1.033203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 17.0, 34.0, 39.0, 50.0, 57.0, 98.0, 129.0, 218.0, 326.0, 495.0, 759.0, 1397.0, 2684.0, 5743.0, 15036.0, 45496.0, 165205.0, 467496.0, 242262.0, 65672.0, 20252.0, 7560.0, 3356.0, 1576.0, 909.0, 546.0, 361.0, 241.0, 133.0, 114.0, 74.0, 63.0, 35.0, 26.0, 25.0, 12.0, 7.0, 8.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.453125, -6.24920654296875, -6.0452880859375, -5.84136962890625, -5.637451171875, -5.43353271484375, -5.2296142578125, -5.02569580078125, -4.82177734375, -4.61785888671875, -4.4139404296875, -4.21002197265625, -4.006103515625, -3.80218505859375, -3.5982666015625, -3.39434814453125, -3.1904296875, -2.98651123046875, -2.7825927734375, -2.57867431640625, -2.374755859375, -2.17083740234375, -1.9669189453125, -1.76300048828125, -1.55908203125, -1.35516357421875, -1.1512451171875, -0.94732666015625, -0.743408203125, -0.53948974609375, -0.3355712890625, -0.13165283203125, 0.072265625, 0.27618408203125, 0.4801025390625, 0.68402099609375, 0.887939453125, 1.09185791015625, 1.2957763671875, 1.49969482421875, 1.70361328125, 1.90753173828125, 2.1114501953125, 2.31536865234375, 2.519287109375, 2.72320556640625, 2.9271240234375, 3.13104248046875, 3.3349609375, 3.53887939453125, 3.7427978515625, 3.94671630859375, 4.150634765625, 4.35455322265625, 4.5584716796875, 4.76239013671875, 4.96630859375, 5.17022705078125, 5.3741455078125, 5.57806396484375, 5.781982421875, 5.98590087890625, 6.1898193359375, 6.39373779296875, 6.59765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 13.0, 10.0, 19.0, 25.0, 27.0, 27.0, 50.0, 50.0, 46.0, 63.0, 61.0, 67.0, 82.0, 63.0, 58.0, 59.0, 47.0, 46.0, 29.0, 29.0, 26.0, 18.0, 14.0, 15.0, 9.0, 6.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5594482421875, -4.376708984375, -4.1939697265625, -4.01123046875, -3.8284912109375, -3.645751953125, -3.4630126953125, -3.2802734375, -3.0975341796875, -2.914794921875, -2.7320556640625, -2.54931640625, -2.3665771484375, -2.183837890625, -2.0010986328125, -1.818359375, -1.6356201171875, -1.452880859375, -1.2701416015625, -1.08740234375, -0.9046630859375, -0.721923828125, -0.5391845703125, -0.3564453125, -0.1737060546875, 0.009033203125, 0.1917724609375, 0.37451171875, 0.5572509765625, 0.739990234375, 0.9227294921875, 1.10546875, 1.2882080078125, 1.470947265625, 1.6536865234375, 1.83642578125, 2.0191650390625, 2.201904296875, 2.3846435546875, 2.5673828125, 2.7501220703125, 2.932861328125, 3.1156005859375, 3.29833984375, 3.4810791015625, 3.663818359375, 3.8465576171875, 4.029296875, 4.2120361328125, 4.394775390625, 4.5775146484375, 4.76025390625, 4.9429931640625, 5.125732421875, 5.3084716796875, 5.4912109375, 5.6739501953125, 5.856689453125, 6.0394287109375, 6.22216796875, 6.4049072265625, 6.587646484375, 6.7703857421875, 6.953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 10.0, 14.0, 16.0, 24.0, 32.0, 33.0, 69.0, 138.0, 193.0, 356.0, 644.0, 1278.0, 2607.0, 6402.0, 18130.0, 65355.0, 301111.0, 479688.0, 124545.0, 30595.0, 9868.0, 3852.0, 1670.0, 797.0, 466.0, 226.0, 141.0, 93.0, 63.0, 42.0, 24.0, 22.0, 13.0, 15.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.994140625, -2.895050048828125, -2.79595947265625, -2.696868896484375, -2.5977783203125, -2.498687744140625, -2.39959716796875, -2.300506591796875, -2.201416015625, -2.102325439453125, -2.00323486328125, -1.904144287109375, -1.8050537109375, -1.705963134765625, -1.60687255859375, -1.507781982421875, -1.40869140625, -1.309600830078125, -1.21051025390625, -1.111419677734375, -1.0123291015625, -0.913238525390625, -0.81414794921875, -0.715057373046875, -0.615966796875, -0.516876220703125, -0.41778564453125, -0.318695068359375, -0.2196044921875, -0.120513916015625, -0.02142333984375, 0.077667236328125, 0.1767578125, 0.275848388671875, 0.37493896484375, 0.474029541015625, 0.5731201171875, 0.672210693359375, 0.77130126953125, 0.870391845703125, 0.969482421875, 1.068572998046875, 1.16766357421875, 1.266754150390625, 1.3658447265625, 1.464935302734375, 1.56402587890625, 1.663116455078125, 1.76220703125, 1.861297607421875, 1.96038818359375, 2.059478759765625, 2.1585693359375, 2.257659912109375, 2.35675048828125, 2.455841064453125, 2.554931640625, 2.654022216796875, 2.75311279296875, 2.852203369140625, 2.9512939453125, 3.050384521484375, 3.14947509765625, 3.248565673828125, 3.34765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 7.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 8.0, 6.0, 15.0, 21.0, 20.0, 34.0, 52.0, 49.0, 61.0, 71.0, 81.0, 88.0, 103.0, 68.0, 50.0, 59.0, 39.0, 30.0, 17.0, 21.0, 19.0, 12.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0005655288696289062, -0.0005508400499820709, -0.0005361512303352356, -0.0005214624106884003, -0.0005067735910415649, -0.0004920847713947296, -0.0004773959517478943, -0.00046270713210105896, -0.00044801831245422363, -0.0004333294928073883, -0.000418640673160553, -0.00040395185351371765, -0.0003892630338668823, -0.000374574214220047, -0.00035988539457321167, -0.00034519657492637634, -0.000330507755279541, -0.0003158189356327057, -0.00030113011598587036, -0.00028644129633903503, -0.0002717524766921997, -0.0002570636570453644, -0.00024237483739852905, -0.00022768601775169373, -0.0002129971981048584, -0.00019830837845802307, -0.00018361955881118774, -0.00016893073916435242, -0.0001542419195175171, -0.00013955309987068176, -0.00012486428022384644, -0.00011017546057701111, -9.548664093017578e-05, -8.079782128334045e-05, -6.610900163650513e-05, -5.14201819896698e-05, -3.673136234283447e-05, -2.2042542695999146e-05, -7.353723049163818e-06, 7.335096597671509e-06, 2.2023916244506836e-05, 3.671273589134216e-05, 5.140155553817749e-05, 6.609037518501282e-05, 8.077919483184814e-05, 9.546801447868347e-05, 0.0001101568341255188, 0.00012484565377235413, 0.00013953447341918945, 0.00015422329306602478, 0.0001689121127128601, 0.00018360093235969543, 0.00019828975200653076, 0.0002129785716533661, 0.00022766739130020142, 0.00024235621094703674, 0.00025704503059387207, 0.0002717338502407074, 0.0002864226698875427, 0.00030111148953437805, 0.0003158003091812134, 0.0003304891288280487, 0.00034517794847488403, 0.00035986676812171936, 0.0003745555877685547]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 7.0, 12.0, 12.0, 21.0, 25.0, 44.0, 54.0, 81.0, 111.0, 192.0, 289.0, 449.0, 837.0, 1610.0, 3553.0, 8610.0, 25865.0, 100688.0, 454615.0, 346907.0, 71466.0, 19916.0, 6954.0, 2948.0, 1393.0, 739.0, 413.0, 252.0, 174.0, 91.0, 60.0, 49.0, 25.0, 21.0, 15.0, 7.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.783111572265625, -2.67559814453125, -2.568084716796875, -2.4605712890625, -2.353057861328125, -2.24554443359375, -2.138031005859375, -2.030517578125, -1.923004150390625, -1.81549072265625, -1.707977294921875, -1.6004638671875, -1.492950439453125, -1.38543701171875, -1.277923583984375, -1.17041015625, -1.062896728515625, -0.95538330078125, -0.847869873046875, -0.7403564453125, -0.632843017578125, -0.52532958984375, -0.417816162109375, -0.310302734375, -0.202789306640625, -0.09527587890625, 0.012237548828125, 0.1197509765625, 0.227264404296875, 0.33477783203125, 0.442291259765625, 0.5498046875, 0.657318115234375, 0.76483154296875, 0.872344970703125, 0.9798583984375, 1.087371826171875, 1.19488525390625, 1.302398681640625, 1.409912109375, 1.517425537109375, 1.62493896484375, 1.732452392578125, 1.8399658203125, 1.947479248046875, 2.05499267578125, 2.162506103515625, 2.27001953125, 2.377532958984375, 2.48504638671875, 2.592559814453125, 2.7000732421875, 2.807586669921875, 2.91510009765625, 3.022613525390625, 3.130126953125, 3.237640380859375, 3.34515380859375, 3.452667236328125, 3.5601806640625, 3.667694091796875, 3.77520751953125, 3.882720947265625, 3.990234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 14.0, 16.0, 30.0, 43.0, 40.0, 40.0, 50.0, 52.0, 53.0, 65.0, 78.0, 56.0, 51.0, 68.0, 54.0, 43.0, 40.0, 31.0, 22.0, 19.0, 14.0, 15.0, 7.0, 13.0, 9.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.521484375, -1.464324951171875, -1.40716552734375, -1.350006103515625, -1.2928466796875, -1.235687255859375, -1.17852783203125, -1.121368408203125, -1.064208984375, -1.007049560546875, -0.94989013671875, -0.892730712890625, -0.8355712890625, -0.778411865234375, -0.72125244140625, -0.664093017578125, -0.60693359375, -0.549774169921875, -0.49261474609375, -0.435455322265625, -0.3782958984375, -0.321136474609375, -0.26397705078125, -0.206817626953125, -0.149658203125, -0.092498779296875, -0.03533935546875, 0.021820068359375, 0.0789794921875, 0.136138916015625, 0.19329833984375, 0.250457763671875, 0.3076171875, 0.364776611328125, 0.42193603515625, 0.479095458984375, 0.5362548828125, 0.593414306640625, 0.65057373046875, 0.707733154296875, 0.764892578125, 0.822052001953125, 0.87921142578125, 0.936370849609375, 0.9935302734375, 1.050689697265625, 1.10784912109375, 1.165008544921875, 1.22216796875, 1.279327392578125, 1.33648681640625, 1.393646240234375, 1.4508056640625, 1.507965087890625, 1.56512451171875, 1.622283935546875, 1.679443359375, 1.736602783203125, 1.79376220703125, 1.850921630859375, 1.9080810546875, 1.965240478515625, 2.02239990234375, 2.079559326171875, 2.13671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 22.0, 24.0, 49.0, 52.0, 98.0, 102.0, 130.0, 117.0, 130.0, 93.0, 63.0, 39.0, 21.0, 16.0, 6.0, 9.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.254756927490234, -30.047578811645508, -28.84040069580078, -27.633222579956055, -26.426044464111328, -25.21886444091797, -24.011686325073242, -22.804508209228516, -21.59733009338379, -20.390151977539062, -19.182973861694336, -17.97579574584961, -16.76861572265625, -15.56143856048584, -14.354259490966797, -13.14708137512207, -11.939903259277344, -10.732725143432617, -9.52554702758789, -8.318367958068848, -7.111189842224121, -5.9040117263793945, -4.69683313369751, -3.489654541015625, -2.2824764251708984, -1.0752980709075928, 0.1318802833557129, 1.3390586376190186, 2.546236991882324, 3.753415107727051, 4.9605937004089355, 6.16777229309082, 7.374946594238281, 8.582124710083008, 9.789302825927734, 10.996481895446777, 12.203660011291504, 13.41083812713623, 14.618017196655273, 15.8251953125, 17.032373428344727, 18.239551544189453, 19.44672966003418, 20.653907775878906, 21.861087799072266, 23.06826400756836, 24.27544403076172, 25.482622146606445, 26.689800262451172, 27.8969783782959, 29.104156494140625, 30.31133460998535, 31.518512725830078, 32.72569274902344, 33.93286895751953, 35.14004898071289, 36.34722900390625, 37.55440902709961, 38.7615852355957, 39.96876525878906, 41.175941467285156, 42.383121490478516, 43.59029769897461, 44.79747772216797, 46.00465393066406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 9.0, 8.0, 9.0, 12.0, 11.0, 10.0, 22.0, 15.0, 21.0, 29.0, 37.0, 25.0, 29.0, 46.0, 35.0, 37.0, 33.0, 52.0, 40.0, 51.0, 55.0, 46.0, 42.0, 36.0, 32.0, 34.0, 23.0, 28.0, 28.0, 25.0, 17.0, 17.0, 17.0, 18.0, 8.0, 5.0, 7.0, 2.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.670129776000977, -22.955322265625, -22.240516662597656, -21.52570915222168, -20.810901641845703, -20.09609603881836, -19.381288528442383, -18.666481018066406, -17.951675415039062, -17.236867904663086, -16.522062301635742, -15.807254791259766, -15.092448234558105, -14.377641677856445, -13.662834167480469, -12.948027610778809, -12.233221054077148, -11.518414497375488, -10.803607940673828, -10.088800430297852, -9.373993873596191, -8.659187316894531, -7.944380283355713, -7.2295732498168945, -6.514766693115234, -5.799960136413574, -5.085153102874756, -4.3703460693359375, -3.6555395126342773, -2.940732717514038, -2.225925922393799, -1.5111188888549805, -0.7963104248046875, -0.08150362968444824, 0.633303165435791, 1.3481099605560303, 2.0629167556762695, 2.777723550796509, 3.492530345916748, 4.207337379455566, 4.922143936157227, 5.636950492858887, 6.351757526397705, 7.066564559936523, 7.781371116638184, 8.496177673339844, 9.21098518371582, 9.92579174041748, 10.64059829711914, 11.3554048538208, 12.070211410522461, 12.785018920898438, 13.499825477600098, 14.214632034301758, 14.929439544677734, 15.644246101379395, 16.359052658081055, 17.07386016845703, 17.788665771484375, 18.50347328186035, 19.218280792236328, 19.933086395263672, 20.64789390563965, 21.362701416015625, 22.07750701904297]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 8.0, 17.0, 15.0, 16.0, 24.0, 37.0, 49.0, 89.0, 91.0, 138.0, 216.0, 403.0, 584.0, 1096.0, 2085.0, 4552.0, 11770.0, 44440.0, 1119618.0, 2935486.0, 50841.0, 12911.0, 4840.0, 2170.0, 1161.0, 633.0, 366.0, 199.0, 124.0, 97.0, 55.0, 42.0, 25.0, 18.0, 15.0, 6.0, 8.0, 8.0, 1.0, 2.0, 2.0, 5.0], "bins": [-12.3203125, -12.02001953125, -11.7197265625, -11.41943359375, -11.119140625, -10.81884765625, -10.5185546875, -10.21826171875, -9.91796875, -9.61767578125, -9.3173828125, -9.01708984375, -8.716796875, -8.41650390625, -8.1162109375, -7.81591796875, -7.515625, -7.21533203125, -6.9150390625, -6.61474609375, -6.314453125, -6.01416015625, -5.7138671875, -5.41357421875, -5.11328125, -4.81298828125, -4.5126953125, -4.21240234375, -3.912109375, -3.61181640625, -3.3115234375, -3.01123046875, -2.7109375, -2.41064453125, -2.1103515625, -1.81005859375, -1.509765625, -1.20947265625, -0.9091796875, -0.60888671875, -0.30859375, -0.00830078125, 0.2919921875, 0.59228515625, 0.892578125, 1.19287109375, 1.4931640625, 1.79345703125, 2.09375, 2.39404296875, 2.6943359375, 2.99462890625, 3.294921875, 3.59521484375, 3.8955078125, 4.19580078125, 4.49609375, 4.79638671875, 5.0966796875, 5.39697265625, 5.697265625, 5.99755859375, 6.2978515625, 6.59814453125, 6.8984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 2.0, 6.0, 12.0, 15.0, 20.0, 26.0, 43.0, 49.0, 52.0, 64.0, 82.0, 85.0, 101.0, 73.0, 78.0, 66.0, 60.0, 39.0, 36.0, 24.0, 19.0, 16.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.626953125, -1.5865325927734375, -1.546112060546875, -1.5056915283203125, -1.46527099609375, -1.4248504638671875, -1.384429931640625, -1.3440093994140625, -1.3035888671875, -1.2631683349609375, -1.222747802734375, -1.1823272705078125, -1.14190673828125, -1.1014862060546875, -1.061065673828125, -1.0206451416015625, -0.980224609375, -0.9398040771484375, -0.899383544921875, -0.8589630126953125, -0.81854248046875, -0.7781219482421875, -0.737701416015625, -0.6972808837890625, -0.6568603515625, -0.6164398193359375, -0.576019287109375, -0.5355987548828125, -0.49517822265625, -0.4547576904296875, -0.414337158203125, -0.3739166259765625, -0.33349609375, -0.2930755615234375, -0.252655029296875, -0.2122344970703125, -0.17181396484375, -0.1313934326171875, -0.090972900390625, -0.0505523681640625, -0.0101318359375, 0.0302886962890625, 0.070709228515625, 0.1111297607421875, 0.15155029296875, 0.1919708251953125, 0.232391357421875, 0.2728118896484375, 0.313232421875, 0.3536529541015625, 0.394073486328125, 0.4344940185546875, 0.47491455078125, 0.5153350830078125, 0.555755615234375, 0.5961761474609375, 0.6365966796875, 0.6770172119140625, 0.717437744140625, 0.7578582763671875, 0.79827880859375, 0.8386993408203125, 0.879119873046875, 0.9195404052734375, 0.9599609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 5.0, 10.0, 12.0, 22.0, 34.0, 35.0, 55.0, 80.0, 121.0, 181.0, 266.0, 425.0, 620.0, 999.0, 1847.0, 3592.0, 7738.0, 21046.0, 80155.0, 1130053.0, 2803778.0, 101315.0, 24362.0, 8857.0, 3867.0, 1927.0, 1085.0, 641.0, 375.0, 249.0, 152.0, 113.0, 53.0, 52.0, 44.0, 30.0, 21.0, 15.0, 18.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.43792724609375, -6.2000732421875, -5.96221923828125, -5.724365234375, -5.48651123046875, -5.2486572265625, -5.01080322265625, -4.77294921875, -4.53509521484375, -4.2972412109375, -4.05938720703125, -3.821533203125, -3.58367919921875, -3.3458251953125, -3.10797119140625, -2.8701171875, -2.63226318359375, -2.3944091796875, -2.15655517578125, -1.918701171875, -1.68084716796875, -1.4429931640625, -1.20513916015625, -0.96728515625, -0.72943115234375, -0.4915771484375, -0.25372314453125, -0.015869140625, 0.22198486328125, 0.4598388671875, 0.69769287109375, 0.935546875, 1.17340087890625, 1.4112548828125, 1.64910888671875, 1.886962890625, 2.12481689453125, 2.3626708984375, 2.60052490234375, 2.83837890625, 3.07623291015625, 3.3140869140625, 3.55194091796875, 3.789794921875, 4.02764892578125, 4.2655029296875, 4.50335693359375, 4.7412109375, 4.97906494140625, 5.2169189453125, 5.45477294921875, 5.692626953125, 5.93048095703125, 6.1683349609375, 6.40618896484375, 6.64404296875, 6.88189697265625, 7.1197509765625, 7.35760498046875, 7.595458984375, 7.83331298828125, 8.0711669921875, 8.30902099609375, 8.546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 14.0, 23.0, 36.0, 41.0, 60.0, 98.0, 182.0, 507.0, 2031.0, 527.0, 217.0, 101.0, 74.0, 36.0, 29.0, 14.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.13653564453125, -2.0640869140625, -1.99163818359375, -1.919189453125, -1.84674072265625, -1.7742919921875, -1.70184326171875, -1.62939453125, -1.55694580078125, -1.4844970703125, -1.41204833984375, -1.339599609375, -1.26715087890625, -1.1947021484375, -1.12225341796875, -1.0498046875, -0.97735595703125, -0.9049072265625, -0.83245849609375, -0.760009765625, -0.68756103515625, -0.6151123046875, -0.54266357421875, -0.47021484375, -0.39776611328125, -0.3253173828125, -0.25286865234375, -0.180419921875, -0.10797119140625, -0.0355224609375, 0.03692626953125, 0.109375, 0.18182373046875, 0.2542724609375, 0.32672119140625, 0.399169921875, 0.47161865234375, 0.5440673828125, 0.61651611328125, 0.68896484375, 0.76141357421875, 0.8338623046875, 0.90631103515625, 0.978759765625, 1.05120849609375, 1.1236572265625, 1.19610595703125, 1.2685546875, 1.34100341796875, 1.4134521484375, 1.48590087890625, 1.558349609375, 1.63079833984375, 1.7032470703125, 1.77569580078125, 1.84814453125, 1.92059326171875, 1.9930419921875, 2.06549072265625, 2.137939453125, 2.21038818359375, 2.2828369140625, 2.35528564453125, 2.427734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 19.0, 28.0, 46.0, 67.0, 108.0, 145.0, 167.0, 130.0, 100.0, 67.0, 30.0, 23.0, 19.0, 16.0, 6.0, 7.0, 1.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.134748458862305, -7.713335990905762, -7.291923522949219, -6.870511054992676, -6.449098110198975, -6.027685642242432, -5.606273174285889, -5.1848602294921875, -4.7634477615356445, -4.342035293579102, -3.9206225872039795, -3.4992101192474365, -3.0777974128723145, -2.6563849449157715, -2.2349724769592285, -1.8135597705841064, -1.3921475410461426, -0.9707349538803101, -0.5493224263191223, -0.12790989875793457, 0.29350268840789795, 0.7149152755737305, 1.1363277435302734, 1.5577404499053955, 1.9791529178619385, 2.4005653858184814, 2.8219780921936035, 3.2433905601501465, 3.6648030281066895, 4.086215972900391, 4.507628440856934, 4.929040908813477, 5.3504533767700195, 5.7718658447265625, 6.1932783126831055, 6.614690780639648, 7.03610372543335, 7.457516193389893, 7.8789286613464355, 8.300341606140137, 8.72175407409668, 9.143166542053223, 9.564579010009766, 9.985991477966309, 10.407403945922852, 10.828817367553711, 11.250228881835938, 11.671642303466797, 12.093053817749023, 12.514466285705566, 12.93587875366211, 13.357291221618652, 13.778703689575195, 14.200117111206055, 14.621528625488281, 15.04294204711914, 15.464354515075684, 15.885766983032227, 16.307180404663086, 16.728591918945312, 17.150005340576172, 17.5714168548584, 17.992830276489258, 18.414241790771484, 18.835655212402344]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 13.0, 3.0, 13.0, 10.0, 14.0, 18.0, 17.0, 20.0, 25.0, 28.0, 21.0, 30.0, 34.0, 29.0, 48.0, 43.0, 36.0, 25.0, 42.0, 37.0, 42.0, 53.0, 37.0, 38.0, 36.0, 51.0, 26.0, 29.0, 29.0, 34.0, 20.0, 26.0, 15.0, 7.0, 11.0, 11.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.579960823059082, -6.375895023345947, -6.1718292236328125, -5.967763423919678, -5.763697624206543, -5.559631824493408, -5.355566024780273, -5.151500225067139, -4.947434425354004, -4.743368625640869, -4.539302825927734, -4.3352370262146, -4.131171226501465, -3.92710542678833, -3.7230396270751953, -3.5189738273620605, -3.314908027648926, -3.110842227935791, -2.9067764282226562, -2.7027106285095215, -2.4986448287963867, -2.294579029083252, -2.090513229370117, -1.8864474296569824, -1.6823816299438477, -1.478315830230713, -1.2742500305175781, -1.0701842308044434, -0.8661184310913086, -0.6620526313781738, -0.45798683166503906, -0.2539210319519043, -0.04985523223876953, 0.15421056747436523, 0.3582763671875, 0.5623421669006348, 0.7664079666137695, 0.9704737663269043, 1.174539566040039, 1.3786053657531738, 1.5826711654663086, 1.7867369651794434, 1.9908027648925781, 2.194868564605713, 2.3989343643188477, 2.6030001640319824, 2.807065963745117, 3.011131763458252, 3.2151975631713867, 3.4192633628845215, 3.6233291625976562, 3.827394962310791, 4.031460762023926, 4.2355265617370605, 4.439592361450195, 4.64365816116333, 4.847723960876465, 5.0517897605896, 5.255855560302734, 5.459921360015869, 5.663987159729004, 5.868052959442139, 6.072118759155273, 6.276184558868408, 6.480250358581543]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 15.0, 15.0, 29.0, 35.0, 57.0, 92.0, 145.0, 213.0, 393.0, 764.0, 1614.0, 3626.0, 9666.0, 33948.0, 169727.0, 590626.0, 183690.0, 36188.0, 10309.0, 3866.0, 1624.0, 815.0, 437.0, 222.0, 140.0, 92.0, 64.0, 32.0, 21.0, 27.0, 13.0, 9.0, 13.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.7818603515625, -7.509033203125, -7.2362060546875, -6.96337890625, -6.6905517578125, -6.417724609375, -6.1448974609375, -5.8720703125, -5.5992431640625, -5.326416015625, -5.0535888671875, -4.78076171875, -4.5079345703125, -4.235107421875, -3.9622802734375, -3.689453125, -3.4166259765625, -3.143798828125, -2.8709716796875, -2.59814453125, -2.3253173828125, -2.052490234375, -1.7796630859375, -1.5068359375, -1.2340087890625, -0.961181640625, -0.6883544921875, -0.41552734375, -0.1427001953125, 0.130126953125, 0.4029541015625, 0.67578125, 0.9486083984375, 1.221435546875, 1.4942626953125, 1.76708984375, 2.0399169921875, 2.312744140625, 2.5855712890625, 2.8583984375, 3.1312255859375, 3.404052734375, 3.6768798828125, 3.94970703125, 4.2225341796875, 4.495361328125, 4.7681884765625, 5.041015625, 5.3138427734375, 5.586669921875, 5.8594970703125, 6.13232421875, 6.4051513671875, 6.677978515625, 6.9508056640625, 7.2236328125, 7.4964599609375, 7.769287109375, 8.0421142578125, 8.31494140625, 8.5877685546875, 8.860595703125, 9.1334228515625, 9.40625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 9.0, 9.0, 17.0, 23.0, 27.0, 29.0, 33.0, 47.0, 56.0, 57.0, 63.0, 70.0, 76.0, 78.0, 57.0, 77.0, 58.0, 42.0, 35.0, 36.0, 20.0, 22.0, 12.0, 15.0, 7.0, 3.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.3837890625, -1.3478622436523438, -1.3119354248046875, -1.2760086059570312, -1.240081787109375, -1.2041549682617188, -1.1682281494140625, -1.1323013305664062, -1.09637451171875, -1.0604476928710938, -1.0245208740234375, -0.9885940551757812, -0.952667236328125, -0.9167404174804688, -0.8808135986328125, -0.8448867797851562, -0.8089599609375, -0.7730331420898438, -0.7371063232421875, -0.7011795043945312, -0.665252685546875, -0.6293258666992188, -0.5933990478515625, -0.5574722290039062, -0.52154541015625, -0.48561859130859375, -0.4496917724609375, -0.41376495361328125, -0.377838134765625, -0.34191131591796875, -0.3059844970703125, -0.27005767822265625, -0.234130859375, -0.19820404052734375, -0.1622772216796875, -0.12635040283203125, -0.090423583984375, -0.05449676513671875, -0.0185699462890625, 0.01735687255859375, 0.05328369140625, 0.08921051025390625, 0.1251373291015625, 0.16106414794921875, 0.196990966796875, 0.23291778564453125, 0.2688446044921875, 0.30477142333984375, 0.3406982421875, 0.37662506103515625, 0.4125518798828125, 0.44847869873046875, 0.484405517578125, 0.5203323364257812, 0.5562591552734375, 0.5921859741210938, 0.62811279296875, 0.6640396118164062, 0.6999664306640625, 0.7358932495117188, 0.771820068359375, 0.8077468872070312, 0.8436737060546875, 0.8796005249023438, 0.91552734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 14.0, 7.0, 14.0, 11.0, 37.0, 41.0, 51.0, 74.0, 99.0, 136.0, 195.0, 295.0, 468.0, 727.0, 1248.0, 2361.0, 5417.0, 14731.0, 47507.0, 171464.0, 460993.0, 241985.0, 67052.0, 20023.0, 6821.0, 2912.0, 1416.0, 825.0, 489.0, 317.0, 240.0, 159.0, 100.0, 70.0, 54.0, 38.0, 43.0, 30.0, 19.0, 14.0, 16.0, 5.0, 6.0, 3.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.90625, -5.73065185546875, -5.5550537109375, -5.37945556640625, -5.203857421875, -5.02825927734375, -4.8526611328125, -4.67706298828125, -4.50146484375, -4.32586669921875, -4.1502685546875, -3.97467041015625, -3.799072265625, -3.62347412109375, -3.4478759765625, -3.27227783203125, -3.0966796875, -2.92108154296875, -2.7454833984375, -2.56988525390625, -2.394287109375, -2.21868896484375, -2.0430908203125, -1.86749267578125, -1.69189453125, -1.51629638671875, -1.3406982421875, -1.16510009765625, -0.989501953125, -0.81390380859375, -0.6383056640625, -0.46270751953125, -0.287109375, -0.11151123046875, 0.0640869140625, 0.23968505859375, 0.415283203125, 0.59088134765625, 0.7664794921875, 0.94207763671875, 1.11767578125, 1.29327392578125, 1.4688720703125, 1.64447021484375, 1.820068359375, 1.99566650390625, 2.1712646484375, 2.34686279296875, 2.5224609375, 2.69805908203125, 2.8736572265625, 3.04925537109375, 3.224853515625, 3.40045166015625, 3.5760498046875, 3.75164794921875, 3.92724609375, 4.10284423828125, 4.2784423828125, 4.45404052734375, 4.629638671875, 4.80523681640625, 4.9808349609375, 5.15643310546875, 5.33203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 11.0, 17.0, 14.0, 12.0, 19.0, 22.0, 21.0, 21.0, 27.0, 34.0, 39.0, 34.0, 37.0, 45.0, 53.0, 48.0, 52.0, 47.0, 46.0, 33.0, 34.0, 32.0, 46.0, 35.0, 32.0, 32.0, 30.0, 13.0, 14.0, 14.0, 20.0, 10.0, 11.0, 14.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.861053466796875, -3.73968505859375, -3.618316650390625, -3.4969482421875, -3.375579833984375, -3.25421142578125, -3.132843017578125, -3.011474609375, -2.890106201171875, -2.76873779296875, -2.647369384765625, -2.5260009765625, -2.404632568359375, -2.28326416015625, -2.161895751953125, -2.04052734375, -1.919158935546875, -1.79779052734375, -1.676422119140625, -1.5550537109375, -1.433685302734375, -1.31231689453125, -1.190948486328125, -1.069580078125, -0.948211669921875, -0.82684326171875, -0.705474853515625, -0.5841064453125, -0.462738037109375, -0.34136962890625, -0.220001220703125, -0.0986328125, 0.022735595703125, 0.14410400390625, 0.265472412109375, 0.3868408203125, 0.508209228515625, 0.62957763671875, 0.750946044921875, 0.872314453125, 0.993682861328125, 1.11505126953125, 1.236419677734375, 1.3577880859375, 1.479156494140625, 1.60052490234375, 1.721893310546875, 1.84326171875, 1.964630126953125, 2.08599853515625, 2.207366943359375, 2.3287353515625, 2.450103759765625, 2.57147216796875, 2.692840576171875, 2.814208984375, 2.935577392578125, 3.05694580078125, 3.178314208984375, 3.2996826171875, 3.421051025390625, 3.54241943359375, 3.663787841796875, 3.78515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 15.0, 8.0, 7.0, 12.0, 34.0, 38.0, 72.0, 118.0, 170.0, 324.0, 662.0, 1416.0, 3375.0, 9966.0, 40264.0, 286793.0, 586501.0, 91581.0, 17718.0, 5400.0, 2039.0, 895.0, 480.0, 280.0, 129.0, 100.0, 50.0, 30.0, 25.0, 13.0, 7.0, 3.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.3685302734375, -4.237060546875, -4.1055908203125, -3.97412109375, -3.8426513671875, -3.711181640625, -3.5797119140625, -3.4482421875, -3.3167724609375, -3.185302734375, -3.0538330078125, -2.92236328125, -2.7908935546875, -2.659423828125, -2.5279541015625, -2.396484375, -2.2650146484375, -2.133544921875, -2.0020751953125, -1.87060546875, -1.7391357421875, -1.607666015625, -1.4761962890625, -1.3447265625, -1.2132568359375, -1.081787109375, -0.9503173828125, -0.81884765625, -0.6873779296875, -0.555908203125, -0.4244384765625, -0.29296875, -0.1614990234375, -0.030029296875, 0.1014404296875, 0.23291015625, 0.3643798828125, 0.495849609375, 0.6273193359375, 0.7587890625, 0.8902587890625, 1.021728515625, 1.1531982421875, 1.28466796875, 1.4161376953125, 1.547607421875, 1.6790771484375, 1.810546875, 1.9420166015625, 2.073486328125, 2.2049560546875, 2.33642578125, 2.4678955078125, 2.599365234375, 2.7308349609375, 2.8623046875, 2.9937744140625, 3.125244140625, 3.2567138671875, 3.38818359375, 3.5196533203125, 3.651123046875, 3.7825927734375, 3.9140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 10.0, 8.0, 7.0, 12.0, 13.0, 19.0, 23.0, 24.0, 29.0, 46.0, 63.0, 83.0, 96.0, 113.0, 85.0, 75.0, 61.0, 46.0, 30.0, 25.0, 30.0, 17.0, 13.0, 13.0, 13.0, 7.0, 14.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0005893707275390625, -0.000573623925447464, -0.0005578771233558655, -0.000542130321264267, -0.0005263835191726685, -0.00051063671708107, -0.0004948899149894714, -0.0004791431128978729, -0.0004633963108062744, -0.0004476495087146759, -0.0004319027066230774, -0.0004161559045314789, -0.00040040910243988037, -0.00038466230034828186, -0.00036891549825668335, -0.00035316869616508484, -0.00033742189407348633, -0.0003216750919818878, -0.0003059282898902893, -0.0002901814877986908, -0.0002744346857070923, -0.0002586878836154938, -0.00024294108152389526, -0.00022719427943229675, -0.00021144747734069824, -0.00019570067524909973, -0.00017995387315750122, -0.0001642070710659027, -0.0001484602689743042, -0.0001327134668827057, -0.00011696666479110718, -0.00010121986269950867, -8.547306060791016e-05, -6.972625851631165e-05, -5.3979456424713135e-05, -3.8232654333114624e-05, -2.2485852241516113e-05, -6.7390501499176025e-06, 9.007751941680908e-06, 2.475455403327942e-05, 4.050135612487793e-05, 5.624815821647644e-05, 7.199496030807495e-05, 8.774176239967346e-05, 0.00010348856449127197, 0.00011923536658287048, 0.000134982168674469, 0.0001507289707660675, 0.00016647577285766602, 0.00018222257494926453, 0.00019796937704086304, 0.00021371617913246155, 0.00022946298122406006, 0.00024520978331565857, 0.0002609565854072571, 0.0002767033874988556, 0.0002924501895904541, 0.0003081969916820526, 0.0003239437937736511, 0.00033969059586524963, 0.00035543739795684814, 0.00037118420004844666, 0.00038693100214004517, 0.0004026778042316437, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 14.0, 13.0, 14.0, 18.0, 36.0, 39.0, 56.0, 81.0, 112.0, 222.0, 304.0, 567.0, 981.0, 2066.0, 4879.0, 13773.0, 58647.0, 471523.0, 421228.0, 52128.0, 12876.0, 4600.0, 1923.0, 995.0, 526.0, 310.0, 190.0, 117.0, 83.0, 60.0, 36.0, 33.0, 9.0, 15.0, 14.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.9453125, -3.81365966796875, -3.6820068359375, -3.55035400390625, -3.418701171875, -3.28704833984375, -3.1553955078125, -3.02374267578125, -2.89208984375, -2.76043701171875, -2.6287841796875, -2.49713134765625, -2.365478515625, -2.23382568359375, -2.1021728515625, -1.97052001953125, -1.8388671875, -1.70721435546875, -1.5755615234375, -1.44390869140625, -1.312255859375, -1.18060302734375, -1.0489501953125, -0.91729736328125, -0.78564453125, -0.65399169921875, -0.5223388671875, -0.39068603515625, -0.259033203125, -0.12738037109375, 0.0042724609375, 0.13592529296875, 0.267578125, 0.39923095703125, 0.5308837890625, 0.66253662109375, 0.794189453125, 0.92584228515625, 1.0574951171875, 1.18914794921875, 1.32080078125, 1.45245361328125, 1.5841064453125, 1.71575927734375, 1.847412109375, 1.97906494140625, 2.1107177734375, 2.24237060546875, 2.3740234375, 2.50567626953125, 2.6373291015625, 2.76898193359375, 2.900634765625, 3.03228759765625, 3.1639404296875, 3.29559326171875, 3.42724609375, 3.55889892578125, 3.6905517578125, 3.82220458984375, 3.953857421875, 4.08551025390625, 4.2171630859375, 4.34881591796875, 4.48046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 10.0, 14.0, 24.0, 33.0, 40.0, 61.0, 80.0, 113.0, 116.0, 110.0, 92.0, 70.0, 68.0, 37.0, 30.0, 24.0, 18.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.74395751953125, -2.6578369140625, -2.57171630859375, -2.485595703125, -2.39947509765625, -2.3133544921875, -2.22723388671875, -2.14111328125, -2.05499267578125, -1.9688720703125, -1.88275146484375, -1.796630859375, -1.71051025390625, -1.6243896484375, -1.53826904296875, -1.4521484375, -1.36602783203125, -1.2799072265625, -1.19378662109375, -1.107666015625, -1.02154541015625, -0.9354248046875, -0.84930419921875, -0.76318359375, -0.67706298828125, -0.5909423828125, -0.50482177734375, -0.418701171875, -0.33258056640625, -0.2464599609375, -0.16033935546875, -0.07421875, 0.01190185546875, 0.0980224609375, 0.18414306640625, 0.270263671875, 0.35638427734375, 0.4425048828125, 0.52862548828125, 0.61474609375, 0.70086669921875, 0.7869873046875, 0.87310791015625, 0.959228515625, 1.04534912109375, 1.1314697265625, 1.21759033203125, 1.3037109375, 1.38983154296875, 1.4759521484375, 1.56207275390625, 1.648193359375, 1.73431396484375, 1.8204345703125, 1.90655517578125, 1.99267578125, 2.07879638671875, 2.1649169921875, 2.25103759765625, 2.337158203125, 2.42327880859375, 2.5093994140625, 2.59552001953125, 2.681640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 12.0, 18.0, 44.0, 99.0, 150.0, 189.0, 181.0, 141.0, 76.0, 40.0, 25.0, 7.0, 10.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.99439239501953, -65.26271057128906, -63.53103256225586, -61.79935073852539, -60.06767272949219, -58.33599090576172, -56.604312896728516, -54.87263107299805, -53.140953063964844, -51.409271240234375, -49.67759323120117, -47.9459114074707, -46.2142333984375, -44.48255157470703, -42.75087356567383, -41.01919174194336, -39.287513732910156, -37.55583190917969, -35.824153900146484, -34.092472076416016, -32.36079406738281, -30.629112243652344, -28.89743423461914, -27.165752410888672, -25.434070587158203, -23.702390670776367, -21.97071075439453, -20.239030838012695, -18.50735092163086, -16.77566909790039, -15.043990135192871, -13.312310218811035, -11.580631256103516, -9.84895133972168, -8.117271423339844, -6.38559103012085, -4.653911113739014, -2.9222307205200195, -1.1905508041381836, 0.5411291122436523, 2.2728090286254883, 4.004488945007324, 5.73616886138916, 7.467849254608154, 9.199529647827148, 10.931209564208984, 12.66288948059082, 14.394569396972656, 16.126249313354492, 17.857929229736328, 19.589609146118164, 21.3212890625, 23.052968978881836, 24.784648895263672, 26.51633071899414, 28.248008728027344, 29.979690551757812, 31.71137046813965, 33.443050384521484, 35.17473220825195, 36.906410217285156, 38.638092041015625, 40.36977005004883, 42.1014518737793, 43.8331298828125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 12.0, 8.0, 10.0, 21.0, 22.0, 22.0, 22.0, 29.0, 22.0, 33.0, 34.0, 35.0, 37.0, 39.0, 44.0, 40.0, 43.0, 43.0, 49.0, 42.0, 37.0, 35.0, 30.0, 29.0, 35.0, 22.0, 29.0, 19.0, 20.0, 20.0, 17.0, 18.0, 15.0, 9.0, 8.0, 9.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.12846565246582, -20.500459671020508, -19.872453689575195, -19.244447708129883, -18.61644172668457, -17.988435745239258, -17.360429763793945, -16.732423782348633, -16.10441780090332, -15.476411819458008, -14.848405838012695, -14.220399856567383, -13.59239387512207, -12.964387893676758, -12.336381912231445, -11.708375930786133, -11.08036994934082, -10.452363967895508, -9.824357986450195, -9.196352005004883, -8.56834602355957, -7.940340042114258, -7.312334060668945, -6.684328079223633, -6.05632209777832, -5.428316116333008, -4.800310134887695, -4.172304153442383, -3.5442981719970703, -2.916292190551758, -2.2882862091064453, -1.6602802276611328, -1.0322761535644531, -0.4042701721191406, 0.22373580932617188, 0.8517417907714844, 1.4797477722167969, 2.1077537536621094, 2.735759735107422, 3.3637657165527344, 3.991771697998047, 4.619777679443359, 5.247783660888672, 5.875789642333984, 6.503795623779297, 7.131801605224609, 7.759807586669922, 8.387813568115234, 9.015819549560547, 9.64382553100586, 10.271831512451172, 10.899837493896484, 11.527843475341797, 12.15584945678711, 12.783855438232422, 13.411861419677734, 14.039867401123047, 14.66787338256836, 15.295879364013672, 15.923885345458984, 16.551891326904297, 17.17989730834961, 17.807903289794922, 18.435909271240234, 19.063915252685547]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 7.0, 13.0, 27.0, 23.0, 44.0, 49.0, 74.0, 110.0, 150.0, 222.0, 336.0, 566.0, 865.0, 1749.0, 3516.0, 8555.0, 26484.0, 145490.0, 3705347.0, 246953.0, 35362.0, 10281.0, 3971.0, 1854.0, 884.0, 508.0, 289.0, 188.0, 94.0, 81.0, 46.0, 33.0, 26.0, 13.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0], "bins": [-10.59375, -10.31195068359375, -10.0301513671875, -9.74835205078125, -9.466552734375, -9.18475341796875, -8.9029541015625, -8.62115478515625, -8.33935546875, -8.05755615234375, -7.7757568359375, -7.49395751953125, -7.212158203125, -6.93035888671875, -6.6485595703125, -6.36676025390625, -6.0849609375, -5.80316162109375, -5.5213623046875, -5.23956298828125, -4.957763671875, -4.67596435546875, -4.3941650390625, -4.11236572265625, -3.83056640625, -3.54876708984375, -3.2669677734375, -2.98516845703125, -2.703369140625, -2.42156982421875, -2.1397705078125, -1.85797119140625, -1.576171875, -1.29437255859375, -1.0125732421875, -0.73077392578125, -0.448974609375, -0.16717529296875, 0.1146240234375, 0.39642333984375, 0.67822265625, 0.96002197265625, 1.2418212890625, 1.52362060546875, 1.805419921875, 2.08721923828125, 2.3690185546875, 2.65081787109375, 2.9326171875, 3.21441650390625, 3.4962158203125, 3.77801513671875, 4.059814453125, 4.34161376953125, 4.6234130859375, 4.90521240234375, 5.18701171875, 5.46881103515625, 5.7506103515625, 6.03240966796875, 6.314208984375, 6.59600830078125, 6.8778076171875, 7.15960693359375, 7.44140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 14.0, 13.0, 20.0, 23.0, 31.0, 43.0, 44.0, 46.0, 66.0, 68.0, 68.0, 76.0, 80.0, 53.0, 46.0, 66.0, 35.0, 39.0, 33.0, 28.0, 23.0, 12.0, 14.0, 12.0, 9.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.3359375, -1.3011856079101562, -1.2664337158203125, -1.2316818237304688, -1.196929931640625, -1.1621780395507812, -1.1274261474609375, -1.0926742553710938, -1.05792236328125, -1.0231704711914062, -0.9884185791015625, -0.9536666870117188, -0.918914794921875, -0.8841629028320312, -0.8494110107421875, -0.8146591186523438, -0.7799072265625, -0.7451553344726562, -0.7104034423828125, -0.6756515502929688, -0.640899658203125, -0.6061477661132812, -0.5713958740234375, -0.5366439819335938, -0.50189208984375, -0.46714019775390625, -0.4323883056640625, -0.39763641357421875, -0.362884521484375, -0.32813262939453125, -0.2933807373046875, -0.25862884521484375, -0.223876953125, -0.18912506103515625, -0.1543731689453125, -0.11962127685546875, -0.084869384765625, -0.05011749267578125, -0.0153656005859375, 0.01938629150390625, 0.05413818359375, 0.08889007568359375, 0.1236419677734375, 0.15839385986328125, 0.193145751953125, 0.22789764404296875, 0.2626495361328125, 0.29740142822265625, 0.3321533203125, 0.36690521240234375, 0.4016571044921875, 0.43640899658203125, 0.471160888671875, 0.5059127807617188, 0.5406646728515625, 0.5754165649414062, 0.61016845703125, 0.6449203491210938, 0.6796722412109375, 0.7144241333007812, 0.749176025390625, 0.7839279174804688, 0.8186798095703125, 0.8534317016601562, 0.88818359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 0.0, 4.0, 4.0, 12.0, 18.0, 13.0, 20.0, 39.0, 44.0, 51.0, 109.0, 150.0, 232.0, 375.0, 555.0, 895.0, 1541.0, 2599.0, 5088.0, 10184.0, 21811.0, 53100.0, 167988.0, 1289679.0, 2306093.0, 218484.0, 63773.0, 25783.0, 11785.0, 5941.0, 3176.0, 1820.0, 1071.0, 602.0, 413.0, 253.0, 184.0, 118.0, 66.0, 62.0, 36.0, 28.0, 28.0, 16.0, 15.0, 5.0, 5.0, 10.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.95013427734375, -3.8143310546875, -3.67852783203125, -3.542724609375, -3.40692138671875, -3.2711181640625, -3.13531494140625, -2.99951171875, -2.86370849609375, -2.7279052734375, -2.59210205078125, -2.456298828125, -2.32049560546875, -2.1846923828125, -2.04888916015625, -1.9130859375, -1.77728271484375, -1.6414794921875, -1.50567626953125, -1.369873046875, -1.23406982421875, -1.0982666015625, -0.96246337890625, -0.82666015625, -0.69085693359375, -0.5550537109375, -0.41925048828125, -0.283447265625, -0.14764404296875, -0.0118408203125, 0.12396240234375, 0.259765625, 0.39556884765625, 0.5313720703125, 0.66717529296875, 0.802978515625, 0.93878173828125, 1.0745849609375, 1.21038818359375, 1.34619140625, 1.48199462890625, 1.6177978515625, 1.75360107421875, 1.889404296875, 2.02520751953125, 2.1610107421875, 2.29681396484375, 2.4326171875, 2.56842041015625, 2.7042236328125, 2.84002685546875, 2.975830078125, 3.11163330078125, 3.2474365234375, 3.38323974609375, 3.51904296875, 3.65484619140625, 3.7906494140625, 3.92645263671875, 4.062255859375, 4.19805908203125, 4.3338623046875, 4.46966552734375, 4.60546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 7.0, 12.0, 21.0, 25.0, 23.0, 43.0, 57.0, 100.0, 133.0, 249.0, 467.0, 1207.0, 779.0, 342.0, 186.0, 102.0, 71.0, 52.0, 37.0, 44.0, 26.0, 12.0, 9.0, 15.0, 9.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.470703125, -2.39752197265625, -2.3243408203125, -2.25115966796875, -2.177978515625, -2.10479736328125, -2.0316162109375, -1.95843505859375, -1.88525390625, -1.81207275390625, -1.7388916015625, -1.66571044921875, -1.592529296875, -1.51934814453125, -1.4461669921875, -1.37298583984375, -1.2998046875, -1.22662353515625, -1.1534423828125, -1.08026123046875, -1.007080078125, -0.93389892578125, -0.8607177734375, -0.78753662109375, -0.71435546875, -0.64117431640625, -0.5679931640625, -0.49481201171875, -0.421630859375, -0.34844970703125, -0.2752685546875, -0.20208740234375, -0.12890625, -0.05572509765625, 0.0174560546875, 0.09063720703125, 0.163818359375, 0.23699951171875, 0.3101806640625, 0.38336181640625, 0.45654296875, 0.52972412109375, 0.6029052734375, 0.67608642578125, 0.749267578125, 0.82244873046875, 0.8956298828125, 0.96881103515625, 1.0419921875, 1.11517333984375, 1.1883544921875, 1.26153564453125, 1.334716796875, 1.40789794921875, 1.4810791015625, 1.55426025390625, 1.62744140625, 1.70062255859375, 1.7738037109375, 1.84698486328125, 1.920166015625, 1.99334716796875, 2.0665283203125, 2.13970947265625, 2.212890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 12.0, 29.0, 56.0, 86.0, 99.0, 155.0, 143.0, 126.0, 112.0, 54.0, 43.0, 26.0, 13.0, 10.0, 8.0, 3.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.913623809814453, -19.291202545166016, -18.668781280517578, -18.04636001586914, -17.423938751220703, -16.801517486572266, -16.179096221923828, -15.556674003601074, -14.934252738952637, -14.3118314743042, -13.689410209655762, -13.066988945007324, -12.44456672668457, -11.822145462036133, -11.199724197387695, -10.577302932739258, -9.95488166809082, -9.332460403442383, -8.710039138793945, -8.087617874145508, -7.465196132659912, -6.842774868011475, -6.220353126525879, -5.597931861877441, -4.975510597229004, -4.353089332580566, -3.73066782951355, -3.108246326446533, -2.4858250617980957, -1.8634037971496582, -1.2409822940826416, -0.618560791015625, 0.0038604736328125, 0.6262818574905396, 1.2487032413482666, 1.8711246252059937, 2.4935460090637207, 3.115967273712158, 3.738388776779175, 4.360810279846191, 4.983231544494629, 5.605652809143066, 6.228074073791504, 6.8504958152771, 7.472917079925537, 8.095338821411133, 8.71776008605957, 9.340181350708008, 9.962602615356445, 10.585023880004883, 11.20744514465332, 11.829866409301758, 12.452287673950195, 13.074708938598633, 13.697131156921387, 14.319552421569824, 14.941973686218262, 15.5643949508667, 16.186817169189453, 16.80923843383789, 17.431659698486328, 18.054080963134766, 18.676502227783203, 19.29892349243164, 19.921344757080078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 1.0, 9.0, 5.0, 4.0, 8.0, 9.0, 9.0, 11.0, 12.0, 13.0, 17.0, 23.0, 21.0, 27.0, 29.0, 32.0, 36.0, 34.0, 34.0, 24.0, 42.0, 40.0, 35.0, 38.0, 36.0, 36.0, 38.0, 34.0, 43.0, 39.0, 29.0, 31.0, 30.0, 24.0, 22.0, 26.0, 14.0, 16.0, 17.0, 10.0, 8.0, 4.0, 9.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0], "bins": [-9.701818466186523, -9.444954872131348, -9.188092231750488, -8.931228637695312, -8.674365997314453, -8.417502403259277, -8.160638809204102, -7.903775691986084, -7.646912574768066, -7.390049457550049, -7.133186340332031, -6.8763227462768555, -6.619459629058838, -6.36259651184082, -6.1057329177856445, -5.848869800567627, -5.592006683349609, -5.335143566131592, -5.078280448913574, -4.821416854858398, -4.564553737640381, -4.307690620422363, -4.0508270263671875, -3.79396390914917, -3.5371007919311523, -3.2802376747131348, -3.023374319076538, -2.7665109634399414, -2.509647846221924, -2.2527847290039062, -1.9959213733673096, -1.7390581369400024, -1.4821958541870117, -1.2253326177597046, -0.9684693813323975, -0.7116061449050903, -0.4547429084777832, -0.19787967205047607, 0.058983564376831055, 0.3158468008041382, 0.5727100372314453, 0.8295732736587524, 1.0864365100860596, 1.3432997465133667, 1.6001629829406738, 1.857026219367981, 2.113889455795288, 2.3707528114318848, 2.6276159286499023, 2.88447904586792, 3.1413424015045166, 3.3982057571411133, 3.655068874359131, 3.9119319915771484, 4.168795585632324, 4.425658702850342, 4.682521820068359, 4.939384937286377, 5.1962480545043945, 5.45311164855957, 5.709974765777588, 5.9668378829956055, 6.223701477050781, 6.480564594268799, 6.737427711486816]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 8.0, 7.0, 16.0, 22.0, 18.0, 33.0, 39.0, 89.0, 132.0, 232.0, 411.0, 739.0, 1490.0, 3488.0, 10041.0, 34972.0, 192415.0, 640303.0, 125001.0, 25992.0, 7604.0, 2841.0, 1191.0, 602.0, 358.0, 171.0, 116.0, 80.0, 49.0, 31.0, 15.0, 13.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.484375, -9.16162109375, -8.8388671875, -8.51611328125, -8.193359375, -7.87060546875, -7.5478515625, -7.22509765625, -6.90234375, -6.57958984375, -6.2568359375, -5.93408203125, -5.611328125, -5.28857421875, -4.9658203125, -4.64306640625, -4.3203125, -3.99755859375, -3.6748046875, -3.35205078125, -3.029296875, -2.70654296875, -2.3837890625, -2.06103515625, -1.73828125, -1.41552734375, -1.0927734375, -0.77001953125, -0.447265625, -0.12451171875, 0.1982421875, 0.52099609375, 0.84375, 1.16650390625, 1.4892578125, 1.81201171875, 2.134765625, 2.45751953125, 2.7802734375, 3.10302734375, 3.42578125, 3.74853515625, 4.0712890625, 4.39404296875, 4.716796875, 5.03955078125, 5.3623046875, 5.68505859375, 6.0078125, 6.33056640625, 6.6533203125, 6.97607421875, 7.298828125, 7.62158203125, 7.9443359375, 8.26708984375, 8.58984375, 8.91259765625, 9.2353515625, 9.55810546875, 9.880859375, 10.20361328125, 10.5263671875, 10.84912109375, 11.171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 10.0, 6.0, 14.0, 18.0, 21.0, 23.0, 27.0, 52.0, 39.0, 55.0, 63.0, 63.0, 63.0, 69.0, 56.0, 75.0, 66.0, 48.0, 53.0, 35.0, 31.0, 21.0, 22.0, 15.0, 21.0, 6.0, 7.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3174667358398438, -1.2823944091796875, -1.2473220825195312, -1.212249755859375, -1.1771774291992188, -1.1421051025390625, -1.1070327758789062, -1.07196044921875, -1.0368881225585938, -1.0018157958984375, -0.9667434692382812, -0.931671142578125, -0.8965988159179688, -0.8615264892578125, -0.8264541625976562, -0.7913818359375, -0.7563095092773438, -0.7212371826171875, -0.6861648559570312, -0.651092529296875, -0.6160202026367188, -0.5809478759765625, -0.5458755493164062, -0.51080322265625, -0.47573089599609375, -0.4406585693359375, -0.40558624267578125, -0.370513916015625, -0.33544158935546875, -0.3003692626953125, -0.26529693603515625, -0.230224609375, -0.19515228271484375, -0.1600799560546875, -0.12500762939453125, -0.089935302734375, -0.05486297607421875, -0.0197906494140625, 0.01528167724609375, 0.05035400390625, 0.08542633056640625, 0.1204986572265625, 0.15557098388671875, 0.190643310546875, 0.22571563720703125, 0.2607879638671875, 0.29586029052734375, 0.3309326171875, 0.36600494384765625, 0.4010772705078125, 0.43614959716796875, 0.471221923828125, 0.5062942504882812, 0.5413665771484375, 0.5764389038085938, 0.61151123046875, 0.6465835571289062, 0.6816558837890625, 0.7167282104492188, 0.751800537109375, 0.7868728637695312, 0.8219451904296875, 0.8570175170898438, 0.89208984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 9.0, 5.0, 7.0, 11.0, 24.0, 22.0, 30.0, 31.0, 33.0, 55.0, 89.0, 108.0, 173.0, 242.0, 375.0, 557.0, 960.0, 1657.0, 2940.0, 5916.0, 13559.0, 35435.0, 107598.0, 357515.0, 353294.0, 105449.0, 35685.0, 13467.0, 5858.0, 3041.0, 1615.0, 946.0, 591.0, 376.0, 273.0, 195.0, 116.0, 79.0, 64.0, 47.0, 37.0, 22.0, 19.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.4609375, -5.30029296875, -5.1396484375, -4.97900390625, -4.818359375, -4.65771484375, -4.4970703125, -4.33642578125, -4.17578125, -4.01513671875, -3.8544921875, -3.69384765625, -3.533203125, -3.37255859375, -3.2119140625, -3.05126953125, -2.890625, -2.72998046875, -2.5693359375, -2.40869140625, -2.248046875, -2.08740234375, -1.9267578125, -1.76611328125, -1.60546875, -1.44482421875, -1.2841796875, -1.12353515625, -0.962890625, -0.80224609375, -0.6416015625, -0.48095703125, -0.3203125, -0.15966796875, 0.0009765625, 0.16162109375, 0.322265625, 0.48291015625, 0.6435546875, 0.80419921875, 0.96484375, 1.12548828125, 1.2861328125, 1.44677734375, 1.607421875, 1.76806640625, 1.9287109375, 2.08935546875, 2.25, 2.41064453125, 2.5712890625, 2.73193359375, 2.892578125, 3.05322265625, 3.2138671875, 3.37451171875, 3.53515625, 3.69580078125, 3.8564453125, 4.01708984375, 4.177734375, 4.33837890625, 4.4990234375, 4.65966796875, 4.8203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 7.0, 6.0, 11.0, 11.0, 15.0, 23.0, 32.0, 36.0, 26.0, 27.0, 44.0, 41.0, 42.0, 37.0, 46.0, 47.0, 45.0, 41.0, 49.0, 48.0, 44.0, 35.0, 35.0, 41.0, 29.0, 31.0, 19.0, 30.0, 18.0, 12.0, 14.0, 12.0, 2.0, 10.0, 2.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.532470703125, -4.39306640625, -4.253662109375, -4.1142578125, -3.974853515625, -3.83544921875, -3.696044921875, -3.556640625, -3.417236328125, -3.27783203125, -3.138427734375, -2.9990234375, -2.859619140625, -2.72021484375, -2.580810546875, -2.44140625, -2.302001953125, -2.16259765625, -2.023193359375, -1.8837890625, -1.744384765625, -1.60498046875, -1.465576171875, -1.326171875, -1.186767578125, -1.04736328125, -0.907958984375, -0.7685546875, -0.629150390625, -0.48974609375, -0.350341796875, -0.2109375, -0.071533203125, 0.06787109375, 0.207275390625, 0.3466796875, 0.486083984375, 0.62548828125, 0.764892578125, 0.904296875, 1.043701171875, 1.18310546875, 1.322509765625, 1.4619140625, 1.601318359375, 1.74072265625, 1.880126953125, 2.01953125, 2.158935546875, 2.29833984375, 2.437744140625, 2.5771484375, 2.716552734375, 2.85595703125, 2.995361328125, 3.134765625, 3.274169921875, 3.41357421875, 3.552978515625, 3.6923828125, 3.831787109375, 3.97119140625, 4.110595703125, 4.25]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 15.0, 7.0, 14.0, 21.0, 38.0, 59.0, 155.0, 269.0, 844.0, 3180.0, 21316.0, 389610.0, 596297.0, 30907.0, 4139.0, 1018.0, 355.0, 128.0, 66.0, 32.0, 33.0, 18.0, 12.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.212646484375, -7.96435546875, -7.716064453125, -7.4677734375, -7.219482421875, -6.97119140625, -6.722900390625, -6.474609375, -6.226318359375, -5.97802734375, -5.729736328125, -5.4814453125, -5.233154296875, -4.98486328125, -4.736572265625, -4.48828125, -4.239990234375, -3.99169921875, -3.743408203125, -3.4951171875, -3.246826171875, -2.99853515625, -2.750244140625, -2.501953125, -2.253662109375, -2.00537109375, -1.757080078125, -1.5087890625, -1.260498046875, -1.01220703125, -0.763916015625, -0.515625, -0.267333984375, -0.01904296875, 0.229248046875, 0.4775390625, 0.725830078125, 0.97412109375, 1.222412109375, 1.470703125, 1.718994140625, 1.96728515625, 2.215576171875, 2.4638671875, 2.712158203125, 2.96044921875, 3.208740234375, 3.45703125, 3.705322265625, 3.95361328125, 4.201904296875, 4.4501953125, 4.698486328125, 4.94677734375, 5.195068359375, 5.443359375, 5.691650390625, 5.93994140625, 6.188232421875, 6.4365234375, 6.684814453125, 6.93310546875, 7.181396484375, 7.4296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 12.0, 9.0, 11.0, 16.0, 15.0, 34.0, 35.0, 57.0, 73.0, 112.0, 127.0, 128.0, 79.0, 58.0, 52.0, 32.0, 29.0, 17.0, 15.0, 19.0, 9.0, 8.0, 8.0, 6.0, 8.0, 1.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007309913635253906, -0.0007122457027435303, -0.0006935000419616699, -0.0006747543811798096, -0.0006560087203979492, -0.0006372630596160889, -0.0006185173988342285, -0.0005997717380523682, -0.0005810260772705078, -0.0005622804164886475, -0.0005435347557067871, -0.0005247890949249268, -0.0005060434341430664, -0.00048729777336120605, -0.0004685521125793457, -0.00044980645179748535, -0.000431060791015625, -0.00041231513023376465, -0.0003935694694519043, -0.00037482380867004395, -0.0003560781478881836, -0.00033733248710632324, -0.0003185868263244629, -0.00029984116554260254, -0.0002810955047607422, -0.00026234984397888184, -0.00024360418319702148, -0.00022485852241516113, -0.00020611286163330078, -0.00018736720085144043, -0.00016862154006958008, -0.00014987587928771973, -0.00013113021850585938, -0.00011238455772399902, -9.363889694213867e-05, -7.489323616027832e-05, -5.614757537841797e-05, -3.740191459655762e-05, -1.8656253814697266e-05, 8.940696716308594e-08, 1.8835067749023438e-05, 3.758072853088379e-05, 5.632638931274414e-05, 7.507205009460449e-05, 9.381771087646484e-05, 0.0001125633716583252, 0.00013130903244018555, 0.0001500546932220459, 0.00016880035400390625, 0.0001875460147857666, 0.00020629167556762695, 0.0002250373363494873, 0.00024378299713134766, 0.000262528657913208, 0.00028127431869506836, 0.0003000199794769287, 0.00031876564025878906, 0.0003375113010406494, 0.00035625696182250977, 0.0003750026226043701, 0.00039374828338623047, 0.0004124939441680908, 0.00043123960494995117, 0.0004499852657318115, 0.0004687309265136719]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 11.0, 7.0, 11.0, 15.0, 35.0, 40.0, 85.0, 128.0, 250.0, 474.0, 970.0, 2459.0, 6960.0, 29828.0, 234692.0, 655304.0, 94610.0, 15145.0, 4333.0, 1616.0, 723.0, 333.0, 202.0, 107.0, 65.0, 47.0, 36.0, 14.0, 14.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.4935302734375, -4.334716796875, -4.1759033203125, -4.01708984375, -3.8582763671875, -3.699462890625, -3.5406494140625, -3.3818359375, -3.2230224609375, -3.064208984375, -2.9053955078125, -2.74658203125, -2.5877685546875, -2.428955078125, -2.2701416015625, -2.111328125, -1.9525146484375, -1.793701171875, -1.6348876953125, -1.47607421875, -1.3172607421875, -1.158447265625, -0.9996337890625, -0.8408203125, -0.6820068359375, -0.523193359375, -0.3643798828125, -0.20556640625, -0.0467529296875, 0.112060546875, 0.2708740234375, 0.4296875, 0.5885009765625, 0.747314453125, 0.9061279296875, 1.06494140625, 1.2237548828125, 1.382568359375, 1.5413818359375, 1.7001953125, 1.8590087890625, 2.017822265625, 2.1766357421875, 2.33544921875, 2.4942626953125, 2.653076171875, 2.8118896484375, 2.970703125, 3.1295166015625, 3.288330078125, 3.4471435546875, 3.60595703125, 3.7647705078125, 3.923583984375, 4.0823974609375, 4.2412109375, 4.4000244140625, 4.558837890625, 4.7176513671875, 4.87646484375, 5.0352783203125, 5.194091796875, 5.3529052734375, 5.51171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 9.0, 7.0, 10.0, 8.0, 15.0, 19.0, 28.0, 23.0, 30.0, 46.0, 67.0, 72.0, 79.0, 86.0, 80.0, 87.0, 75.0, 53.0, 28.0, 21.0, 31.0, 23.0, 18.0, 15.0, 11.0, 12.0, 6.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.16015625, -2.089691162109375, -2.01922607421875, -1.948760986328125, -1.8782958984375, -1.807830810546875, -1.73736572265625, -1.666900634765625, -1.596435546875, -1.525970458984375, -1.45550537109375, -1.385040283203125, -1.3145751953125, -1.244110107421875, -1.17364501953125, -1.103179931640625, -1.03271484375, -0.962249755859375, -0.89178466796875, -0.821319580078125, -0.7508544921875, -0.680389404296875, -0.60992431640625, -0.539459228515625, -0.468994140625, -0.398529052734375, -0.32806396484375, -0.257598876953125, -0.1871337890625, -0.116668701171875, -0.04620361328125, 0.024261474609375, 0.0947265625, 0.165191650390625, 0.23565673828125, 0.306121826171875, 0.3765869140625, 0.447052001953125, 0.51751708984375, 0.587982177734375, 0.658447265625, 0.728912353515625, 0.79937744140625, 0.869842529296875, 0.9403076171875, 1.010772705078125, 1.08123779296875, 1.151702880859375, 1.22216796875, 1.292633056640625, 1.36309814453125, 1.433563232421875, 1.5040283203125, 1.574493408203125, 1.64495849609375, 1.715423583984375, 1.785888671875, 1.856353759765625, 1.92681884765625, 1.997283935546875, 2.0677490234375, 2.138214111328125, 2.20867919921875, 2.279144287109375, 2.349609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 8.0, 7.0, 11.0, 15.0, 14.0, 23.0, 43.0, 45.0, 68.0, 82.0, 92.0, 98.0, 102.0, 73.0, 76.0, 83.0, 51.0, 30.0, 17.0, 13.0, 10.0, 11.0, 12.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.715721130371094, -25.685707092285156, -24.65569305419922, -23.62567901611328, -22.59566307067871, -21.565649032592773, -20.535634994506836, -19.5056209564209, -18.475605010986328, -17.44559097290039, -16.415576934814453, -15.3855619430542, -14.355546951293945, -13.325532913208008, -12.29551887512207, -11.265504837036133, -10.235490798950195, -9.205476760864258, -8.175461769104004, -7.145447731018066, -6.115433216094971, -5.085418701171875, -4.0554046630859375, -3.025390148162842, -1.995375633239746, -0.9653612375259399, 0.06465315818786621, 1.0946674346923828, 2.1246819496154785, 3.154696464538574, 4.184710502624512, 5.214725017547607, 6.244739532470703, 7.274754047393799, 8.304768562316895, 9.334782600402832, 10.364797592163086, 11.394811630249023, 12.424825668334961, 13.454839706420898, 14.484854698181152, 15.51486873626709, 16.544883728027344, 17.57489776611328, 18.60491180419922, 19.634925842285156, 20.664939880371094, 21.694955825805664, 22.7249698638916, 23.75498390197754, 24.784997940063477, 25.815013885498047, 26.845027923583984, 27.875041961669922, 28.90505599975586, 29.935070037841797, 30.965084075927734, 31.995098114013672, 33.02511215209961, 34.05512619018555, 35.085140228271484, 36.11515808105469, 37.145172119140625, 38.17518615722656, 39.2052001953125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 7.0, 6.0, 15.0, 10.0, 9.0, 14.0, 20.0, 14.0, 19.0, 19.0, 17.0, 27.0, 34.0, 40.0, 34.0, 41.0, 41.0, 45.0, 30.0, 41.0, 32.0, 44.0, 40.0, 29.0, 35.0, 47.0, 41.0, 38.0, 33.0, 20.0, 19.0, 25.0, 24.0, 21.0, 19.0, 9.0, 13.0, 5.0, 7.0, 5.0, 5.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-23.517778396606445, -22.787986755371094, -22.05819320678711, -21.328399658203125, -20.598608016967773, -19.868816375732422, -19.139022827148438, -18.409229278564453, -17.6794376373291, -16.94964599609375, -16.219852447509766, -15.490059852600098, -14.76026725769043, -14.030474662780762, -13.300682067871094, -12.570889472961426, -11.841096878051758, -11.11130428314209, -10.381511688232422, -9.651719093322754, -8.921926498413086, -8.192133903503418, -7.46234130859375, -6.732548713684082, -6.002756118774414, -5.272963523864746, -4.543170928955078, -3.81337833404541, -3.083585739135742, -2.353793144226074, -1.6240005493164062, -0.8942079544067383, -0.16441726684570312, 0.5653753280639648, 1.2951679229736328, 2.024960517883301, 2.7547531127929688, 3.4845457077026367, 4.214338302612305, 4.944130897521973, 5.673923492431641, 6.403716087341309, 7.133508682250977, 7.8633012771606445, 8.593093872070312, 9.32288646697998, 10.052679061889648, 10.782471656799316, 11.512264251708984, 12.242056846618652, 12.97184944152832, 13.701642036437988, 14.431434631347656, 15.161227226257324, 15.891019821166992, 16.620811462402344, 17.350605010986328, 18.080398559570312, 18.810190200805664, 19.539981842041016, 20.269775390625, 20.999568939208984, 21.729360580444336, 22.459152221679688, 23.188945770263672]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 7.0, 18.0, 18.0, 14.0, 25.0, 46.0, 68.0, 116.0, 178.0, 250.0, 473.0, 963.0, 2066.0, 5357.0, 17516.0, 121078.0, 3902390.0, 117223.0, 17646.0, 5017.0, 1947.0, 837.0, 445.0, 214.0, 141.0, 78.0, 48.0, 29.0, 26.0, 8.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.104248046875, -11.76318359375, -11.422119140625, -11.0810546875, -10.739990234375, -10.39892578125, -10.057861328125, -9.716796875, -9.375732421875, -9.03466796875, -8.693603515625, -8.3525390625, -8.011474609375, -7.67041015625, -7.329345703125, -6.98828125, -6.647216796875, -6.30615234375, -5.965087890625, -5.6240234375, -5.282958984375, -4.94189453125, -4.600830078125, -4.259765625, -3.918701171875, -3.57763671875, -3.236572265625, -2.8955078125, -2.554443359375, -2.21337890625, -1.872314453125, -1.53125, -1.190185546875, -0.84912109375, -0.508056640625, -0.1669921875, 0.174072265625, 0.51513671875, 0.856201171875, 1.197265625, 1.538330078125, 1.87939453125, 2.220458984375, 2.5615234375, 2.902587890625, 3.24365234375, 3.584716796875, 3.92578125, 4.266845703125, 4.60791015625, 4.948974609375, 5.2900390625, 5.631103515625, 5.97216796875, 6.313232421875, 6.654296875, 6.995361328125, 7.33642578125, 7.677490234375, 8.0185546875, 8.359619140625, 8.70068359375, 9.041748046875, 9.3828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 8.0, 15.0, 11.0, 21.0, 26.0, 34.0, 38.0, 38.0, 40.0, 51.0, 50.0, 43.0, 61.0, 56.0, 54.0, 53.0, 62.0, 49.0, 46.0, 37.0, 33.0, 31.0, 34.0, 18.0, 18.0, 14.0, 19.0, 4.0, 7.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.25, -1.2160568237304688, -1.1821136474609375, -1.1481704711914062, -1.114227294921875, -1.0802841186523438, -1.0463409423828125, -1.0123977661132812, -0.97845458984375, -0.9445114135742188, -0.9105682373046875, -0.8766250610351562, -0.842681884765625, -0.8087387084960938, -0.7747955322265625, -0.7408523559570312, -0.7069091796875, -0.6729660034179688, -0.6390228271484375, -0.6050796508789062, -0.571136474609375, -0.5371932983398438, -0.5032501220703125, -0.46930694580078125, -0.43536376953125, -0.40142059326171875, -0.3674774169921875, -0.33353424072265625, -0.299591064453125, -0.26564788818359375, -0.2317047119140625, -0.19776153564453125, -0.163818359375, -0.12987518310546875, -0.0959320068359375, -0.06198883056640625, -0.028045654296875, 0.00589752197265625, 0.0398406982421875, 0.07378387451171875, 0.10772705078125, 0.14167022705078125, 0.1756134033203125, 0.20955657958984375, 0.243499755859375, 0.27744293212890625, 0.3113861083984375, 0.34532928466796875, 0.3792724609375, 0.41321563720703125, 0.4471588134765625, 0.48110198974609375, 0.515045166015625, 0.5489883422851562, 0.5829315185546875, 0.6168746948242188, 0.65081787109375, 0.6847610473632812, 0.7187042236328125, 0.7526473999023438, 0.786590576171875, 0.8205337524414062, 0.8544769287109375, 0.8884201049804688, 0.92236328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 3.0, 10.0, 10.0, 8.0, 19.0, 29.0, 28.0, 36.0, 60.0, 98.0, 112.0, 165.0, 247.0, 378.0, 551.0, 867.0, 1387.0, 2336.0, 4220.0, 8201.0, 17123.0, 42040.0, 131807.0, 1033434.0, 2667152.0, 187309.0, 53618.0, 21227.0, 9906.0, 4897.0, 2662.0, 1595.0, 960.0, 546.0, 396.0, 248.0, 171.0, 133.0, 87.0, 54.0, 41.0, 35.0, 20.0, 15.0, 14.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.67578125, -4.53021240234375, -4.3846435546875, -4.23907470703125, -4.093505859375, -3.94793701171875, -3.8023681640625, -3.65679931640625, -3.51123046875, -3.36566162109375, -3.2200927734375, -3.07452392578125, -2.928955078125, -2.78338623046875, -2.6378173828125, -2.49224853515625, -2.3466796875, -2.20111083984375, -2.0555419921875, -1.90997314453125, -1.764404296875, -1.61883544921875, -1.4732666015625, -1.32769775390625, -1.18212890625, -1.03656005859375, -0.8909912109375, -0.74542236328125, -0.599853515625, -0.45428466796875, -0.3087158203125, -0.16314697265625, -0.017578125, 0.12799072265625, 0.2735595703125, 0.41912841796875, 0.564697265625, 0.71026611328125, 0.8558349609375, 1.00140380859375, 1.14697265625, 1.29254150390625, 1.4381103515625, 1.58367919921875, 1.729248046875, 1.87481689453125, 2.0203857421875, 2.16595458984375, 2.3115234375, 2.45709228515625, 2.6026611328125, 2.74822998046875, 2.893798828125, 3.03936767578125, 3.1849365234375, 3.33050537109375, 3.47607421875, 3.62164306640625, 3.7672119140625, 3.91278076171875, 4.058349609375, 4.20391845703125, 4.3494873046875, 4.49505615234375, 4.640625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 8.0, 14.0, 18.0, 17.0, 20.0, 47.0, 63.0, 78.0, 141.0, 250.0, 608.0, 1595.0, 573.0, 202.0, 107.0, 79.0, 56.0, 40.0, 28.0, 20.0, 15.0, 24.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.355377197265625, -2.28692626953125, -2.218475341796875, -2.1500244140625, -2.081573486328125, -2.01312255859375, -1.944671630859375, -1.876220703125, -1.807769775390625, -1.73931884765625, -1.670867919921875, -1.6024169921875, -1.533966064453125, -1.46551513671875, -1.397064208984375, -1.32861328125, -1.260162353515625, -1.19171142578125, -1.123260498046875, -1.0548095703125, -0.986358642578125, -0.91790771484375, -0.849456787109375, -0.781005859375, -0.712554931640625, -0.64410400390625, -0.575653076171875, -0.5072021484375, -0.438751220703125, -0.37030029296875, -0.301849365234375, -0.2333984375, -0.164947509765625, -0.09649658203125, -0.028045654296875, 0.0404052734375, 0.108856201171875, 0.17730712890625, 0.245758056640625, 0.314208984375, 0.382659912109375, 0.45111083984375, 0.519561767578125, 0.5880126953125, 0.656463623046875, 0.72491455078125, 0.793365478515625, 0.86181640625, 0.930267333984375, 0.99871826171875, 1.067169189453125, 1.1356201171875, 1.204071044921875, 1.27252197265625, 1.340972900390625, 1.409423828125, 1.477874755859375, 1.54632568359375, 1.614776611328125, 1.6832275390625, 1.751678466796875, 1.82012939453125, 1.888580322265625, 1.95703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 8.0, 10.0, 19.0, 44.0, 68.0, 120.0, 149.0, 177.0, 151.0, 102.0, 68.0, 32.0, 24.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.70559310913086, -19.080358505249023, -18.455123901367188, -17.82988929748535, -17.204654693603516, -16.57942008972168, -15.95418643951416, -15.328951835632324, -14.703717231750488, -14.078482627868652, -13.453248023986816, -12.82801342010498, -12.202779769897461, -11.577545166015625, -10.952310562133789, -10.327075958251953, -9.701841354370117, -9.076606750488281, -8.451372146606445, -7.826138019561768, -7.200903415679932, -6.575668811798096, -5.950434684753418, -5.325200080871582, -4.699965476989746, -4.07473087310791, -3.4494965076446533, -2.8242621421813965, -2.1990275382995605, -1.5737929344177246, -0.9485585689544678, -0.32332420349121094, 0.3019123077392578, 0.9271467924118042, 1.5523812770843506, 2.1776156425476074, 2.8028502464294434, 3.4280848503112793, 4.053318977355957, 4.678553581237793, 5.303788185119629, 5.929022789001465, 6.554257392883301, 7.1794915199279785, 7.8047261238098145, 8.429960250854492, 9.055194854736328, 9.680429458618164, 10.3056640625, 10.930898666381836, 11.556133270263672, 12.181367874145508, 12.806602478027344, 13.43183708190918, 14.0570707321167, 14.682305335998535, 15.307539939880371, 15.932774543762207, 16.558008193969727, 17.183242797851562, 17.8084774017334, 18.433712005615234, 19.05894660949707, 19.684181213378906, 20.309415817260742]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 1.0, 7.0, 4.0, 5.0, 8.0, 12.0, 20.0, 19.0, 23.0, 20.0, 21.0, 23.0, 29.0, 31.0, 45.0, 46.0, 38.0, 49.0, 41.0, 35.0, 43.0, 46.0, 45.0, 31.0, 44.0, 42.0, 31.0, 27.0, 38.0, 26.0, 26.0, 13.0, 20.0, 14.0, 17.0, 16.0, 6.0, 9.0, 8.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.572405815124512, -7.335194110870361, -7.097982406616211, -6.8607707023620605, -6.62355899810791, -6.38634729385376, -6.149135589599609, -5.911923885345459, -5.674712181091309, -5.437500476837158, -5.200288772583008, -4.963077068328857, -4.725865364074707, -4.488653659820557, -4.251441955566406, -4.014230251312256, -3.7770187854766846, -3.539807081222534, -3.302595376968384, -3.0653836727142334, -2.828171968460083, -2.5909605026245117, -2.3537487983703613, -2.116537094116211, -1.879325270652771, -1.6421135663986206, -1.4049018621444702, -1.1676902770996094, -0.9304785132408142, -0.6932668685913086, -0.4560551643371582, -0.2188434600830078, 0.018368244171142578, 0.25557994842529297, 0.49279162287712097, 0.730003297328949, 0.9672150015830994, 1.204426646232605, 1.4416383504867554, 1.6788500547409058, 1.9160617589950562, 2.153273344039917, 2.3904850482940674, 2.6276967525482178, 2.864908456802368, 3.1021201610565186, 3.339331865310669, 3.5765435695648193, 3.8137552738189697, 4.050966739654541, 4.288178443908691, 4.525390148162842, 4.762601852416992, 4.999813556671143, 5.237025260925293, 5.474236965179443, 5.711448669433594, 5.948660373687744, 6.1858720779418945, 6.423083782196045, 6.660295486450195, 6.897507190704346, 7.134718894958496, 7.3719305992126465, 7.609142303466797]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 17.0, 5.0, 15.0, 18.0, 41.0, 84.0, 101.0, 187.0, 265.0, 475.0, 883.0, 1607.0, 3428.0, 7546.0, 18496.0, 52062.0, 164334.0, 460287.0, 226767.0, 69799.0, 24176.0, 9457.0, 4148.0, 1957.0, 1027.0, 523.0, 334.0, 183.0, 106.0, 75.0, 45.0, 29.0, 24.0, 22.0, 9.0, 5.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.1640625, -6.9510498046875, -6.738037109375, -6.5250244140625, -6.31201171875, -6.0989990234375, -5.885986328125, -5.6729736328125, -5.4599609375, -5.2469482421875, -5.033935546875, -4.8209228515625, -4.60791015625, -4.3948974609375, -4.181884765625, -3.9688720703125, -3.755859375, -3.5428466796875, -3.329833984375, -3.1168212890625, -2.90380859375, -2.6907958984375, -2.477783203125, -2.2647705078125, -2.0517578125, -1.8387451171875, -1.625732421875, -1.4127197265625, -1.19970703125, -0.9866943359375, -0.773681640625, -0.5606689453125, -0.34765625, -0.1346435546875, 0.078369140625, 0.2913818359375, 0.50439453125, 0.7174072265625, 0.930419921875, 1.1434326171875, 1.3564453125, 1.5694580078125, 1.782470703125, 1.9954833984375, 2.20849609375, 2.4215087890625, 2.634521484375, 2.8475341796875, 3.060546875, 3.2735595703125, 3.486572265625, 3.6995849609375, 3.91259765625, 4.1256103515625, 4.338623046875, 4.5516357421875, 4.7646484375, 4.9776611328125, 5.190673828125, 5.4036865234375, 5.61669921875, 5.8297119140625, 6.042724609375, 6.2557373046875, 6.46875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 3.0, 5.0, 8.0, 8.0, 16.0, 21.0, 18.0, 39.0, 39.0, 40.0, 37.0, 48.0, 51.0, 52.0, 52.0, 54.0, 48.0, 46.0, 41.0, 46.0, 45.0, 53.0, 34.0, 39.0, 31.0, 21.0, 24.0, 18.0, 9.0, 16.0, 3.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.14453125, -1.11090087890625, -1.0772705078125, -1.04364013671875, -1.010009765625, -0.97637939453125, -0.9427490234375, -0.90911865234375, -0.87548828125, -0.84185791015625, -0.8082275390625, -0.77459716796875, -0.740966796875, -0.70733642578125, -0.6737060546875, -0.64007568359375, -0.6064453125, -0.57281494140625, -0.5391845703125, -0.50555419921875, -0.471923828125, -0.43829345703125, -0.4046630859375, -0.37103271484375, -0.33740234375, -0.30377197265625, -0.2701416015625, -0.23651123046875, -0.202880859375, -0.16925048828125, -0.1356201171875, -0.10198974609375, -0.068359375, -0.03472900390625, -0.0010986328125, 0.03253173828125, 0.066162109375, 0.09979248046875, 0.1334228515625, 0.16705322265625, 0.20068359375, 0.23431396484375, 0.2679443359375, 0.30157470703125, 0.335205078125, 0.36883544921875, 0.4024658203125, 0.43609619140625, 0.4697265625, 0.50335693359375, 0.5369873046875, 0.57061767578125, 0.604248046875, 0.63787841796875, 0.6715087890625, 0.70513916015625, 0.73876953125, 0.77239990234375, 0.8060302734375, 0.83966064453125, 0.873291015625, 0.90692138671875, 0.9405517578125, 0.97418212890625, 1.0078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 3.0, 8.0, 23.0, 23.0, 27.0, 38.0, 52.0, 60.0, 77.0, 112.0, 151.0, 223.0, 356.0, 552.0, 1038.0, 2118.0, 5896.0, 22926.0, 110433.0, 520430.0, 305670.0, 57592.0, 13035.0, 3910.0, 1531.0, 779.0, 449.0, 315.0, 188.0, 143.0, 92.0, 81.0, 53.0, 38.0, 31.0, 19.0, 15.0, 13.0, 8.0, 6.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8359375, -7.61077880859375, -7.3856201171875, -7.16046142578125, -6.935302734375, -6.71014404296875, -6.4849853515625, -6.25982666015625, -6.03466796875, -5.80950927734375, -5.5843505859375, -5.35919189453125, -5.134033203125, -4.90887451171875, -4.6837158203125, -4.45855712890625, -4.2333984375, -4.00823974609375, -3.7830810546875, -3.55792236328125, -3.332763671875, -3.10760498046875, -2.8824462890625, -2.65728759765625, -2.43212890625, -2.20697021484375, -1.9818115234375, -1.75665283203125, -1.531494140625, -1.30633544921875, -1.0811767578125, -0.85601806640625, -0.630859375, -0.40570068359375, -0.1805419921875, 0.04461669921875, 0.269775390625, 0.49493408203125, 0.7200927734375, 0.94525146484375, 1.17041015625, 1.39556884765625, 1.6207275390625, 1.84588623046875, 2.071044921875, 2.29620361328125, 2.5213623046875, 2.74652099609375, 2.9716796875, 3.19683837890625, 3.4219970703125, 3.64715576171875, 3.872314453125, 4.09747314453125, 4.3226318359375, 4.54779052734375, 4.77294921875, 4.99810791015625, 5.2232666015625, 5.44842529296875, 5.673583984375, 5.89874267578125, 6.1239013671875, 6.34906005859375, 6.57421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 10.0, 12.0, 11.0, 16.0, 20.0, 17.0, 15.0, 24.0, 33.0, 51.0, 30.0, 41.0, 45.0, 50.0, 33.0, 55.0, 53.0, 53.0, 53.0, 57.0, 39.0, 41.0, 37.0, 36.0, 29.0, 24.0, 20.0, 17.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.62884521484375, -4.4803466796875, -4.33184814453125, -4.183349609375, -4.03485107421875, -3.8863525390625, -3.73785400390625, -3.58935546875, -3.44085693359375, -3.2923583984375, -3.14385986328125, -2.995361328125, -2.84686279296875, -2.6983642578125, -2.54986572265625, -2.4013671875, -2.25286865234375, -2.1043701171875, -1.95587158203125, -1.807373046875, -1.65887451171875, -1.5103759765625, -1.36187744140625, -1.21337890625, -1.06488037109375, -0.9163818359375, -0.76788330078125, -0.619384765625, -0.47088623046875, -0.3223876953125, -0.17388916015625, -0.025390625, 0.12310791015625, 0.2716064453125, 0.42010498046875, 0.568603515625, 0.71710205078125, 0.8656005859375, 1.01409912109375, 1.16259765625, 1.31109619140625, 1.4595947265625, 1.60809326171875, 1.756591796875, 1.90509033203125, 2.0535888671875, 2.20208740234375, 2.3505859375, 2.49908447265625, 2.6475830078125, 2.79608154296875, 2.944580078125, 3.09307861328125, 3.2415771484375, 3.39007568359375, 3.53857421875, 3.68707275390625, 3.8355712890625, 3.98406982421875, 4.132568359375, 4.28106689453125, 4.4295654296875, 4.57806396484375, 4.7265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 7.0, 19.0, 24.0, 32.0, 54.0, 96.0, 172.0, 293.0, 654.0, 1352.0, 3589.0, 12564.0, 87278.0, 788790.0, 130783.0, 15525.0, 4195.0, 1572.0, 684.0, 357.0, 214.0, 110.0, 75.0, 35.0, 21.0, 17.0, 10.0, 10.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.4296875, -9.197265625, -8.96484375, -8.732421875, -8.5, -8.267578125, -8.03515625, -7.802734375, -7.5703125, -7.337890625, -7.10546875, -6.873046875, -6.640625, -6.408203125, -6.17578125, -5.943359375, -5.7109375, -5.478515625, -5.24609375, -5.013671875, -4.78125, -4.548828125, -4.31640625, -4.083984375, -3.8515625, -3.619140625, -3.38671875, -3.154296875, -2.921875, -2.689453125, -2.45703125, -2.224609375, -1.9921875, -1.759765625, -1.52734375, -1.294921875, -1.0625, -0.830078125, -0.59765625, -0.365234375, -0.1328125, 0.099609375, 0.33203125, 0.564453125, 0.796875, 1.029296875, 1.26171875, 1.494140625, 1.7265625, 1.958984375, 2.19140625, 2.423828125, 2.65625, 2.888671875, 3.12109375, 3.353515625, 3.5859375, 3.818359375, 4.05078125, 4.283203125, 4.515625, 4.748046875, 4.98046875, 5.212890625, 5.4453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 13.0, 7.0, 13.0, 18.0, 18.0, 17.0, 32.0, 26.0, 35.0, 47.0, 63.0, 76.0, 86.0, 111.0, 85.0, 76.0, 51.0, 37.0, 38.0, 33.0, 19.0, 14.0, 17.0, 11.0, 4.0, 7.0, 7.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004870891571044922, -0.0004704482853412628, -0.00045380741357803345, -0.0004371665418148041, -0.0004205256700515747, -0.00040388479828834534, -0.00038724392652511597, -0.0003706030547618866, -0.0003539621829986572, -0.00033732131123542786, -0.0003206804394721985, -0.0003040395677089691, -0.00028739869594573975, -0.0002707578241825104, -0.000254116952419281, -0.00023747608065605164, -0.00022083520889282227, -0.0002041943371295929, -0.00018755346536636353, -0.00017091259360313416, -0.00015427172183990479, -0.00013763085007667542, -0.00012098997831344604, -0.00010434910655021667, -8.77082347869873e-05, -7.106736302375793e-05, -5.4426491260528564e-05, -3.7785619497299194e-05, -2.1144747734069824e-05, -4.503875970840454e-06, 1.2136995792388916e-05, 2.8777867555618286e-05, 4.5418739318847656e-05, 6.205961108207703e-05, 7.87004828453064e-05, 9.534135460853577e-05, 0.00011198222637176514, 0.0001286230981349945, 0.00014526396989822388, 0.00016190484166145325, 0.00017854571342468262, 0.000195186585187912, 0.00021182745695114136, 0.00022846832871437073, 0.0002451092004776001, 0.00026175007224082947, 0.00027839094400405884, 0.0002950318157672882, 0.0003116726875305176, 0.00032831355929374695, 0.0003449544310569763, 0.0003615953028202057, 0.00037823617458343506, 0.00039487704634666443, 0.0004115179181098938, 0.00042815878987312317, 0.00044479966163635254, 0.0004614405333995819, 0.0004780814051628113, 0.0004947222769260406, 0.00051136314868927, 0.0005280040204524994, 0.0005446448922157288, 0.0005612857639789581, 0.0005779266357421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 5.0, 14.0, 11.0, 11.0, 22.0, 28.0, 41.0, 51.0, 73.0, 101.0, 191.0, 350.0, 727.0, 1884.0, 5565.0, 21218.0, 197750.0, 740807.0, 62466.0, 11278.0, 3320.0, 1322.0, 557.0, 289.0, 140.0, 98.0, 66.0, 44.0, 29.0, 23.0, 15.0, 18.0, 7.0, 1.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0546875, -5.84063720703125, -5.6265869140625, -5.41253662109375, -5.198486328125, -4.98443603515625, -4.7703857421875, -4.55633544921875, -4.34228515625, -4.12823486328125, -3.9141845703125, -3.70013427734375, -3.486083984375, -3.27203369140625, -3.0579833984375, -2.84393310546875, -2.6298828125, -2.41583251953125, -2.2017822265625, -1.98773193359375, -1.773681640625, -1.55963134765625, -1.3455810546875, -1.13153076171875, -0.91748046875, -0.70343017578125, -0.4893798828125, -0.27532958984375, -0.061279296875, 0.15277099609375, 0.3668212890625, 0.58087158203125, 0.794921875, 1.00897216796875, 1.2230224609375, 1.43707275390625, 1.651123046875, 1.86517333984375, 2.0792236328125, 2.29327392578125, 2.50732421875, 2.72137451171875, 2.9354248046875, 3.14947509765625, 3.363525390625, 3.57757568359375, 3.7916259765625, 4.00567626953125, 4.2197265625, 4.43377685546875, 4.6478271484375, 4.86187744140625, 5.075927734375, 5.28997802734375, 5.5040283203125, 5.71807861328125, 5.93212890625, 6.14617919921875, 6.3602294921875, 6.57427978515625, 6.788330078125, 7.00238037109375, 7.2164306640625, 7.43048095703125, 7.64453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 9.0, 9.0, 12.0, 24.0, 40.0, 83.0, 125.0, 165.0, 162.0, 134.0, 76.0, 38.0, 39.0, 16.0, 16.0, 9.0, 8.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5823974609375, -5.422607421875, -5.2628173828125, -5.10302734375, -4.9432373046875, -4.783447265625, -4.6236572265625, -4.4638671875, -4.3040771484375, -4.144287109375, -3.9844970703125, -3.82470703125, -3.6649169921875, -3.505126953125, -3.3453369140625, -3.185546875, -3.0257568359375, -2.865966796875, -2.7061767578125, -2.54638671875, -2.3865966796875, -2.226806640625, -2.0670166015625, -1.9072265625, -1.7474365234375, -1.587646484375, -1.4278564453125, -1.26806640625, -1.1082763671875, -0.948486328125, -0.7886962890625, -0.62890625, -0.4691162109375, -0.309326171875, -0.1495361328125, 0.01025390625, 0.1700439453125, 0.329833984375, 0.4896240234375, 0.6494140625, 0.8092041015625, 0.968994140625, 1.1287841796875, 1.28857421875, 1.4483642578125, 1.608154296875, 1.7679443359375, 1.927734375, 2.0875244140625, 2.247314453125, 2.4071044921875, 2.56689453125, 2.7266845703125, 2.886474609375, 3.0462646484375, 3.2060546875, 3.3658447265625, 3.525634765625, 3.6854248046875, 3.84521484375, 4.0050048828125, 4.164794921875, 4.3245849609375, 4.484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 23.0, 52.0, 134.0, 236.0, 251.0, 160.0, 71.0, 35.0, 12.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.72313690185547, -62.26317596435547, -59.80321502685547, -57.34325408935547, -54.88329315185547, -52.42333221435547, -49.96337127685547, -47.50341033935547, -45.04344940185547, -42.58348846435547, -40.12352752685547, -37.66356658935547, -35.20360565185547, -32.74364471435547, -30.28368377685547, -27.82372283935547, -25.36376190185547, -22.90380096435547, -20.44384002685547, -17.98387908935547, -15.523918151855469, -13.063957214355469, -10.603996276855469, -8.144035339355469, -5.684074401855469, -3.2241134643554688, -0.7641525268554688, 1.6958084106445312, 4.155769348144531, 6.615730285644531, 9.075691223144531, 11.535652160644531, 13.995613098144531, 16.45557403564453, 18.91553497314453, 21.37549591064453, 23.83545684814453, 26.29541778564453, 28.75537872314453, 31.21533966064453, 33.67530059814453, 36.13526153564453, 38.59522247314453, 41.05518341064453, 43.51514434814453, 45.97510528564453, 48.43506622314453, 50.89502716064453, 53.35498809814453, 55.81494903564453, 58.27490997314453, 60.73487091064453, 63.19483184814453, 65.65479278564453, 68.11475372314453, 70.57471466064453, 73.03467559814453, 75.49463653564453, 77.95459747314453, 80.41455841064453, 82.87451934814453, 85.33448028564453, 87.79444122314453, 90.25440216064453, 92.71436309814453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 17.0, 19.0, 19.0, 18.0, 25.0, 20.0, 25.0, 37.0, 36.0, 40.0, 28.0, 38.0, 35.0, 36.0, 43.0, 39.0, 53.0, 43.0, 41.0, 35.0, 43.0, 34.0, 31.0, 31.0, 24.0, 27.0, 23.0, 18.0, 9.0, 16.0, 12.0, 3.0, 8.0, 15.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.24639320373535, -21.511661529541016, -20.77692985534668, -20.042198181152344, -19.307466506958008, -18.572734832763672, -17.83800506591797, -17.103271484375, -16.368541717529297, -15.633810043334961, -14.899078369140625, -14.164346694946289, -13.429615020751953, -12.694883346557617, -11.960152626037598, -11.225420951843262, -10.49068832397461, -9.755956649780273, -9.021224975585938, -8.286493301391602, -7.551762104034424, -6.817030429840088, -6.08229923248291, -5.347567558288574, -4.612835884094238, -3.8781042098999023, -3.1433727741241455, -2.4086413383483887, -1.6739096641540527, -0.9391779899597168, -0.20444679260253906, 0.5302848815917969, 1.2650184631347656, 1.999750018119812, 2.7344815731048584, 3.4692130088806152, 4.203944683074951, 4.938676357269287, 5.673407554626465, 6.408139228820801, 7.142870903015137, 7.877602577209473, 8.612334251403809, 9.347064971923828, 10.081796646118164, 10.8165283203125, 11.551259994506836, 12.285991668701172, 13.020723342895508, 13.755455017089844, 14.49018669128418, 15.224918365478516, 15.959650039672852, 16.694381713867188, 17.42911148071289, 18.16384506225586, 18.898574829101562, 19.6333065032959, 20.368038177490234, 21.10276985168457, 21.837501525878906, 22.572233200073242, 23.306964874267578, 24.04169464111328, 24.77642822265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 9.0, 9.0, 9.0, 18.0, 26.0, 34.0, 36.0, 55.0, 115.0, 128.0, 180.0, 286.0, 432.0, 729.0, 1170.0, 1957.0, 3575.0, 6885.0, 14554.0, 36514.0, 131398.0, 2799093.0, 1037753.0, 101923.0, 31032.0, 12574.0, 6044.0, 3083.0, 1832.0, 1046.0, 597.0, 359.0, 243.0, 176.0, 132.0, 73.0, 46.0, 51.0, 25.0, 23.0, 17.0, 11.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.21484375, -5.056396484375, -4.89794921875, -4.739501953125, -4.5810546875, -4.422607421875, -4.26416015625, -4.105712890625, -3.947265625, -3.788818359375, -3.63037109375, -3.471923828125, -3.3134765625, -3.155029296875, -2.99658203125, -2.838134765625, -2.6796875, -2.521240234375, -2.36279296875, -2.204345703125, -2.0458984375, -1.887451171875, -1.72900390625, -1.570556640625, -1.412109375, -1.253662109375, -1.09521484375, -0.936767578125, -0.7783203125, -0.619873046875, -0.46142578125, -0.302978515625, -0.14453125, 0.013916015625, 0.17236328125, 0.330810546875, 0.4892578125, 0.647705078125, 0.80615234375, 0.964599609375, 1.123046875, 1.281494140625, 1.43994140625, 1.598388671875, 1.7568359375, 1.915283203125, 2.07373046875, 2.232177734375, 2.390625, 2.549072265625, 2.70751953125, 2.865966796875, 3.0244140625, 3.182861328125, 3.34130859375, 3.499755859375, 3.658203125, 3.816650390625, 3.97509765625, 4.133544921875, 4.2919921875, 4.450439453125, 4.60888671875, 4.767333984375, 4.92578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 11.0, 6.0, 17.0, 14.0, 10.0, 25.0, 29.0, 39.0, 39.0, 53.0, 35.0, 43.0, 54.0, 50.0, 53.0, 52.0, 62.0, 44.0, 47.0, 47.0, 37.0, 40.0, 29.0, 35.0, 30.0, 22.0, 11.0, 13.0, 9.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19921875, -1.16302490234375, -1.1268310546875, -1.09063720703125, -1.054443359375, -1.01824951171875, -0.9820556640625, -0.94586181640625, -0.90966796875, -0.87347412109375, -0.8372802734375, -0.80108642578125, -0.764892578125, -0.72869873046875, -0.6925048828125, -0.65631103515625, -0.6201171875, -0.58392333984375, -0.5477294921875, -0.51153564453125, -0.475341796875, -0.43914794921875, -0.4029541015625, -0.36676025390625, -0.33056640625, -0.29437255859375, -0.2581787109375, -0.22198486328125, -0.185791015625, -0.14959716796875, -0.1134033203125, -0.07720947265625, -0.041015625, -0.00482177734375, 0.0313720703125, 0.06756591796875, 0.103759765625, 0.13995361328125, 0.1761474609375, 0.21234130859375, 0.24853515625, 0.28472900390625, 0.3209228515625, 0.35711669921875, 0.393310546875, 0.42950439453125, 0.4656982421875, 0.50189208984375, 0.5380859375, 0.57427978515625, 0.6104736328125, 0.64666748046875, 0.682861328125, 0.71905517578125, 0.7552490234375, 0.79144287109375, 0.82763671875, 0.86383056640625, 0.9000244140625, 0.93621826171875, 0.972412109375, 1.00860595703125, 1.0447998046875, 1.08099365234375, 1.1171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 19.0, 21.0, 40.0, 70.0, 77.0, 135.0, 231.0, 371.0, 686.0, 1188.0, 2525.0, 5708.0, 15878.0, 60887.0, 474700.0, 3377492.0, 198694.0, 36212.0, 10919.0, 4062.0, 1885.0, 985.0, 588.0, 282.0, 204.0, 135.0, 75.0, 58.0, 46.0, 27.0, 16.0, 14.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.09149169921875, -4.8822021484375, -4.67291259765625, -4.463623046875, -4.25433349609375, -4.0450439453125, -3.83575439453125, -3.62646484375, -3.41717529296875, -3.2078857421875, -2.99859619140625, -2.789306640625, -2.58001708984375, -2.3707275390625, -2.16143798828125, -1.9521484375, -1.74285888671875, -1.5335693359375, -1.32427978515625, -1.114990234375, -0.90570068359375, -0.6964111328125, -0.48712158203125, -0.27783203125, -0.06854248046875, 0.1407470703125, 0.35003662109375, 0.559326171875, 0.76861572265625, 0.9779052734375, 1.18719482421875, 1.396484375, 1.60577392578125, 1.8150634765625, 2.02435302734375, 2.233642578125, 2.44293212890625, 2.6522216796875, 2.86151123046875, 3.07080078125, 3.28009033203125, 3.4893798828125, 3.69866943359375, 3.907958984375, 4.11724853515625, 4.3265380859375, 4.53582763671875, 4.7451171875, 4.95440673828125, 5.1636962890625, 5.37298583984375, 5.582275390625, 5.79156494140625, 6.0008544921875, 6.21014404296875, 6.41943359375, 6.62872314453125, 6.8380126953125, 7.04730224609375, 7.256591796875, 7.46588134765625, 7.6751708984375, 7.88446044921875, 8.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 14.0, 16.0, 13.0, 25.0, 37.0, 51.0, 81.0, 157.0, 236.0, 636.0, 1558.0, 614.0, 238.0, 129.0, 82.0, 49.0, 37.0, 18.0, 17.0, 13.0, 9.0, 12.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.19183349609375, -2.0985107421875, -2.00518798828125, -1.911865234375, -1.81854248046875, -1.7252197265625, -1.63189697265625, -1.53857421875, -1.44525146484375, -1.3519287109375, -1.25860595703125, -1.165283203125, -1.07196044921875, -0.9786376953125, -0.88531494140625, -0.7919921875, -0.69866943359375, -0.6053466796875, -0.51202392578125, -0.418701171875, -0.32537841796875, -0.2320556640625, -0.13873291015625, -0.04541015625, 0.04791259765625, 0.1412353515625, 0.23455810546875, 0.327880859375, 0.42120361328125, 0.5145263671875, 0.60784912109375, 0.701171875, 0.79449462890625, 0.8878173828125, 0.98114013671875, 1.074462890625, 1.16778564453125, 1.2611083984375, 1.35443115234375, 1.44775390625, 1.54107666015625, 1.6343994140625, 1.72772216796875, 1.821044921875, 1.91436767578125, 2.0076904296875, 2.10101318359375, 2.1943359375, 2.28765869140625, 2.3809814453125, 2.47430419921875, 2.567626953125, 2.66094970703125, 2.7542724609375, 2.84759521484375, 2.94091796875, 3.03424072265625, 3.1275634765625, 3.22088623046875, 3.314208984375, 3.40753173828125, 3.5008544921875, 3.59417724609375, 3.6875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 9.0, 9.0, 9.0, 28.0, 37.0, 43.0, 72.0, 98.0, 96.0, 147.0, 118.0, 105.0, 107.0, 51.0, 32.0, 12.0, 10.0, 13.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.24634552001953, -19.67736053466797, -19.108373641967773, -18.53938865661621, -17.97040367126465, -17.401418685913086, -16.83243179321289, -16.263446807861328, -15.694461822509766, -15.125475883483887, -14.556490898132324, -13.987504959106445, -13.418519973754883, -12.849534034729004, -12.280548095703125, -11.711563110351562, -11.142577171325684, -10.573591232299805, -10.004606246948242, -9.435620307922363, -8.8666353225708, -8.297649383544922, -7.728663921356201, -7.1596784591674805, -6.59069299697876, -6.021707534790039, -5.452722072601318, -4.883736610412598, -4.314750671386719, -3.745765447616577, -3.1767797470092773, -2.6077942848205566, -2.038808822631836, -1.4698233604431152, -0.900837779045105, -0.3318521976470947, 0.23713326454162598, 0.8061187267303467, 1.3751044273376465, 1.9440898895263672, 2.513075351715088, 3.0820608139038086, 3.6510462760925293, 4.22003173828125, 4.789017677307129, 5.358002662658691, 5.92698860168457, 6.495974063873291, 7.064959526062012, 7.633944988250732, 8.202930450439453, 8.771916389465332, 9.340901374816895, 9.909887313842773, 10.478872299194336, 11.047858238220215, 11.616844177246094, 12.185830116271973, 12.754815101623535, 13.323801040649414, 13.892786026000977, 14.461771965026855, 15.030757904052734, 15.599742889404297, 16.16872787475586]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 8.0, 13.0, 10.0, 11.0, 7.0, 8.0, 19.0, 15.0, 27.0, 22.0, 35.0, 30.0, 42.0, 46.0, 49.0, 40.0, 40.0, 54.0, 39.0, 46.0, 55.0, 35.0, 46.0, 33.0, 43.0, 25.0, 29.0, 21.0, 19.0, 24.0, 19.0, 17.0, 13.0, 7.0, 16.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.278190612792969, -8.989839553833008, -8.70148754119873, -8.41313648223877, -8.124784469604492, -7.836432933807373, -7.548081398010254, -7.259730339050293, -6.971378326416016, -6.6830267906188965, -6.394675254821777, -6.106323719024658, -5.817972183227539, -5.52962064743042, -5.241269111633301, -4.95291805267334, -4.664566516876221, -4.376214981079102, -4.087863445281982, -3.7995119094848633, -3.511160373687744, -3.222808837890625, -2.934457540512085, -2.646106004714966, -2.3577544689178467, -2.0694029331207275, -1.7810513973236084, -1.4926999807357788, -1.2043484449386597, -0.9159969091415405, -0.6276454925537109, -0.3392939567565918, -0.050942420959472656, 0.2374090850353241, 0.5257605910301208, 0.8141120672225952, 1.1024636030197144, 1.3908151388168335, 1.679166555404663, 1.9675180912017822, 2.2558696269989014, 2.5442211627960205, 2.8325726985931396, 3.1209239959716797, 3.409275531768799, 3.697627067565918, 3.985978603363037, 4.274330139160156, 4.562681674957275, 4.8510332107543945, 5.139384746551514, 5.427736282348633, 5.716087818145752, 6.004439353942871, 6.292790412902832, 6.581142425537109, 6.86949348449707, 7.1578450202941895, 7.446196556091309, 7.734548091888428, 8.022899627685547, 8.311250686645508, 8.599602699279785, 8.887953758239746, 9.176305770874023]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 26.0, 30.0, 33.0, 47.0, 68.0, 120.0, 161.0, 285.0, 464.0, 791.0, 1302.0, 2275.0, 4217.0, 8657.0, 19114.0, 46770.0, 147216.0, 598489.0, 137082.0, 44708.0, 18527.0, 8523.0, 4209.0, 2254.0, 1236.0, 732.0, 413.0, 262.0, 158.0, 108.0, 91.0, 44.0, 32.0, 30.0, 19.0, 14.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.72265625, -6.5218505859375, -6.321044921875, -6.1202392578125, -5.91943359375, -5.7186279296875, -5.517822265625, -5.3170166015625, -5.1162109375, -4.9154052734375, -4.714599609375, -4.5137939453125, -4.31298828125, -4.1121826171875, -3.911376953125, -3.7105712890625, -3.509765625, -3.3089599609375, -3.108154296875, -2.9073486328125, -2.70654296875, -2.5057373046875, -2.304931640625, -2.1041259765625, -1.9033203125, -1.7025146484375, -1.501708984375, -1.3009033203125, -1.10009765625, -0.8992919921875, -0.698486328125, -0.4976806640625, -0.296875, -0.0960693359375, 0.104736328125, 0.3055419921875, 0.50634765625, 0.7071533203125, 0.907958984375, 1.1087646484375, 1.3095703125, 1.5103759765625, 1.711181640625, 1.9119873046875, 2.11279296875, 2.3135986328125, 2.514404296875, 2.7152099609375, 2.916015625, 3.1168212890625, 3.317626953125, 3.5184326171875, 3.71923828125, 3.9200439453125, 4.120849609375, 4.3216552734375, 4.5224609375, 4.7232666015625, 4.924072265625, 5.1248779296875, 5.32568359375, 5.5264892578125, 5.727294921875, 5.9281005859375, 6.12890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 8.0, 19.0, 21.0, 25.0, 21.0, 34.0, 21.0, 35.0, 39.0, 33.0, 45.0, 66.0, 45.0, 49.0, 48.0, 51.0, 42.0, 45.0, 39.0, 44.0, 38.0, 31.0, 34.0, 34.0, 27.0, 21.0, 16.0, 10.0, 12.0, 4.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.103607177734375, -1.06854248046875, -1.033477783203125, -0.9984130859375, -0.963348388671875, -0.92828369140625, -0.893218994140625, -0.858154296875, -0.823089599609375, -0.78802490234375, -0.752960205078125, -0.7178955078125, -0.682830810546875, -0.64776611328125, -0.612701416015625, -0.57763671875, -0.542572021484375, -0.50750732421875, -0.472442626953125, -0.4373779296875, -0.402313232421875, -0.36724853515625, -0.332183837890625, -0.297119140625, -0.262054443359375, -0.22698974609375, -0.191925048828125, -0.1568603515625, -0.121795654296875, -0.08673095703125, -0.051666259765625, -0.0166015625, 0.018463134765625, 0.05352783203125, 0.088592529296875, 0.1236572265625, 0.158721923828125, 0.19378662109375, 0.228851318359375, 0.263916015625, 0.298980712890625, 0.33404541015625, 0.369110107421875, 0.4041748046875, 0.439239501953125, 0.47430419921875, 0.509368896484375, 0.54443359375, 0.579498291015625, 0.61456298828125, 0.649627685546875, 0.6846923828125, 0.719757080078125, 0.75482177734375, 0.789886474609375, 0.824951171875, 0.860015869140625, 0.89508056640625, 0.930145263671875, 0.9652099609375, 1.000274658203125, 1.03533935546875, 1.070404052734375, 1.10546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 15.0, 14.0, 29.0, 30.0, 51.0, 39.0, 90.0, 116.0, 162.0, 268.0, 391.0, 622.0, 1212.0, 2948.0, 9629.0, 43544.0, 388448.0, 531701.0, 51696.0, 11077.0, 3239.0, 1318.0, 697.0, 362.0, 260.0, 169.0, 109.0, 82.0, 53.0, 54.0, 33.0, 23.0, 18.0, 14.0, 11.0, 3.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.9921875, -9.69873046875, -9.4052734375, -9.11181640625, -8.818359375, -8.52490234375, -8.2314453125, -7.93798828125, -7.64453125, -7.35107421875, -7.0576171875, -6.76416015625, -6.470703125, -6.17724609375, -5.8837890625, -5.59033203125, -5.296875, -5.00341796875, -4.7099609375, -4.41650390625, -4.123046875, -3.82958984375, -3.5361328125, -3.24267578125, -2.94921875, -2.65576171875, -2.3623046875, -2.06884765625, -1.775390625, -1.48193359375, -1.1884765625, -0.89501953125, -0.6015625, -0.30810546875, -0.0146484375, 0.27880859375, 0.572265625, 0.86572265625, 1.1591796875, 1.45263671875, 1.74609375, 2.03955078125, 2.3330078125, 2.62646484375, 2.919921875, 3.21337890625, 3.5068359375, 3.80029296875, 4.09375, 4.38720703125, 4.6806640625, 4.97412109375, 5.267578125, 5.56103515625, 5.8544921875, 6.14794921875, 6.44140625, 6.73486328125, 7.0283203125, 7.32177734375, 7.615234375, 7.90869140625, 8.2021484375, 8.49560546875, 8.7890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0, 8.0, 8.0, 12.0, 11.0, 16.0, 23.0, 17.0, 25.0, 16.0, 28.0, 30.0, 31.0, 41.0, 40.0, 55.0, 56.0, 54.0, 36.0, 42.0, 52.0, 47.0, 49.0, 29.0, 34.0, 30.0, 34.0, 22.0, 28.0, 21.0, 15.0, 12.0, 18.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.41802978515625, -4.2735595703125, -4.12908935546875, -3.984619140625, -3.84014892578125, -3.6956787109375, -3.55120849609375, -3.40673828125, -3.26226806640625, -3.1177978515625, -2.97332763671875, -2.828857421875, -2.68438720703125, -2.5399169921875, -2.39544677734375, -2.2509765625, -2.10650634765625, -1.9620361328125, -1.81756591796875, -1.673095703125, -1.52862548828125, -1.3841552734375, -1.23968505859375, -1.09521484375, -0.95074462890625, -0.8062744140625, -0.66180419921875, -0.517333984375, -0.37286376953125, -0.2283935546875, -0.08392333984375, 0.060546875, 0.20501708984375, 0.3494873046875, 0.49395751953125, 0.638427734375, 0.78289794921875, 0.9273681640625, 1.07183837890625, 1.21630859375, 1.36077880859375, 1.5052490234375, 1.64971923828125, 1.794189453125, 1.93865966796875, 2.0831298828125, 2.22760009765625, 2.3720703125, 2.51654052734375, 2.6610107421875, 2.80548095703125, 2.949951171875, 3.09442138671875, 3.2388916015625, 3.38336181640625, 3.52783203125, 3.67230224609375, 3.8167724609375, 3.96124267578125, 4.105712890625, 4.25018310546875, 4.3946533203125, 4.53912353515625, 4.68359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 24.0, 26.0, 61.0, 102.0, 310.0, 745.0, 2763.0, 14421.0, 195981.0, 796946.0, 30700.0, 4517.0, 1189.0, 401.0, 155.0, 83.0, 43.0, 21.0, 16.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6015625, -11.305419921875, -11.00927734375, -10.713134765625, -10.4169921875, -10.120849609375, -9.82470703125, -9.528564453125, -9.232421875, -8.936279296875, -8.64013671875, -8.343994140625, -8.0478515625, -7.751708984375, -7.45556640625, -7.159423828125, -6.86328125, -6.567138671875, -6.27099609375, -5.974853515625, -5.6787109375, -5.382568359375, -5.08642578125, -4.790283203125, -4.494140625, -4.197998046875, -3.90185546875, -3.605712890625, -3.3095703125, -3.013427734375, -2.71728515625, -2.421142578125, -2.125, -1.828857421875, -1.53271484375, -1.236572265625, -0.9404296875, -0.644287109375, -0.34814453125, -0.052001953125, 0.244140625, 0.540283203125, 0.83642578125, 1.132568359375, 1.4287109375, 1.724853515625, 2.02099609375, 2.317138671875, 2.61328125, 2.909423828125, 3.20556640625, 3.501708984375, 3.7978515625, 4.093994140625, 4.39013671875, 4.686279296875, 4.982421875, 5.278564453125, 5.57470703125, 5.870849609375, 6.1669921875, 6.463134765625, 6.75927734375, 7.055419921875, 7.3515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 12.0, 11.0, 22.0, 32.0, 48.0, 179.0, 448.0, 99.0, 52.0, 36.0, 21.0, 12.0, 8.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019092559814453125, -0.0018502622842788696, -0.0017912685871124268, -0.0017322748899459839, -0.001673281192779541, -0.0016142874956130981, -0.0015552937984466553, -0.0014963001012802124, -0.0014373064041137695, -0.0013783127069473267, -0.0013193190097808838, -0.001260325312614441, -0.001201331615447998, -0.0011423379182815552, -0.0010833442211151123, -0.0010243505239486694, -0.0009653568267822266, -0.0009063631296157837, -0.0008473694324493408, -0.000788375735282898, -0.0007293820381164551, -0.0006703883409500122, -0.0006113946437835693, -0.0005524009466171265, -0.0004934072494506836, -0.0004344135522842407, -0.00037541985511779785, -0.000316426157951355, -0.0002574324607849121, -0.00019843876361846924, -0.00013944506645202637, -8.04513692855835e-05, -2.1457672119140625e-05, 3.7536025047302246e-05, 9.652972221374512e-05, 0.000155523419380188, 0.00021451711654663086, 0.00027351081371307373, 0.0003325045108795166, 0.00039149820804595947, 0.00045049190521240234, 0.0005094856023788452, 0.0005684792995452881, 0.000627472996711731, 0.0006864666938781738, 0.0007454603910446167, 0.0008044540882110596, 0.0008634477853775024, 0.0009224414825439453, 0.0009814351797103882, 0.001040428876876831, 0.001099422574043274, 0.0011584162712097168, 0.0012174099683761597, 0.0012764036655426025, 0.0013353973627090454, 0.0013943910598754883, 0.0014533847570419312, 0.001512378454208374, 0.001571372151374817, 0.0016303658485412598, 0.0016893595457077026, 0.0017483532428741455, 0.0018073469400405884, 0.0018663406372070312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 8.0, 18.0, 26.0, 42.0, 50.0, 77.0, 117.0, 204.0, 361.0, 737.0, 1800.0, 6168.0, 30783.0, 408389.0, 554271.0, 35270.0, 6534.0, 1904.0, 749.0, 408.0, 211.0, 150.0, 71.0, 55.0, 43.0, 26.0, 11.0, 11.0, 8.0, 8.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375, -7.17034912109375, -6.9656982421875, -6.76104736328125, -6.556396484375, -6.35174560546875, -6.1470947265625, -5.94244384765625, -5.73779296875, -5.53314208984375, -5.3284912109375, -5.12384033203125, -4.919189453125, -4.71453857421875, -4.5098876953125, -4.30523681640625, -4.1005859375, -3.89593505859375, -3.6912841796875, -3.48663330078125, -3.281982421875, -3.07733154296875, -2.8726806640625, -2.66802978515625, -2.46337890625, -2.25872802734375, -2.0540771484375, -1.84942626953125, -1.644775390625, -1.44012451171875, -1.2354736328125, -1.03082275390625, -0.826171875, -0.62152099609375, -0.4168701171875, -0.21221923828125, -0.007568359375, 0.19708251953125, 0.4017333984375, 0.60638427734375, 0.81103515625, 1.01568603515625, 1.2203369140625, 1.42498779296875, 1.629638671875, 1.83428955078125, 2.0389404296875, 2.24359130859375, 2.4482421875, 2.65289306640625, 2.8575439453125, 3.06219482421875, 3.266845703125, 3.47149658203125, 3.6761474609375, 3.88079833984375, 4.08544921875, 4.29010009765625, 4.4947509765625, 4.69940185546875, 4.904052734375, 5.10870361328125, 5.3133544921875, 5.51800537109375, 5.72265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 7.0, 11.0, 13.0, 22.0, 22.0, 34.0, 71.0, 138.0, 229.0, 194.0, 87.0, 50.0, 24.0, 16.0, 13.0, 19.0, 7.0, 7.0, 4.0, 1.0, 4.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.24761962890625, -5.1007080078125, -4.95379638671875, -4.806884765625, -4.65997314453125, -4.5130615234375, -4.36614990234375, -4.21923828125, -4.07232666015625, -3.9254150390625, -3.77850341796875, -3.631591796875, -3.48468017578125, -3.3377685546875, -3.19085693359375, -3.0439453125, -2.89703369140625, -2.7501220703125, -2.60321044921875, -2.456298828125, -2.30938720703125, -2.1624755859375, -2.01556396484375, -1.86865234375, -1.72174072265625, -1.5748291015625, -1.42791748046875, -1.281005859375, -1.13409423828125, -0.9871826171875, -0.84027099609375, -0.693359375, -0.54644775390625, -0.3995361328125, -0.25262451171875, -0.105712890625, 0.04119873046875, 0.1881103515625, 0.33502197265625, 0.48193359375, 0.62884521484375, 0.7757568359375, 0.92266845703125, 1.069580078125, 1.21649169921875, 1.3634033203125, 1.51031494140625, 1.6572265625, 1.80413818359375, 1.9510498046875, 2.09796142578125, 2.244873046875, 2.39178466796875, 2.5386962890625, 2.68560791015625, 2.83251953125, 2.97943115234375, 3.1263427734375, 3.27325439453125, 3.420166015625, 3.56707763671875, 3.7139892578125, 3.86090087890625, 4.0078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 12.0, 39.0, 97.0, 209.0, 259.0, 215.0, 109.0, 35.0, 21.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.82325744628906, -69.84823608398438, -66.87322235107422, -63.89820098876953, -60.92318344116211, -57.94816589355469, -54.97314453125, -51.99812698364258, -49.023109436035156, -46.048091888427734, -43.07307434082031, -40.098052978515625, -37.1230354309082, -34.14801788330078, -31.172998428344727, -28.197978973388672, -25.22296142578125, -22.247943878173828, -19.272924423217773, -16.29790496826172, -13.322887420654297, -10.347868919372559, -7.37285041809082, -4.397830963134766, -1.4228134155273438, 1.5522050857543945, 4.527223587036133, 7.502242088317871, 10.47726058959961, 13.452279090881348, 16.427297592163086, 19.40231704711914, 22.377342224121094, 25.352359771728516, 28.32737922668457, 31.302398681640625, 34.27741622924805, 37.25243377685547, 40.227455139160156, 43.20247268676758, 46.177490234375, 49.15250778198242, 52.127525329589844, 55.10254669189453, 58.07756423950195, 61.052581787109375, 64.02760314941406, 67.00262451171875, 69.9776382446289, 72.9526596069336, 75.92767333984375, 78.90269470214844, 81.87771606445312, 84.85272979736328, 87.82775115966797, 90.80276489257812, 93.77778625488281, 96.7528076171875, 99.72782135009766, 102.70284271240234, 105.6778564453125, 108.65287780761719, 111.62789916992188, 114.60292053222656, 117.57793426513672]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 15.0, 15.0, 12.0, 9.0, 20.0, 29.0, 21.0, 30.0, 35.0, 31.0, 26.0, 38.0, 42.0, 45.0, 45.0, 44.0, 42.0, 31.0, 36.0, 36.0, 44.0, 24.0, 28.0, 24.0, 32.0, 33.0, 15.0, 18.0, 21.0, 21.0, 18.0, 15.0, 10.0, 12.0, 7.0, 8.0, 5.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.64881706237793, -21.933399200439453, -21.21798324584961, -20.502565383911133, -19.787147521972656, -19.071731567382812, -18.356313705444336, -17.64089584350586, -16.925479888916016, -16.21006202697754, -15.494645118713379, -14.779228210449219, -14.063810348510742, -13.348393440246582, -12.632976531982422, -11.917558670043945, -11.202140808105469, -10.486723899841309, -9.771306037902832, -9.055889129638672, -8.340471267700195, -7.625054359436035, -6.909637451171875, -6.194220066070557, -5.478802680969238, -4.76338529586792, -4.047967910766602, -3.3325510025024414, -2.617133617401123, -1.9017162322998047, -1.1862993240356445, -0.47088193893432617, 0.244537353515625, 0.9599546194076538, 1.6753718852996826, 2.390789031982422, 3.1062064170837402, 3.8216238021850586, 4.537040710449219, 5.252458095550537, 5.9678754806518555, 6.683292865753174, 7.398710250854492, 8.114127159118652, 8.829544067382812, 9.544961929321289, 10.26037883758545, 10.97579574584961, 11.691213607788086, 12.406630516052246, 13.122048377990723, 13.837465286254883, 14.55288314819336, 15.26830005645752, 15.98371696472168, 16.699134826660156, 17.41455078125, 18.129968643188477, 18.84538459777832, 19.560802459716797, 20.276220321655273, 20.99163818359375, 21.707054138183594, 22.42247200012207, 23.137889862060547]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 15.0, 16.0, 26.0, 39.0, 76.0, 93.0, 146.0, 266.0, 456.0, 722.0, 1289.0, 2652.0, 5465.0, 13014.0, 37836.0, 207206.0, 3649163.0, 212744.0, 38661.0, 13147.0, 5496.0, 2663.0, 1290.0, 723.0, 418.0, 227.0, 147.0, 94.0, 59.0, 39.0, 29.0, 14.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.8359375, -7.615234375, -7.39453125, -7.173828125, -6.953125, -6.732421875, -6.51171875, -6.291015625, -6.0703125, -5.849609375, -5.62890625, -5.408203125, -5.1875, -4.966796875, -4.74609375, -4.525390625, -4.3046875, -4.083984375, -3.86328125, -3.642578125, -3.421875, -3.201171875, -2.98046875, -2.759765625, -2.5390625, -2.318359375, -2.09765625, -1.876953125, -1.65625, -1.435546875, -1.21484375, -0.994140625, -0.7734375, -0.552734375, -0.33203125, -0.111328125, 0.109375, 0.330078125, 0.55078125, 0.771484375, 0.9921875, 1.212890625, 1.43359375, 1.654296875, 1.875, 2.095703125, 2.31640625, 2.537109375, 2.7578125, 2.978515625, 3.19921875, 3.419921875, 3.640625, 3.861328125, 4.08203125, 4.302734375, 4.5234375, 4.744140625, 4.96484375, 5.185546875, 5.40625, 5.626953125, 5.84765625, 6.068359375, 6.2890625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 6.0, 4.0, 14.0, 6.0, 7.0, 13.0, 18.0, 16.0, 18.0, 20.0, 33.0, 24.0, 51.0, 34.0, 40.0, 29.0, 43.0, 44.0, 55.0, 36.0, 35.0, 37.0, 40.0, 51.0, 36.0, 44.0, 31.0, 30.0, 29.0, 28.0, 26.0, 17.0, 8.0, 14.0, 11.0, 10.0, 6.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.1650390625, -1.1313018798828125, -1.097564697265625, -1.0638275146484375, -1.03009033203125, -0.9963531494140625, -0.962615966796875, -0.9288787841796875, -0.8951416015625, -0.8614044189453125, -0.827667236328125, -0.7939300537109375, -0.76019287109375, -0.7264556884765625, -0.692718505859375, -0.6589813232421875, -0.625244140625, -0.5915069580078125, -0.557769775390625, -0.5240325927734375, -0.49029541015625, -0.4565582275390625, -0.422821044921875, -0.3890838623046875, -0.3553466796875, -0.3216094970703125, -0.287872314453125, -0.2541351318359375, -0.22039794921875, -0.1866607666015625, -0.152923583984375, -0.1191864013671875, -0.08544921875, -0.0517120361328125, -0.017974853515625, 0.0157623291015625, 0.04949951171875, 0.0832366943359375, 0.116973876953125, 0.1507110595703125, 0.1844482421875, 0.2181854248046875, 0.251922607421875, 0.2856597900390625, 0.31939697265625, 0.3531341552734375, 0.386871337890625, 0.4206085205078125, 0.454345703125, 0.4880828857421875, 0.521820068359375, 0.5555572509765625, 0.58929443359375, 0.6230316162109375, 0.656768798828125, 0.6905059814453125, 0.7242431640625, 0.7579803466796875, 0.791717529296875, 0.8254547119140625, 0.85919189453125, 0.8929290771484375, 0.926666259765625, 0.9604034423828125, 0.994140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 9.0, 14.0, 13.0, 17.0, 30.0, 56.0, 59.0, 96.0, 130.0, 178.0, 309.0, 489.0, 902.0, 1904.0, 4527.0, 13595.0, 52184.0, 508627.0, 3442933.0, 129386.0, 25334.0, 7699.0, 2849.0, 1221.0, 608.0, 339.0, 249.0, 177.0, 107.0, 70.0, 55.0, 40.0, 19.0, 16.0, 14.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.22906494140625, -7.9815673828125, -7.73406982421875, -7.486572265625, -7.23907470703125, -6.9915771484375, -6.74407958984375, -6.49658203125, -6.24908447265625, -6.0015869140625, -5.75408935546875, -5.506591796875, -5.25909423828125, -5.0115966796875, -4.76409912109375, -4.5166015625, -4.26910400390625, -4.0216064453125, -3.77410888671875, -3.526611328125, -3.27911376953125, -3.0316162109375, -2.78411865234375, -2.53662109375, -2.28912353515625, -2.0416259765625, -1.79412841796875, -1.546630859375, -1.29913330078125, -1.0516357421875, -0.80413818359375, -0.556640625, -0.30914306640625, -0.0616455078125, 0.18585205078125, 0.433349609375, 0.68084716796875, 0.9283447265625, 1.17584228515625, 1.42333984375, 1.67083740234375, 1.9183349609375, 2.16583251953125, 2.413330078125, 2.66082763671875, 2.9083251953125, 3.15582275390625, 3.4033203125, 3.65081787109375, 3.8983154296875, 4.14581298828125, 4.393310546875, 4.64080810546875, 4.8883056640625, 5.13580322265625, 5.38330078125, 5.63079833984375, 5.8782958984375, 6.12579345703125, 6.373291015625, 6.62078857421875, 6.8682861328125, 7.11578369140625, 7.36328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 15.0, 17.0, 25.0, 24.0, 55.0, 84.0, 207.0, 575.0, 2022.0, 579.0, 208.0, 91.0, 61.0, 45.0, 9.0, 20.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.114410400390625, -3.99835205078125, -3.882293701171875, -3.7662353515625, -3.650177001953125, -3.53411865234375, -3.418060302734375, -3.302001953125, -3.185943603515625, -3.06988525390625, -2.953826904296875, -2.8377685546875, -2.721710205078125, -2.60565185546875, -2.489593505859375, -2.37353515625, -2.257476806640625, -2.14141845703125, -2.025360107421875, -1.9093017578125, -1.793243408203125, -1.67718505859375, -1.561126708984375, -1.445068359375, -1.329010009765625, -1.21295166015625, -1.096893310546875, -0.9808349609375, -0.864776611328125, -0.74871826171875, -0.632659912109375, -0.5166015625, -0.400543212890625, -0.28448486328125, -0.168426513671875, -0.0523681640625, 0.063690185546875, 0.17974853515625, 0.295806884765625, 0.411865234375, 0.527923583984375, 0.64398193359375, 0.760040283203125, 0.8760986328125, 0.992156982421875, 1.10821533203125, 1.224273681640625, 1.34033203125, 1.456390380859375, 1.57244873046875, 1.688507080078125, 1.8045654296875, 1.920623779296875, 2.03668212890625, 2.152740478515625, 2.268798828125, 2.384857177734375, 2.50091552734375, 2.616973876953125, 2.7330322265625, 2.849090576171875, 2.96514892578125, 3.081207275390625, 3.197265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 12.0, 13.0, 13.0, 36.0, 49.0, 75.0, 107.0, 133.0, 114.0, 149.0, 105.0, 66.0, 45.0, 33.0, 21.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.04202651977539, -22.510051727294922, -21.978076934814453, -21.446102142333984, -20.914127349853516, -20.38215446472168, -19.85017967224121, -19.318204879760742, -18.786230087280273, -18.254255294799805, -17.722280502319336, -17.190305709838867, -16.65833282470703, -16.126358032226562, -15.594383239746094, -15.062408447265625, -14.530433654785156, -13.998458862304688, -13.466484069824219, -12.934510231018066, -12.402535438537598, -11.870560646057129, -11.338586807250977, -10.806612014770508, -10.274637222290039, -9.74266242980957, -9.210687637329102, -8.67871379852295, -8.14673900604248, -7.614764213562012, -7.082789897918701, -6.550815582275391, -6.018838882446289, -5.48686408996582, -4.95488977432251, -4.422915458679199, -3.8909406661987305, -3.358966112136841, -2.826991558074951, -2.2950170040130615, -1.7630424499511719, -1.2310678958892822, -0.6990933418273926, -0.16711878776550293, 0.3648557662963867, 0.8968303203582764, 1.428804874420166, 1.9607794284820557, 2.4927539825439453, 3.024728536605835, 3.5567030906677246, 4.088677406311035, 4.620652198791504, 5.152626991271973, 5.684601306915283, 6.216575622558594, 6.7485504150390625, 7.280525207519531, 7.812499523162842, 8.344473838806152, 8.876448631286621, 9.40842342376709, 9.940397262573242, 10.472372055053711, 11.00434684753418]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 13.0, 11.0, 22.0, 15.0, 22.0, 16.0, 14.0, 17.0, 34.0, 22.0, 40.0, 34.0, 44.0, 36.0, 44.0, 44.0, 35.0, 50.0, 36.0, 41.0, 40.0, 30.0, 31.0, 37.0, 38.0, 27.0, 32.0, 15.0, 22.0, 20.0, 22.0, 14.0, 13.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.785093784332275, -6.556012153625488, -6.326930522918701, -6.097848892211914, -5.868766784667969, -5.639685153961182, -5.4106035232543945, -5.181521892547607, -4.95244026184082, -4.723358631134033, -4.494277000427246, -4.265194892883301, -4.036113262176514, -3.8070316314697266, -3.5779500007629395, -3.3488683700561523, -3.119786262512207, -2.89070463180542, -2.6616227626800537, -2.4325411319732666, -2.2034592628479004, -1.9743776321411133, -1.7452960014343262, -1.5162142515182495, -1.2871325016021729, -1.0580507516860962, -0.8289690613746643, -0.5998873710632324, -0.37080562114715576, -0.1417238712310791, 0.08735775947570801, 0.31643950939178467, 0.5455207824707031, 0.7746025323867798, 1.0036842823028564, 1.2327659130096436, 1.4618476629257202, 1.6909294128417969, 1.920011043548584, 2.149092674255371, 2.3781745433807373, 2.6072561740875244, 2.8363380432128906, 3.0654196739196777, 3.294501304626465, 3.523583173751831, 3.752664804458618, 3.9817466735839844, 4.2108283042907715, 4.439909934997559, 4.668991565704346, 4.898073196411133, 5.127155303955078, 5.356236934661865, 5.585318565368652, 5.8144001960754395, 6.043481826782227, 6.272563457489014, 6.501645088195801, 6.730727195739746, 6.959808826446533, 7.18889045715332, 7.417972087860107, 7.6470537185668945, 7.87613582611084]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 12.0, 15.0, 13.0, 31.0, 33.0, 60.0, 80.0, 163.0, 268.0, 578.0, 1142.0, 2805.0, 7529.0, 21849.0, 77187.0, 522381.0, 331079.0, 56029.0, 17122.0, 5877.0, 2245.0, 991.0, 459.0, 232.0, 125.0, 89.0, 50.0, 35.0, 23.0, 14.0, 9.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.720458984375, -6.48779296875, -6.255126953125, -6.0224609375, -5.789794921875, -5.55712890625, -5.324462890625, -5.091796875, -4.859130859375, -4.62646484375, -4.393798828125, -4.1611328125, -3.928466796875, -3.69580078125, -3.463134765625, -3.23046875, -2.997802734375, -2.76513671875, -2.532470703125, -2.2998046875, -2.067138671875, -1.83447265625, -1.601806640625, -1.369140625, -1.136474609375, -0.90380859375, -0.671142578125, -0.4384765625, -0.205810546875, 0.02685546875, 0.259521484375, 0.4921875, 0.724853515625, 0.95751953125, 1.190185546875, 1.4228515625, 1.655517578125, 1.88818359375, 2.120849609375, 2.353515625, 2.586181640625, 2.81884765625, 3.051513671875, 3.2841796875, 3.516845703125, 3.74951171875, 3.982177734375, 4.21484375, 4.447509765625, 4.68017578125, 4.912841796875, 5.1455078125, 5.378173828125, 5.61083984375, 5.843505859375, 6.076171875, 6.308837890625, 6.54150390625, 6.774169921875, 7.0068359375, 7.239501953125, 7.47216796875, 7.704833984375, 7.9375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 12.0, 9.0, 9.0, 21.0, 18.0, 14.0, 24.0, 31.0, 28.0, 40.0, 41.0, 33.0, 45.0, 41.0, 39.0, 37.0, 49.0, 48.0, 39.0, 49.0, 40.0, 37.0, 51.0, 30.0, 30.0, 24.0, 31.0, 20.0, 17.0, 12.0, 12.0, 14.0, 9.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1796875, -1.1433258056640625, -1.106964111328125, -1.0706024169921875, -1.03424072265625, -0.9978790283203125, -0.961517333984375, -0.9251556396484375, -0.8887939453125, -0.8524322509765625, -0.816070556640625, -0.7797088623046875, -0.74334716796875, -0.7069854736328125, -0.670623779296875, -0.6342620849609375, -0.597900390625, -0.5615386962890625, -0.525177001953125, -0.4888153076171875, -0.45245361328125, -0.4160919189453125, -0.379730224609375, -0.3433685302734375, -0.3070068359375, -0.2706451416015625, -0.234283447265625, -0.1979217529296875, -0.16156005859375, -0.1251983642578125, -0.088836669921875, -0.0524749755859375, -0.01611328125, 0.0202484130859375, 0.056610107421875, 0.0929718017578125, 0.12933349609375, 0.1656951904296875, 0.202056884765625, 0.2384185791015625, 0.2747802734375, 0.3111419677734375, 0.347503662109375, 0.3838653564453125, 0.42022705078125, 0.4565887451171875, 0.492950439453125, 0.5293121337890625, 0.565673828125, 0.6020355224609375, 0.638397216796875, 0.6747589111328125, 0.71112060546875, 0.7474822998046875, 0.783843994140625, 0.8202056884765625, 0.8565673828125, 0.8929290771484375, 0.929290771484375, 0.9656524658203125, 1.00201416015625, 1.0383758544921875, 1.074737548828125, 1.1110992431640625, 1.1474609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 12.0, 12.0, 9.0, 15.0, 20.0, 45.0, 52.0, 87.0, 163.0, 218.0, 383.0, 739.0, 1739.0, 4629.0, 15018.0, 57573.0, 639398.0, 272988.0, 38471.0, 10741.0, 3415.0, 1338.0, 639.0, 343.0, 184.0, 108.0, 66.0, 53.0, 31.0, 24.0, 11.0, 6.0, 4.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.082275390625, -6.79736328125, -6.512451171875, -6.2275390625, -5.942626953125, -5.65771484375, -5.372802734375, -5.087890625, -4.802978515625, -4.51806640625, -4.233154296875, -3.9482421875, -3.663330078125, -3.37841796875, -3.093505859375, -2.80859375, -2.523681640625, -2.23876953125, -1.953857421875, -1.6689453125, -1.384033203125, -1.09912109375, -0.814208984375, -0.529296875, -0.244384765625, 0.04052734375, 0.325439453125, 0.6103515625, 0.895263671875, 1.18017578125, 1.465087890625, 1.75, 2.034912109375, 2.31982421875, 2.604736328125, 2.8896484375, 3.174560546875, 3.45947265625, 3.744384765625, 4.029296875, 4.314208984375, 4.59912109375, 4.884033203125, 5.1689453125, 5.453857421875, 5.73876953125, 6.023681640625, 6.30859375, 6.593505859375, 6.87841796875, 7.163330078125, 7.4482421875, 7.733154296875, 8.01806640625, 8.302978515625, 8.587890625, 8.872802734375, 9.15771484375, 9.442626953125, 9.7275390625, 10.012451171875, 10.29736328125, 10.582275390625, 10.8671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 16.0, 14.0, 21.0, 34.0, 38.0, 37.0, 55.0, 57.0, 71.0, 72.0, 81.0, 71.0, 52.0, 62.0, 57.0, 47.0, 38.0, 38.0, 27.0, 20.0, 12.0, 5.0, 10.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8828125, -6.6414794921875, -6.400146484375, -6.1588134765625, -5.91748046875, -5.6761474609375, -5.434814453125, -5.1934814453125, -4.9521484375, -4.7108154296875, -4.469482421875, -4.2281494140625, -3.98681640625, -3.7454833984375, -3.504150390625, -3.2628173828125, -3.021484375, -2.7801513671875, -2.538818359375, -2.2974853515625, -2.05615234375, -1.8148193359375, -1.573486328125, -1.3321533203125, -1.0908203125, -0.8494873046875, -0.608154296875, -0.3668212890625, -0.12548828125, 0.1158447265625, 0.357177734375, 0.5985107421875, 0.83984375, 1.0811767578125, 1.322509765625, 1.5638427734375, 1.80517578125, 2.0465087890625, 2.287841796875, 2.5291748046875, 2.7705078125, 3.0118408203125, 3.253173828125, 3.4945068359375, 3.73583984375, 3.9771728515625, 4.218505859375, 4.4598388671875, 4.701171875, 4.9425048828125, 5.183837890625, 5.4251708984375, 5.66650390625, 5.9078369140625, 6.149169921875, 6.3905029296875, 6.6318359375, 6.8731689453125, 7.114501953125, 7.3558349609375, 7.59716796875, 7.8385009765625, 8.079833984375, 8.3211669921875, 8.5625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 13.0, 17.0, 32.0, 53.0, 78.0, 154.0, 254.0, 489.0, 947.0, 2026.0, 4805.0, 12329.0, 32944.0, 118666.0, 637778.0, 172125.0, 40798.0, 14614.0, 5680.0, 2461.0, 1050.0, 526.0, 287.0, 160.0, 106.0, 62.0, 34.0, 23.0, 15.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.55999755859375, -2.4637451171875, -2.36749267578125, -2.271240234375, -2.17498779296875, -2.0787353515625, -1.98248291015625, -1.88623046875, -1.78997802734375, -1.6937255859375, -1.59747314453125, -1.501220703125, -1.40496826171875, -1.3087158203125, -1.21246337890625, -1.1162109375, -1.01995849609375, -0.9237060546875, -0.82745361328125, -0.731201171875, -0.63494873046875, -0.5386962890625, -0.44244384765625, -0.34619140625, -0.24993896484375, -0.1536865234375, -0.05743408203125, 0.038818359375, 0.13507080078125, 0.2313232421875, 0.32757568359375, 0.423828125, 0.52008056640625, 0.6163330078125, 0.71258544921875, 0.808837890625, 0.90509033203125, 1.0013427734375, 1.09759521484375, 1.19384765625, 1.29010009765625, 1.3863525390625, 1.48260498046875, 1.578857421875, 1.67510986328125, 1.7713623046875, 1.86761474609375, 1.9638671875, 2.06011962890625, 2.1563720703125, 2.25262451171875, 2.348876953125, 2.44512939453125, 2.5413818359375, 2.63763427734375, 2.73388671875, 2.83013916015625, 2.9263916015625, 3.02264404296875, 3.118896484375, 3.21514892578125, 3.3114013671875, 3.40765380859375, 3.50390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 15.0, 9.0, 16.0, 22.0, 28.0, 80.0, 300.0, 305.0, 85.0, 38.0, 14.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00139617919921875, -0.0013573914766311646, -0.001318603754043579, -0.0012798160314559937, -0.0012410283088684082, -0.0012022405862808228, -0.0011634528636932373, -0.0011246651411056519, -0.0010858774185180664, -0.001047089695930481, -0.0010083019733428955, -0.0009695142507553101, -0.0009307265281677246, -0.0008919388055801392, -0.0008531510829925537, -0.0008143633604049683, -0.0007755756378173828, -0.0007367879152297974, -0.0006980001926422119, -0.0006592124700546265, -0.000620424747467041, -0.0005816370248794556, -0.0005428493022918701, -0.0005040615797042847, -0.0004652738571166992, -0.00042648613452911377, -0.0003876984119415283, -0.00034891068935394287, -0.0003101229667663574, -0.00027133524417877197, -0.00023254752159118652, -0.00019375979900360107, -0.00015497207641601562, -0.00011618435382843018, -7.739663124084473e-05, -3.860890865325928e-05, 1.7881393432617188e-07, 3.896653652191162e-05, 7.775425910949707e-05, 0.00011654198169708252, 0.00015532970428466797, 0.00019411742687225342, 0.00023290514945983887, 0.0002716928720474243, 0.00031048059463500977, 0.0003492683172225952, 0.00038805603981018066, 0.0004268437623977661, 0.00046563148498535156, 0.000504419207572937, 0.0005432069301605225, 0.0005819946527481079, 0.0006207823753356934, 0.0006595700979232788, 0.0006983578205108643, 0.0007371455430984497, 0.0007759332656860352, 0.0008147209882736206, 0.0008535087108612061, 0.0008922964334487915, 0.000931084156036377, 0.0009698718786239624, 0.0010086596012115479, 0.0010474473237991333, 0.0010862350463867188]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 13.0, 13.0, 20.0, 29.0, 38.0, 62.0, 90.0, 133.0, 219.0, 375.0, 665.0, 1278.0, 2572.0, 5755.0, 13693.0, 34474.0, 120705.0, 628399.0, 169885.0, 41326.0, 15890.0, 6668.0, 2891.0, 1444.0, 777.0, 413.0, 253.0, 144.0, 100.0, 76.0, 42.0, 26.0, 21.0, 8.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.073272705078125, -1.99224853515625, -1.911224365234375, -1.8302001953125, -1.749176025390625, -1.66815185546875, -1.587127685546875, -1.506103515625, -1.425079345703125, -1.34405517578125, -1.263031005859375, -1.1820068359375, -1.100982666015625, -1.01995849609375, -0.938934326171875, -0.85791015625, -0.776885986328125, -0.69586181640625, -0.614837646484375, -0.5338134765625, -0.452789306640625, -0.37176513671875, -0.290740966796875, -0.209716796875, -0.128692626953125, -0.04766845703125, 0.033355712890625, 0.1143798828125, 0.195404052734375, 0.27642822265625, 0.357452392578125, 0.4384765625, 0.519500732421875, 0.60052490234375, 0.681549072265625, 0.7625732421875, 0.843597412109375, 0.92462158203125, 1.005645751953125, 1.086669921875, 1.167694091796875, 1.24871826171875, 1.329742431640625, 1.4107666015625, 1.491790771484375, 1.57281494140625, 1.653839111328125, 1.73486328125, 1.815887451171875, 1.89691162109375, 1.977935791015625, 2.0589599609375, 2.139984130859375, 2.22100830078125, 2.302032470703125, 2.383056640625, 2.464080810546875, 2.54510498046875, 2.626129150390625, 2.7071533203125, 2.788177490234375, 2.86920166015625, 2.950225830078125, 3.03125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 1.0, 7.0, 7.0, 9.0, 11.0, 14.0, 11.0, 20.0, 20.0, 37.0, 49.0, 86.0, 114.0, 130.0, 119.0, 96.0, 67.0, 38.0, 23.0, 16.0, 17.0, 16.0, 17.0, 10.0, 4.0, 9.0, 4.0, 7.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8563385009765625, -1.791778564453125, -1.7272186279296875, -1.66265869140625, -1.5980987548828125, -1.533538818359375, -1.4689788818359375, -1.4044189453125, -1.3398590087890625, -1.275299072265625, -1.2107391357421875, -1.14617919921875, -1.0816192626953125, -1.017059326171875, -0.9524993896484375, -0.887939453125, -0.8233795166015625, -0.758819580078125, -0.6942596435546875, -0.62969970703125, -0.5651397705078125, -0.500579833984375, -0.4360198974609375, -0.3714599609375, -0.3069000244140625, -0.242340087890625, -0.1777801513671875, -0.11322021484375, -0.0486602783203125, 0.015899658203125, 0.0804595947265625, 0.14501953125, 0.2095794677734375, 0.274139404296875, 0.3386993408203125, 0.40325927734375, 0.4678192138671875, 0.532379150390625, 0.5969390869140625, 0.6614990234375, 0.7260589599609375, 0.790618896484375, 0.8551788330078125, 0.91973876953125, 0.9842987060546875, 1.048858642578125, 1.1134185791015625, 1.177978515625, 1.2425384521484375, 1.307098388671875, 1.3716583251953125, 1.43621826171875, 1.5007781982421875, 1.565338134765625, 1.6298980712890625, 1.6944580078125, 1.7590179443359375, 1.823577880859375, 1.8881378173828125, 1.95269775390625, 2.0172576904296875, 2.081817626953125, 2.1463775634765625, 2.2109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 21.0, 29.0, 40.0, 63.0, 88.0, 130.0, 137.0, 104.0, 107.0, 83.0, 72.0, 47.0, 24.0, 17.0, 8.0, 10.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31786346435547, -27.983177185058594, -26.64849090576172, -25.313804626464844, -23.9791202545166, -22.644433975219727, -21.30974769592285, -19.97506332397461, -18.640377044677734, -17.30569076538086, -15.9710054397583, -14.636319160461426, -13.301633834838867, -11.966947555541992, -10.632261276245117, -9.297575950622559, -7.962888717651367, -6.62820291519165, -5.293517112731934, -3.9588308334350586, -2.624145030975342, -1.289459228515625, 0.04522705078125, 1.3799123764038086, 2.7145986557006836, 4.0492844581604, 5.383970260620117, 6.718656539916992, 8.053342819213867, 9.388028144836426, 10.7227144241333, 12.05739974975586, 13.392086029052734, 14.72677230834961, 16.061458587646484, 17.39614486694336, 18.7308292388916, 20.065515518188477, 21.40020179748535, 22.734886169433594, 24.06957244873047, 25.404258728027344, 26.73894500732422, 28.073631286621094, 29.408315658569336, 30.74300193786621, 32.07769012451172, 33.41237258911133, 34.74706268310547, 36.081748962402344, 37.41643524169922, 38.751121520996094, 40.08580780029297, 41.420494079589844, 42.75518035888672, 44.08986282348633, 45.4245491027832, 46.75923538208008, 48.09392166137695, 49.42860794067383, 50.7632942199707, 52.09797668457031, 53.43266296386719, 54.76734924316406, 56.10203552246094]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 10.0, 6.0, 9.0, 10.0, 9.0, 7.0, 17.0, 19.0, 15.0, 25.0, 26.0, 27.0, 22.0, 24.0, 28.0, 33.0, 35.0, 40.0, 42.0, 41.0, 41.0, 50.0, 30.0, 45.0, 32.0, 41.0, 48.0, 28.0, 30.0, 29.0, 23.0, 18.0, 23.0, 21.0, 14.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.662212371826172, -20.99093246459961, -20.319652557373047, -19.648372650146484, -18.977092742919922, -18.30581283569336, -17.634532928466797, -16.963253021240234, -16.291973114013672, -15.62069320678711, -14.949413299560547, -14.278133392333984, -13.606853485107422, -12.93557357788086, -12.264294624328613, -11.59301471710205, -10.921735763549805, -10.250455856323242, -9.57917594909668, -8.907896041870117, -8.236616134643555, -7.56533670425415, -6.894057273864746, -6.222777366638184, -5.551497459411621, -4.880217552185059, -4.208937644958496, -3.537658214569092, -2.8663783073425293, -2.195098400115967, -1.5238189697265625, -0.8525390625, -0.1812591552734375, 0.49002063274383545, 1.1613004207611084, 1.8325800895690918, 2.5038599967956543, 3.175139904022217, 3.846419334411621, 4.517699241638184, 5.188979148864746, 5.860259056091309, 6.531538963317871, 7.202818393707275, 7.874098300933838, 8.545377731323242, 9.216657638549805, 9.887937545776367, 10.55921745300293, 11.230497360229492, 11.901777267456055, 12.573057174682617, 13.24433708190918, 13.915616989135742, 14.586895942687988, 15.25817584991455, 15.929455757141113, 16.60073471069336, 17.272014617919922, 17.943294525146484, 18.614574432373047, 19.28585433959961, 19.957134246826172, 20.628414154052734, 21.299694061279297]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 6.0, 11.0, 14.0, 25.0, 33.0, 32.0, 53.0, 117.0, 168.0, 288.0, 498.0, 852.0, 1595.0, 2881.0, 6498.0, 15591.0, 50177.0, 434826.0, 3531982.0, 105058.0, 25262.0, 9501.0, 4259.0, 1994.0, 1085.0, 558.0, 349.0, 202.0, 129.0, 81.0, 43.0, 33.0, 15.0, 15.0, 18.0, 11.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -6.99493408203125, -6.7281494140625, -6.46136474609375, -6.194580078125, -5.92779541015625, -5.6610107421875, -5.39422607421875, -5.12744140625, -4.86065673828125, -4.5938720703125, -4.32708740234375, -4.060302734375, -3.79351806640625, -3.5267333984375, -3.25994873046875, -2.9931640625, -2.72637939453125, -2.4595947265625, -2.19281005859375, -1.926025390625, -1.65924072265625, -1.3924560546875, -1.12567138671875, -0.85888671875, -0.59210205078125, -0.3253173828125, -0.05853271484375, 0.208251953125, 0.47503662109375, 0.7418212890625, 1.00860595703125, 1.275390625, 1.54217529296875, 1.8089599609375, 2.07574462890625, 2.342529296875, 2.60931396484375, 2.8760986328125, 3.14288330078125, 3.40966796875, 3.67645263671875, 3.9432373046875, 4.21002197265625, 4.476806640625, 4.74359130859375, 5.0103759765625, 5.27716064453125, 5.5439453125, 5.81072998046875, 6.0775146484375, 6.34429931640625, 6.611083984375, 6.87786865234375, 7.1446533203125, 7.41143798828125, 7.67822265625, 7.94500732421875, 8.2117919921875, 8.47857666015625, 8.745361328125, 9.01214599609375, 9.2789306640625, 9.54571533203125, 9.8125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 4.0, 8.0, 8.0, 5.0, 13.0, 9.0, 11.0, 20.0, 13.0, 22.0, 24.0, 28.0, 24.0, 29.0, 30.0, 29.0, 36.0, 37.0, 45.0, 40.0, 37.0, 46.0, 36.0, 24.0, 40.0, 47.0, 45.0, 46.0, 34.0, 26.0, 14.0, 19.0, 29.0, 20.0, 20.0, 15.0, 13.0, 10.0, 7.0, 9.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.072265625, -1.0380859375, -1.00390625, -0.9697265625, -0.935546875, -0.9013671875, -0.8671875, -0.8330078125, -0.798828125, -0.7646484375, -0.73046875, -0.6962890625, -0.662109375, -0.6279296875, -0.59375, -0.5595703125, -0.525390625, -0.4912109375, -0.45703125, -0.4228515625, -0.388671875, -0.3544921875, -0.3203125, -0.2861328125, -0.251953125, -0.2177734375, -0.18359375, -0.1494140625, -0.115234375, -0.0810546875, -0.046875, -0.0126953125, 0.021484375, 0.0556640625, 0.08984375, 0.1240234375, 0.158203125, 0.1923828125, 0.2265625, 0.2607421875, 0.294921875, 0.3291015625, 0.36328125, 0.3974609375, 0.431640625, 0.4658203125, 0.5, 0.5341796875, 0.568359375, 0.6025390625, 0.63671875, 0.6708984375, 0.705078125, 0.7392578125, 0.7734375, 0.8076171875, 0.841796875, 0.8759765625, 0.91015625, 0.9443359375, 0.978515625, 1.0126953125, 1.046875, 1.0810546875, 1.115234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 4.0, 7.0, 11.0, 16.0, 23.0, 31.0, 42.0, 60.0, 103.0, 123.0, 190.0, 282.0, 423.0, 747.0, 1092.0, 1804.0, 3010.0, 4952.0, 9298.0, 17681.0, 39534.0, 114630.0, 652570.0, 3020372.0, 213342.0, 60778.0, 24735.0, 12120.0, 6481.0, 3627.0, 2204.0, 1391.0, 912.0, 550.0, 364.0, 242.0, 149.0, 115.0, 80.0, 54.0, 40.0, 28.0, 31.0, 9.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.61102294921875, -5.4368896484375, -5.26275634765625, -5.088623046875, -4.91448974609375, -4.7403564453125, -4.56622314453125, -4.39208984375, -4.21795654296875, -4.0438232421875, -3.86968994140625, -3.695556640625, -3.52142333984375, -3.3472900390625, -3.17315673828125, -2.9990234375, -2.82489013671875, -2.6507568359375, -2.47662353515625, -2.302490234375, -2.12835693359375, -1.9542236328125, -1.78009033203125, -1.60595703125, -1.43182373046875, -1.2576904296875, -1.08355712890625, -0.909423828125, -0.73529052734375, -0.5611572265625, -0.38702392578125, -0.212890625, -0.03875732421875, 0.1353759765625, 0.30950927734375, 0.483642578125, 0.65777587890625, 0.8319091796875, 1.00604248046875, 1.18017578125, 1.35430908203125, 1.5284423828125, 1.70257568359375, 1.876708984375, 2.05084228515625, 2.2249755859375, 2.39910888671875, 2.5732421875, 2.74737548828125, 2.9215087890625, 3.09564208984375, 3.269775390625, 3.44390869140625, 3.6180419921875, 3.79217529296875, 3.96630859375, 4.14044189453125, 4.3145751953125, 4.48870849609375, 4.662841796875, 4.83697509765625, 5.0111083984375, 5.18524169921875, 5.359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 12.0, 4.0, 13.0, 14.0, 23.0, 18.0, 26.0, 48.0, 92.0, 102.0, 177.0, 416.0, 1939.0, 552.0, 236.0, 100.0, 92.0, 48.0, 40.0, 25.0, 24.0, 15.0, 8.0, 8.0, 6.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.310546875, -3.2176513671875, -3.124755859375, -3.0318603515625, -2.93896484375, -2.8460693359375, -2.753173828125, -2.6602783203125, -2.5673828125, -2.4744873046875, -2.381591796875, -2.2886962890625, -2.19580078125, -2.1029052734375, -2.010009765625, -1.9171142578125, -1.82421875, -1.7313232421875, -1.638427734375, -1.5455322265625, -1.45263671875, -1.3597412109375, -1.266845703125, -1.1739501953125, -1.0810546875, -0.9881591796875, -0.895263671875, -0.8023681640625, -0.70947265625, -0.6165771484375, -0.523681640625, -0.4307861328125, -0.337890625, -0.2449951171875, -0.152099609375, -0.0592041015625, 0.03369140625, 0.1265869140625, 0.219482421875, 0.3123779296875, 0.4052734375, 0.4981689453125, 0.591064453125, 0.6839599609375, 0.77685546875, 0.8697509765625, 0.962646484375, 1.0555419921875, 1.1484375, 1.2413330078125, 1.334228515625, 1.4271240234375, 1.52001953125, 1.6129150390625, 1.705810546875, 1.7987060546875, 1.8916015625, 1.9844970703125, 2.077392578125, 2.1702880859375, 2.26318359375, 2.3560791015625, 2.448974609375, 2.5418701171875, 2.634765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 24.0, 80.0, 175.0, 231.0, 234.0, 134.0, 78.0, 26.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.13190841674805, -40.93213653564453, -39.732364654541016, -38.5325927734375, -37.33282470703125, -36.133052825927734, -34.93328094482422, -33.7335090637207, -32.53373718261719, -31.333965301513672, -30.134193420410156, -28.934423446655273, -27.734651565551758, -26.534879684448242, -25.33510971069336, -24.135337829589844, -22.935565948486328, -21.735794067382812, -20.536022186279297, -19.336252212524414, -18.1364803314209, -16.936708450317383, -15.736937522888184, -14.537166595458984, -13.337394714355469, -12.137622833251953, -10.937851905822754, -9.738080978393555, -8.538309097290039, -7.338537693023682, -6.138766288757324, -4.938995361328125, -3.739227294921875, -2.5394558906555176, -1.3396844863891602, -0.13991308212280273, 1.0598583221435547, 2.259629726409912, 3.4594011306762695, 4.659172058105469, 5.858943939208984, 7.058715343475342, 8.2584867477417, 9.458257675170898, 10.658029556274414, 11.85780143737793, 13.057572364807129, 14.257343292236328, 15.457115173339844, 16.65688705444336, 17.856658935546875, 19.056428909301758, 20.256200790405273, 21.45597267150879, 22.655742645263672, 23.855514526367188, 25.055286407470703, 26.25505828857422, 27.454830169677734, 28.654600143432617, 29.854372024536133, 31.05414390563965, 32.25391387939453, 33.45368576049805, 34.65345764160156]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 8.0, 9.0, 11.0, 4.0, 5.0, 14.0, 13.0, 17.0, 17.0, 17.0, 26.0, 14.0, 35.0, 41.0, 30.0, 37.0, 39.0, 45.0, 32.0, 45.0, 52.0, 41.0, 40.0, 37.0, 30.0, 41.0, 39.0, 28.0, 35.0, 31.0, 24.0, 20.0, 19.0, 19.0, 13.0, 15.0, 5.0, 10.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.676658630371094, -8.408642768859863, -8.140626907348633, -7.8726115226745605, -7.60459566116333, -7.336580276489258, -7.068564414978027, -6.800548553466797, -6.532532691955566, -6.264516830444336, -5.996501445770264, -5.728485584259033, -5.460469722747803, -5.1924543380737305, -4.9244384765625, -4.6564226150512695, -4.388407230377197, -4.120391368865967, -3.8523757457733154, -3.584360122680664, -3.3163442611694336, -3.0483286380767822, -2.780313014984131, -2.5122971534729004, -2.244281530380249, -1.976265788078308, -1.7082500457763672, -1.4402344226837158, -1.172218680381775, -0.904202938079834, -0.6361873149871826, -0.3681715726852417, -0.10015583038330078, 0.16785988211631775, 0.4358755946159363, 0.7038912773132324, 0.9719070196151733, 1.2399227619171143, 1.5079383850097656, 1.7759541273117065, 2.0439698696136475, 2.311985492706299, 2.5800013542175293, 2.8480169773101807, 3.116032600402832, 3.3840484619140625, 3.652064085006714, 3.9200797080993652, 4.188095569610596, 4.456111431121826, 4.724126815795898, 4.992142677307129, 5.260158538818359, 5.52817440032959, 5.796189785003662, 6.064205646514893, 6.332221031188965, 6.600236892700195, 6.868252277374268, 7.136268138885498, 7.4042840003967285, 7.672299385070801, 7.940315246582031, 8.208331108093262, 8.476346969604492]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 9.0, 18.0, 26.0, 31.0, 46.0, 80.0, 134.0, 199.0, 372.0, 479.0, 832.0, 1455.0, 2613.0, 4855.0, 9218.0, 18235.0, 35782.0, 70284.0, 133846.0, 285949.0, 244190.0, 115261.0, 60370.0, 30886.0, 15534.0, 8028.0, 4184.0, 2323.0, 1314.0, 765.0, 439.0, 280.0, 184.0, 105.0, 61.0, 43.0, 37.0, 21.0, 21.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.777435302734375, -3.64666748046875, -3.515899658203125, -3.3851318359375, -3.254364013671875, -3.12359619140625, -2.992828369140625, -2.862060546875, -2.731292724609375, -2.60052490234375, -2.469757080078125, -2.3389892578125, -2.208221435546875, -2.07745361328125, -1.946685791015625, -1.81591796875, -1.685150146484375, -1.55438232421875, -1.423614501953125, -1.2928466796875, -1.162078857421875, -1.03131103515625, -0.900543212890625, -0.769775390625, -0.639007568359375, -0.50823974609375, -0.377471923828125, -0.2467041015625, -0.115936279296875, 0.01483154296875, 0.145599365234375, 0.2763671875, 0.407135009765625, 0.53790283203125, 0.668670654296875, 0.7994384765625, 0.930206298828125, 1.06097412109375, 1.191741943359375, 1.322509765625, 1.453277587890625, 1.58404541015625, 1.714813232421875, 1.8455810546875, 1.976348876953125, 2.10711669921875, 2.237884521484375, 2.36865234375, 2.499420166015625, 2.63018798828125, 2.760955810546875, 2.8917236328125, 3.022491455078125, 3.15325927734375, 3.284027099609375, 3.414794921875, 3.545562744140625, 3.67633056640625, 3.807098388671875, 3.9378662109375, 4.068634033203125, 4.19940185546875, 4.330169677734375, 4.4609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 3.0, 9.0, 8.0, 8.0, 17.0, 20.0, 14.0, 15.0, 17.0, 27.0, 22.0, 33.0, 33.0, 30.0, 34.0, 39.0, 45.0, 29.0, 49.0, 41.0, 41.0, 37.0, 44.0, 41.0, 41.0, 36.0, 27.0, 26.0, 19.0, 22.0, 25.0, 22.0, 20.0, 9.0, 16.0, 16.0, 10.0, 4.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.2607421875, -1.2244415283203125, -1.188140869140625, -1.1518402099609375, -1.11553955078125, -1.0792388916015625, -1.042938232421875, -1.0066375732421875, -0.9703369140625, -0.9340362548828125, -0.897735595703125, -0.8614349365234375, -0.82513427734375, -0.7888336181640625, -0.752532958984375, -0.7162322998046875, -0.679931640625, -0.6436309814453125, -0.607330322265625, -0.5710296630859375, -0.53472900390625, -0.4984283447265625, -0.462127685546875, -0.4258270263671875, -0.3895263671875, -0.3532257080078125, -0.316925048828125, -0.2806243896484375, -0.24432373046875, -0.2080230712890625, -0.171722412109375, -0.1354217529296875, -0.09912109375, -0.0628204345703125, -0.026519775390625, 0.0097808837890625, 0.04608154296875, 0.0823822021484375, 0.118682861328125, 0.1549835205078125, 0.1912841796875, 0.2275848388671875, 0.263885498046875, 0.3001861572265625, 0.33648681640625, 0.3727874755859375, 0.409088134765625, 0.4453887939453125, 0.481689453125, 0.5179901123046875, 0.554290771484375, 0.5905914306640625, 0.62689208984375, 0.6631927490234375, 0.699493408203125, 0.7357940673828125, 0.7720947265625, 0.8083953857421875, 0.844696044921875, 0.8809967041015625, 0.91729736328125, 0.9535980224609375, 0.989898681640625, 1.0261993408203125, 1.0625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 11.0, 15.0, 28.0, 29.0, 44.0, 48.0, 96.0, 103.0, 138.0, 191.0, 229.0, 428.0, 675.0, 1281.0, 3487.0, 20995.0, 182026.0, 710484.0, 109486.0, 13183.0, 2642.0, 1089.0, 614.0, 356.0, 257.0, 169.0, 127.0, 80.0, 68.0, 46.0, 34.0, 25.0, 20.0, 17.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.015625, -12.6370849609375, -12.258544921875, -11.8800048828125, -11.50146484375, -11.1229248046875, -10.744384765625, -10.3658447265625, -9.9873046875, -9.6087646484375, -9.230224609375, -8.8516845703125, -8.47314453125, -8.0946044921875, -7.716064453125, -7.3375244140625, -6.958984375, -6.5804443359375, -6.201904296875, -5.8233642578125, -5.44482421875, -5.0662841796875, -4.687744140625, -4.3092041015625, -3.9306640625, -3.5521240234375, -3.173583984375, -2.7950439453125, -2.41650390625, -2.0379638671875, -1.659423828125, -1.2808837890625, -0.90234375, -0.5238037109375, -0.145263671875, 0.2332763671875, 0.61181640625, 0.9903564453125, 1.368896484375, 1.7474365234375, 2.1259765625, 2.5045166015625, 2.883056640625, 3.2615966796875, 3.64013671875, 4.0186767578125, 4.397216796875, 4.7757568359375, 5.154296875, 5.5328369140625, 5.911376953125, 6.2899169921875, 6.66845703125, 7.0469970703125, 7.425537109375, 7.8040771484375, 8.1826171875, 8.5611572265625, 8.939697265625, 9.3182373046875, 9.69677734375, 10.0753173828125, 10.453857421875, 10.8323974609375, 11.2109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 10.0, 8.0, 10.0, 17.0, 32.0, 26.0, 19.0, 28.0, 49.0, 41.0, 53.0, 51.0, 44.0, 56.0, 53.0, 64.0, 66.0, 42.0, 48.0, 40.0, 38.0, 40.0, 32.0, 27.0, 12.0, 22.0, 13.0, 9.0, 11.0, 7.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.8125, -8.5684814453125, -8.324462890625, -8.0804443359375, -7.83642578125, -7.5924072265625, -7.348388671875, -7.1043701171875, -6.8603515625, -6.6163330078125, -6.372314453125, -6.1282958984375, -5.88427734375, -5.6402587890625, -5.396240234375, -5.1522216796875, -4.908203125, -4.6641845703125, -4.420166015625, -4.1761474609375, -3.93212890625, -3.6881103515625, -3.444091796875, -3.2000732421875, -2.9560546875, -2.7120361328125, -2.468017578125, -2.2239990234375, -1.97998046875, -1.7359619140625, -1.491943359375, -1.2479248046875, -1.00390625, -0.7598876953125, -0.515869140625, -0.2718505859375, -0.02783203125, 0.2161865234375, 0.460205078125, 0.7042236328125, 0.9482421875, 1.1922607421875, 1.436279296875, 1.6802978515625, 1.92431640625, 2.1683349609375, 2.412353515625, 2.6563720703125, 2.900390625, 3.1444091796875, 3.388427734375, 3.6324462890625, 3.87646484375, 4.1204833984375, 4.364501953125, 4.6085205078125, 4.8525390625, 5.0965576171875, 5.340576171875, 5.5845947265625, 5.82861328125, 6.0726318359375, 6.316650390625, 6.5606689453125, 6.8046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 23.0, 23.0, 36.0, 52.0, 80.0, 157.0, 295.0, 486.0, 949.0, 1997.0, 4605.0, 12729.0, 42528.0, 167582.0, 586392.0, 167157.0, 42381.0, 12431.0, 4519.0, 1934.0, 987.0, 498.0, 247.0, 148.0, 100.0, 69.0, 34.0, 30.0, 19.0, 14.0, 7.0, 10.0, 3.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.62115478515625, -3.4844970703125, -3.34783935546875, -3.211181640625, -3.07452392578125, -2.9378662109375, -2.80120849609375, -2.66455078125, -2.52789306640625, -2.3912353515625, -2.25457763671875, -2.117919921875, -1.98126220703125, -1.8446044921875, -1.70794677734375, -1.5712890625, -1.43463134765625, -1.2979736328125, -1.16131591796875, -1.024658203125, -0.88800048828125, -0.7513427734375, -0.61468505859375, -0.47802734375, -0.34136962890625, -0.2047119140625, -0.06805419921875, 0.068603515625, 0.20526123046875, 0.3419189453125, 0.47857666015625, 0.615234375, 0.75189208984375, 0.8885498046875, 1.02520751953125, 1.161865234375, 1.29852294921875, 1.4351806640625, 1.57183837890625, 1.70849609375, 1.84515380859375, 1.9818115234375, 2.11846923828125, 2.255126953125, 2.39178466796875, 2.5284423828125, 2.66510009765625, 2.8017578125, 2.93841552734375, 3.0750732421875, 3.21173095703125, 3.348388671875, 3.48504638671875, 3.6217041015625, 3.75836181640625, 3.89501953125, 4.03167724609375, 4.1683349609375, 4.30499267578125, 4.441650390625, 4.57830810546875, 4.7149658203125, 4.85162353515625, 4.98828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 6.0, 11.0, 15.0, 21.0, 22.0, 30.0, 36.0, 53.0, 63.0, 72.0, 111.0, 156.0, 92.0, 64.0, 35.0, 41.0, 27.0, 22.0, 18.0, 20.0, 17.0, 9.0, 11.0, 3.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008721351623535156, -0.000845007598400116, -0.0008178800344467163, -0.0007907524704933167, -0.000763624906539917, -0.0007364973425865173, -0.0007093697786331177, -0.000682242214679718, -0.0006551146507263184, -0.0006279870867729187, -0.000600859522819519, -0.0005737319588661194, -0.0005466043949127197, -0.0005194768309593201, -0.0004923492670059204, -0.00046522170305252075, -0.0004380941390991211, -0.00041096657514572144, -0.0003838390111923218, -0.0003567114472389221, -0.00032958388328552246, -0.0003024563193321228, -0.00027532875537872314, -0.0002482011914253235, -0.00022107362747192383, -0.00019394606351852417, -0.0001668184995651245, -0.00013969093561172485, -0.0001125633716583252, -8.543580770492554e-05, -5.830824375152588e-05, -3.118067979812622e-05, -4.0531158447265625e-06, 2.3074448108673096e-05, 5.0202012062072754e-05, 7.732957601547241e-05, 0.00010445713996887207, 0.00013158470392227173, 0.0001587122678756714, 0.00018583983182907104, 0.0002129673957824707, 0.00024009495973587036, 0.00026722252368927, 0.0002943500876426697, 0.00032147765159606934, 0.000348605215549469, 0.00037573277950286865, 0.0004028603434562683, 0.00042998790740966797, 0.0004571154713630676, 0.0004842430353164673, 0.0005113705992698669, 0.0005384981632232666, 0.0005656257271766663, 0.0005927532911300659, 0.0006198808550834656, 0.0006470084190368652, 0.0006741359829902649, 0.0007012635469436646, 0.0007283911108970642, 0.0007555186748504639, 0.0007826462388038635, 0.0008097738027572632, 0.0008369013667106628, 0.0008640289306640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 16.0, 22.0, 31.0, 28.0, 42.0, 86.0, 128.0, 176.0, 367.0, 619.0, 1448.0, 4216.0, 19116.0, 168016.0, 736146.0, 99616.0, 12863.0, 3091.0, 1161.0, 541.0, 283.0, 160.0, 111.0, 71.0, 44.0, 31.0, 36.0, 16.0, 9.0, 10.0, 6.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.3125, -6.09771728515625, -5.8829345703125, -5.66815185546875, -5.453369140625, -5.23858642578125, -5.0238037109375, -4.80902099609375, -4.59423828125, -4.37945556640625, -4.1646728515625, -3.94989013671875, -3.735107421875, -3.52032470703125, -3.3055419921875, -3.09075927734375, -2.8759765625, -2.66119384765625, -2.4464111328125, -2.23162841796875, -2.016845703125, -1.80206298828125, -1.5872802734375, -1.37249755859375, -1.15771484375, -0.94293212890625, -0.7281494140625, -0.51336669921875, -0.298583984375, -0.08380126953125, 0.1309814453125, 0.34576416015625, 0.560546875, 0.77532958984375, 0.9901123046875, 1.20489501953125, 1.419677734375, 1.63446044921875, 1.8492431640625, 2.06402587890625, 2.27880859375, 2.49359130859375, 2.7083740234375, 2.92315673828125, 3.137939453125, 3.35272216796875, 3.5675048828125, 3.78228759765625, 3.9970703125, 4.21185302734375, 4.4266357421875, 4.64141845703125, 4.856201171875, 5.07098388671875, 5.2857666015625, 5.50054931640625, 5.71533203125, 5.93011474609375, 6.1448974609375, 6.35968017578125, 6.574462890625, 6.78924560546875, 7.0040283203125, 7.21881103515625, 7.43359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 7.0, 12.0, 11.0, 18.0, 23.0, 26.0, 40.0, 41.0, 57.0, 88.0, 107.0, 158.0, 97.0, 72.0, 54.0, 39.0, 38.0, 29.0, 17.0, 21.0, 6.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.24957275390625, -5.0968017578125, -4.94403076171875, -4.791259765625, -4.63848876953125, -4.4857177734375, -4.33294677734375, -4.18017578125, -4.02740478515625, -3.8746337890625, -3.72186279296875, -3.569091796875, -3.41632080078125, -3.2635498046875, -3.11077880859375, -2.9580078125, -2.80523681640625, -2.6524658203125, -2.49969482421875, -2.346923828125, -2.19415283203125, -2.0413818359375, -1.88861083984375, -1.73583984375, -1.58306884765625, -1.4302978515625, -1.27752685546875, -1.124755859375, -0.97198486328125, -0.8192138671875, -0.66644287109375, -0.513671875, -0.36090087890625, -0.2081298828125, -0.05535888671875, 0.097412109375, 0.25018310546875, 0.4029541015625, 0.55572509765625, 0.70849609375, 0.86126708984375, 1.0140380859375, 1.16680908203125, 1.319580078125, 1.47235107421875, 1.6251220703125, 1.77789306640625, 1.9306640625, 2.08343505859375, 2.2362060546875, 2.38897705078125, 2.541748046875, 2.69451904296875, 2.8472900390625, 3.00006103515625, 3.15283203125, 3.30560302734375, 3.4583740234375, 3.61114501953125, 3.763916015625, 3.91668701171875, 4.0694580078125, 4.22222900390625, 4.375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 14.0, 16.0, 32.0, 95.0, 129.0, 187.0, 199.0, 134.0, 103.0, 53.0, 25.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.10092163085938, -75.42745971679688, -72.75399017333984, -70.08052825927734, -67.40705871582031, -64.73359680175781, -62.06013107299805, -59.38666534423828, -56.713199615478516, -54.03973388671875, -51.366268157958984, -48.69280242919922, -46.01934051513672, -43.34587097167969, -40.67240905761719, -37.99894332885742, -35.325477600097656, -32.65201187133789, -29.978546142578125, -27.305082321166992, -24.631616592407227, -21.95815086364746, -19.284687042236328, -16.611221313476562, -13.937755584716797, -11.264289855957031, -8.590825080871582, -5.917360305786133, -3.243894577026367, -0.5704288482666016, 2.1030349731445312, 4.776500701904297, 7.449974060058594, 10.12343978881836, 12.796904563903809, 15.470369338989258, 18.143835067749023, 20.81730079650879, 23.490764617919922, 26.164230346679688, 28.837696075439453, 31.51116180419922, 34.184627532958984, 36.85809326171875, 39.53155517578125, 42.20502471923828, 44.87848663330078, 47.55195236206055, 50.22541809082031, 52.89888381958008, 55.572349548339844, 58.245811462402344, 60.919281005859375, 63.592742919921875, 66.26620483398438, 68.9396743774414, 71.61314392089844, 74.28660583496094, 76.96007537841797, 79.63353729248047, 82.3070068359375, 84.98046875, 87.6539306640625, 90.32740020751953, 93.00086212158203]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 14.0, 16.0, 19.0, 23.0, 25.0, 25.0, 29.0, 38.0, 37.0, 39.0, 42.0, 52.0, 51.0, 58.0, 48.0, 59.0, 42.0, 37.0, 45.0, 34.0, 40.0, 32.0, 28.0, 27.0, 16.0, 19.0, 18.0, 8.0, 4.0, 10.0, 3.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.343772888183594, -36.130653381347656, -34.917537689208984, -33.70441818237305, -32.49129867553711, -31.278182983398438, -30.0650634765625, -28.851945877075195, -27.63882827758789, -26.425710678100586, -25.21259117126465, -23.999473571777344, -22.78635597229004, -21.573238372802734, -20.360118865966797, -19.147001266479492, -17.933881759643555, -16.72076416015625, -15.507645606994629, -14.294527053833008, -13.081409454345703, -11.868290901184082, -10.655172348022461, -9.442054748535156, -8.228936195373535, -7.015818119049072, -5.802700042724609, -4.589581489562988, -3.3764634132385254, -2.1633453369140625, -0.9502267837524414, 0.2628908157348633, 1.4760093688964844, 2.6891274452209473, 3.9022457599639893, 5.115364074707031, 6.328482151031494, 7.541600227355957, 8.754718780517578, 9.967836380004883, 11.180954933166504, 12.394073486328125, 13.60719108581543, 14.82030963897705, 16.033428192138672, 17.246545791625977, 18.45966339111328, 19.67278289794922, 20.885900497436523, 22.099018096923828, 23.312137603759766, 24.52525520324707, 25.738372802734375, 26.951492309570312, 28.164609909057617, 29.377727508544922, 30.59084701538086, 31.803964614868164, 33.01708221435547, 34.230201721191406, 35.443321228027344, 36.656436920166016, 37.86955642700195, 39.082672119140625, 40.29579162597656]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 18.0, 17.0, 24.0, 32.0, 45.0, 69.0, 107.0, 175.0, 219.0, 377.0, 618.0, 1016.0, 1827.0, 3340.0, 6894.0, 16729.0, 54558.0, 362795.0, 3466188.0, 211866.0, 40833.0, 13847.0, 5947.0, 2946.0, 1518.0, 865.0, 491.0, 271.0, 232.0, 125.0, 83.0, 57.0, 47.0, 26.0, 23.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.389404296875, -8.13037109375, -7.871337890625, -7.6123046875, -7.353271484375, -7.09423828125, -6.835205078125, -6.576171875, -6.317138671875, -6.05810546875, -5.799072265625, -5.5400390625, -5.281005859375, -5.02197265625, -4.762939453125, -4.50390625, -4.244873046875, -3.98583984375, -3.726806640625, -3.4677734375, -3.208740234375, -2.94970703125, -2.690673828125, -2.431640625, -2.172607421875, -1.91357421875, -1.654541015625, -1.3955078125, -1.136474609375, -0.87744140625, -0.618408203125, -0.359375, -0.100341796875, 0.15869140625, 0.417724609375, 0.6767578125, 0.935791015625, 1.19482421875, 1.453857421875, 1.712890625, 1.971923828125, 2.23095703125, 2.489990234375, 2.7490234375, 3.008056640625, 3.26708984375, 3.526123046875, 3.78515625, 4.044189453125, 4.30322265625, 4.562255859375, 4.8212890625, 5.080322265625, 5.33935546875, 5.598388671875, 5.857421875, 6.116455078125, 6.37548828125, 6.634521484375, 6.8935546875, 7.152587890625, 7.41162109375, 7.670654296875, 7.9296875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 6.0, 7.0, 5.0, 6.0, 9.0, 12.0, 14.0, 19.0, 15.0, 19.0, 18.0, 23.0, 29.0, 26.0, 31.0, 27.0, 38.0, 38.0, 36.0, 41.0, 39.0, 40.0, 46.0, 36.0, 31.0, 27.0, 50.0, 48.0, 26.0, 28.0, 33.0, 26.0, 20.0, 23.0, 17.0, 25.0, 16.0, 8.0, 8.0, 12.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2763671875, -1.235137939453125, -1.19390869140625, -1.152679443359375, -1.1114501953125, -1.070220947265625, -1.02899169921875, -0.987762451171875, -0.946533203125, -0.905303955078125, -0.86407470703125, -0.822845458984375, -0.7816162109375, -0.740386962890625, -0.69915771484375, -0.657928466796875, -0.61669921875, -0.575469970703125, -0.53424072265625, -0.493011474609375, -0.4517822265625, -0.410552978515625, -0.36932373046875, -0.328094482421875, -0.286865234375, -0.245635986328125, -0.20440673828125, -0.163177490234375, -0.1219482421875, -0.080718994140625, -0.03948974609375, 0.001739501953125, 0.04296875, 0.084197998046875, 0.12542724609375, 0.166656494140625, 0.2078857421875, 0.249114990234375, 0.29034423828125, 0.331573486328125, 0.372802734375, 0.414031982421875, 0.45526123046875, 0.496490478515625, 0.5377197265625, 0.578948974609375, 0.62017822265625, 0.661407470703125, 0.70263671875, 0.743865966796875, 0.78509521484375, 0.826324462890625, 0.8675537109375, 0.908782958984375, 0.95001220703125, 0.991241455078125, 1.032470703125, 1.073699951171875, 1.11492919921875, 1.156158447265625, 1.1973876953125, 1.238616943359375, 1.27984619140625, 1.321075439453125, 1.3623046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 9.0, 7.0, 10.0, 29.0, 46.0, 47.0, 75.0, 122.0, 177.0, 297.0, 429.0, 772.0, 1301.0, 2262.0, 4345.0, 8686.0, 19091.0, 48007.0, 162810.0, 1385308.0, 2276005.0, 190085.0, 53568.0, 20979.0, 9199.0, 4679.0, 2452.0, 1334.0, 744.0, 507.0, 326.0, 183.0, 115.0, 75.0, 54.0, 46.0, 21.0, 24.0, 16.0, 8.0, 7.0, 10.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.5859375, -7.3631591796875, -7.140380859375, -6.9176025390625, -6.69482421875, -6.4720458984375, -6.249267578125, -6.0264892578125, -5.8037109375, -5.5809326171875, -5.358154296875, -5.1353759765625, -4.91259765625, -4.6898193359375, -4.467041015625, -4.2442626953125, -4.021484375, -3.7987060546875, -3.575927734375, -3.3531494140625, -3.13037109375, -2.9075927734375, -2.684814453125, -2.4620361328125, -2.2392578125, -2.0164794921875, -1.793701171875, -1.5709228515625, -1.34814453125, -1.1253662109375, -0.902587890625, -0.6798095703125, -0.45703125, -0.2342529296875, -0.011474609375, 0.2113037109375, 0.43408203125, 0.6568603515625, 0.879638671875, 1.1024169921875, 1.3251953125, 1.5479736328125, 1.770751953125, 1.9935302734375, 2.21630859375, 2.4390869140625, 2.661865234375, 2.8846435546875, 3.107421875, 3.3302001953125, 3.552978515625, 3.7757568359375, 3.99853515625, 4.2213134765625, 4.444091796875, 4.6668701171875, 4.8896484375, 5.1124267578125, 5.335205078125, 5.5579833984375, 5.78076171875, 6.0035400390625, 6.226318359375, 6.4490966796875, 6.671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 9.0, 13.0, 21.0, 23.0, 35.0, 32.0, 62.0, 106.0, 163.0, 322.0, 876.0, 1339.0, 420.0, 201.0, 136.0, 74.0, 61.0, 40.0, 30.0, 25.0, 10.0, 12.0, 12.0, 9.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.0447998046875, -3.906005859375, -3.7672119140625, -3.62841796875, -3.4896240234375, -3.350830078125, -3.2120361328125, -3.0732421875, -2.9344482421875, -2.795654296875, -2.6568603515625, -2.51806640625, -2.3792724609375, -2.240478515625, -2.1016845703125, -1.962890625, -1.8240966796875, -1.685302734375, -1.5465087890625, -1.40771484375, -1.2689208984375, -1.130126953125, -0.9913330078125, -0.8525390625, -0.7137451171875, -0.574951171875, -0.4361572265625, -0.29736328125, -0.1585693359375, -0.019775390625, 0.1190185546875, 0.2578125, 0.3966064453125, 0.535400390625, 0.6741943359375, 0.81298828125, 0.9517822265625, 1.090576171875, 1.2293701171875, 1.3681640625, 1.5069580078125, 1.645751953125, 1.7845458984375, 1.92333984375, 2.0621337890625, 2.200927734375, 2.3397216796875, 2.478515625, 2.6173095703125, 2.756103515625, 2.8948974609375, 3.03369140625, 3.1724853515625, 3.311279296875, 3.4500732421875, 3.5888671875, 3.7276611328125, 3.866455078125, 4.0052490234375, 4.14404296875, 4.2828369140625, 4.421630859375, 4.5604248046875, 4.69921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 14.0, 33.0, 87.0, 110.0, 145.0, 182.0, 152.0, 113.0, 76.0, 45.0, 13.0, 11.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.29136657714844, -35.9809684753418, -34.67056655883789, -33.36016845703125, -32.049766540527344, -30.739368438720703, -29.428970336914062, -28.11857032775879, -26.808170318603516, -25.497770309448242, -24.18737030029297, -22.876972198486328, -21.566572189331055, -20.25617218017578, -18.94577407836914, -17.635374069213867, -16.324974060058594, -15.01457405090332, -13.704174995422363, -12.393775939941406, -11.083375930786133, -9.77297592163086, -8.462576866149902, -7.152177810668945, -5.841777801513672, -4.531378269195557, -3.2209787368774414, -1.9105792045593262, -0.6001796722412109, 0.7102198600769043, 2.0206193923950195, 3.3310184478759766, 4.64141845703125, 5.951817989349365, 7.2622175216674805, 8.572616577148438, 9.883016586303711, 11.193416595458984, 12.503815650939941, 13.814214706420898, 15.124614715576172, 16.435014724731445, 17.74541473388672, 19.05581283569336, 20.366212844848633, 21.676612854003906, 22.987010955810547, 24.29741096496582, 25.607810974121094, 26.918210983276367, 28.22861099243164, 29.53900909423828, 30.849409103393555, 32.15980911254883, 33.47020721435547, 34.780609130859375, 36.091007232666016, 37.401405334472656, 38.71180725097656, 40.0222053527832, 41.332603454589844, 42.64300537109375, 43.95340347290039, 45.26380157470703, 46.57420349121094]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 16.0, 6.0, 18.0, 20.0, 16.0, 31.0, 34.0, 42.0, 33.0, 52.0, 32.0, 57.0, 46.0, 49.0, 59.0, 54.0, 54.0, 53.0, 56.0, 42.0, 36.0, 29.0, 41.0, 22.0, 16.0, 16.0, 12.0, 8.0, 16.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.120235443115234, -19.56670379638672, -19.013172149658203, -18.459638595581055, -17.90610694885254, -17.352575302124023, -16.799043655395508, -16.24551010131836, -15.691978454589844, -15.138446807861328, -14.584914207458496, -14.03138256072998, -13.477849960327148, -12.924318313598633, -12.370786666870117, -11.817254066467285, -11.26372241973877, -10.710190773010254, -10.156658172607422, -9.603126525878906, -9.049593925476074, -8.496062278747559, -7.942530155181885, -7.388998031616211, -6.835465908050537, -6.281933784484863, -5.7284016609191895, -5.174869537353516, -4.621337890625, -4.067805290222168, -3.5142736434936523, -2.9607415199279785, -2.407210350036621, -1.8536782264709473, -1.300146222114563, -0.7466142177581787, -0.19308209419250488, 0.36045002937316895, 0.9139819145202637, 1.4675140380859375, 2.0210461616516113, 2.574578285217285, 3.128110408782959, 3.6816422939300537, 4.235174179077148, 4.7887067794799805, 5.342238426208496, 5.89577054977417, 6.449302673339844, 7.002834796905518, 7.556366920471191, 8.109898567199707, 8.663431167602539, 9.216962814331055, 9.77049446105957, 10.324027061462402, 10.877559661865234, 11.43109130859375, 11.984623908996582, 12.538155555725098, 13.09168815612793, 13.645219802856445, 14.198751449584961, 14.752284049987793, 15.305815696716309]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 13.0, 13.0, 36.0, 49.0, 77.0, 124.0, 198.0, 345.0, 608.0, 1117.0, 2326.0, 4860.0, 11301.0, 26909.0, 68701.0, 172293.0, 325340.0, 252804.0, 108338.0, 41979.0, 17155.0, 7274.0, 3175.0, 1572.0, 833.0, 437.0, 250.0, 136.0, 95.0, 54.0, 28.0, 23.0, 18.0, 18.0, 7.0, 2.0, 5.0, 3.0, 2.0, 8.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.90625, -5.731201171875, -5.55615234375, -5.381103515625, -5.2060546875, -5.031005859375, -4.85595703125, -4.680908203125, -4.505859375, -4.330810546875, -4.15576171875, -3.980712890625, -3.8056640625, -3.630615234375, -3.45556640625, -3.280517578125, -3.10546875, -2.930419921875, -2.75537109375, -2.580322265625, -2.4052734375, -2.230224609375, -2.05517578125, -1.880126953125, -1.705078125, -1.530029296875, -1.35498046875, -1.179931640625, -1.0048828125, -0.829833984375, -0.65478515625, -0.479736328125, -0.3046875, -0.129638671875, 0.04541015625, 0.220458984375, 0.3955078125, 0.570556640625, 0.74560546875, 0.920654296875, 1.095703125, 1.270751953125, 1.44580078125, 1.620849609375, 1.7958984375, 1.970947265625, 2.14599609375, 2.321044921875, 2.49609375, 2.671142578125, 2.84619140625, 3.021240234375, 3.1962890625, 3.371337890625, 3.54638671875, 3.721435546875, 3.896484375, 4.071533203125, 4.24658203125, 4.421630859375, 4.5966796875, 4.771728515625, 4.94677734375, 5.121826171875, 5.296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 7.0, 9.0, 6.0, 10.0, 16.0, 19.0, 23.0, 25.0, 22.0, 18.0, 26.0, 30.0, 29.0, 28.0, 39.0, 38.0, 40.0, 40.0, 50.0, 38.0, 39.0, 34.0, 30.0, 44.0, 35.0, 39.0, 36.0, 33.0, 27.0, 26.0, 20.0, 19.0, 20.0, 12.0, 12.0, 9.0, 9.0, 9.0, 7.0, 5.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.439453125, -1.3949432373046875, -1.350433349609375, -1.3059234619140625, -1.26141357421875, -1.2169036865234375, -1.172393798828125, -1.1278839111328125, -1.0833740234375, -1.0388641357421875, -0.994354248046875, -0.9498443603515625, -0.90533447265625, -0.8608245849609375, -0.816314697265625, -0.7718048095703125, -0.727294921875, -0.6827850341796875, -0.638275146484375, -0.5937652587890625, -0.54925537109375, -0.5047454833984375, -0.460235595703125, -0.4157257080078125, -0.3712158203125, -0.3267059326171875, -0.282196044921875, -0.2376861572265625, -0.19317626953125, -0.1486663818359375, -0.104156494140625, -0.0596466064453125, -0.01513671875, 0.0293731689453125, 0.073883056640625, 0.1183929443359375, 0.16290283203125, 0.2074127197265625, 0.251922607421875, 0.2964324951171875, 0.3409423828125, 0.3854522705078125, 0.429962158203125, 0.4744720458984375, 0.51898193359375, 0.5634918212890625, 0.608001708984375, 0.6525115966796875, 0.697021484375, 0.7415313720703125, 0.786041259765625, 0.8305511474609375, 0.87506103515625, 0.9195709228515625, 0.964080810546875, 1.0085906982421875, 1.0531005859375, 1.0976104736328125, 1.142120361328125, 1.1866302490234375, 1.23114013671875, 1.2756500244140625, 1.320159912109375, 1.3646697998046875, 1.4091796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 11.0, 10.0, 18.0, 20.0, 32.0, 37.0, 57.0, 76.0, 87.0, 124.0, 213.0, 335.0, 564.0, 956.0, 1907.0, 6294.0, 38882.0, 352895.0, 558770.0, 71820.0, 9866.0, 2661.0, 1095.0, 630.0, 385.0, 241.0, 178.0, 97.0, 85.0, 56.0, 44.0, 29.0, 18.0, 16.0, 13.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.0390625, -14.6341552734375, -14.229248046875, -13.8243408203125, -13.41943359375, -13.0145263671875, -12.609619140625, -12.2047119140625, -11.7998046875, -11.3948974609375, -10.989990234375, -10.5850830078125, -10.18017578125, -9.7752685546875, -9.370361328125, -8.9654541015625, -8.560546875, -8.1556396484375, -7.750732421875, -7.3458251953125, -6.94091796875, -6.5360107421875, -6.131103515625, -5.7261962890625, -5.3212890625, -4.9163818359375, -4.511474609375, -4.1065673828125, -3.70166015625, -3.2967529296875, -2.891845703125, -2.4869384765625, -2.08203125, -1.6771240234375, -1.272216796875, -0.8673095703125, -0.46240234375, -0.0574951171875, 0.347412109375, 0.7523193359375, 1.1572265625, 1.5621337890625, 1.967041015625, 2.3719482421875, 2.77685546875, 3.1817626953125, 3.586669921875, 3.9915771484375, 4.396484375, 4.8013916015625, 5.206298828125, 5.6112060546875, 6.01611328125, 6.4210205078125, 6.825927734375, 7.2308349609375, 7.6357421875, 8.0406494140625, 8.445556640625, 8.8504638671875, 9.25537109375, 9.6602783203125, 10.065185546875, 10.4700927734375, 10.875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 6.0, 10.0, 7.0, 13.0, 19.0, 16.0, 26.0, 14.0, 24.0, 32.0, 27.0, 42.0, 53.0, 39.0, 55.0, 43.0, 50.0, 36.0, 36.0, 49.0, 52.0, 39.0, 39.0, 33.0, 22.0, 30.0, 33.0, 23.0, 18.0, 18.0, 17.0, 14.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.3515625, -9.065673828125, -8.77978515625, -8.493896484375, -8.2080078125, -7.922119140625, -7.63623046875, -7.350341796875, -7.064453125, -6.778564453125, -6.49267578125, -6.206787109375, -5.9208984375, -5.635009765625, -5.34912109375, -5.063232421875, -4.77734375, -4.491455078125, -4.20556640625, -3.919677734375, -3.6337890625, -3.347900390625, -3.06201171875, -2.776123046875, -2.490234375, -2.204345703125, -1.91845703125, -1.632568359375, -1.3466796875, -1.060791015625, -0.77490234375, -0.489013671875, -0.203125, 0.082763671875, 0.36865234375, 0.654541015625, 0.9404296875, 1.226318359375, 1.51220703125, 1.798095703125, 2.083984375, 2.369873046875, 2.65576171875, 2.941650390625, 3.2275390625, 3.513427734375, 3.79931640625, 4.085205078125, 4.37109375, 4.656982421875, 4.94287109375, 5.228759765625, 5.5146484375, 5.800537109375, 6.08642578125, 6.372314453125, 6.658203125, 6.944091796875, 7.22998046875, 7.515869140625, 7.8017578125, 8.087646484375, 8.37353515625, 8.659423828125, 8.9453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 30.0, 37.0, 56.0, 90.0, 157.0, 303.0, 731.0, 1882.0, 6491.0, 28290.0, 152467.0, 541475.0, 255199.0, 46680.0, 9942.0, 2838.0, 942.0, 413.0, 204.0, 104.0, 63.0, 22.0, 43.0, 27.0, 12.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.86328125, -6.68572998046875, -6.5081787109375, -6.33062744140625, -6.153076171875, -5.97552490234375, -5.7979736328125, -5.62042236328125, -5.44287109375, -5.26531982421875, -5.0877685546875, -4.91021728515625, -4.732666015625, -4.55511474609375, -4.3775634765625, -4.20001220703125, -4.0224609375, -3.84490966796875, -3.6673583984375, -3.48980712890625, -3.312255859375, -3.13470458984375, -2.9571533203125, -2.77960205078125, -2.60205078125, -2.42449951171875, -2.2469482421875, -2.06939697265625, -1.891845703125, -1.71429443359375, -1.5367431640625, -1.35919189453125, -1.181640625, -1.00408935546875, -0.8265380859375, -0.64898681640625, -0.471435546875, -0.29388427734375, -0.1163330078125, 0.06121826171875, 0.23876953125, 0.41632080078125, 0.5938720703125, 0.77142333984375, 0.948974609375, 1.12652587890625, 1.3040771484375, 1.48162841796875, 1.6591796875, 1.83673095703125, 2.0142822265625, 2.19183349609375, 2.369384765625, 2.54693603515625, 2.7244873046875, 2.90203857421875, 3.07958984375, 3.25714111328125, 3.4346923828125, 3.61224365234375, 3.789794921875, 3.96734619140625, 4.1448974609375, 4.32244873046875, 4.5]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 11.0, 14.0, 11.0, 17.0, 32.0, 31.0, 52.0, 59.0, 67.0, 75.0, 106.0, 91.0, 85.0, 70.0, 62.0, 44.0, 37.0, 29.0, 24.0, 17.0, 12.0, 16.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012073516845703125, -0.0011765360832214355, -0.0011457204818725586, -0.0011149048805236816, -0.0010840892791748047, -0.0010532736778259277, -0.0010224580764770508, -0.0009916424751281738, -0.0009608268737792969, -0.0009300112724304199, -0.000899195671081543, -0.000868380069732666, -0.0008375644683837891, -0.0008067488670349121, -0.0007759332656860352, -0.0007451176643371582, -0.0007143020629882812, -0.0006834864616394043, -0.0006526708602905273, -0.0006218552589416504, -0.0005910396575927734, -0.0005602240562438965, -0.0005294084548950195, -0.0004985928535461426, -0.0004677772521972656, -0.00043696165084838867, -0.0004061460494995117, -0.00037533044815063477, -0.0003445148468017578, -0.00031369924545288086, -0.0002828836441040039, -0.00025206804275512695, -0.00022125244140625, -0.00019043684005737305, -0.0001596212387084961, -0.00012880563735961914, -9.799003601074219e-05, -6.717443466186523e-05, -3.635883331298828e-05, -5.543231964111328e-06, 2.5272369384765625e-05, 5.608797073364258e-05, 8.690357208251953e-05, 0.00011771917343139648, 0.00014853477478027344, 0.0001793503761291504, 0.00021016597747802734, 0.0002409815788269043, 0.00027179718017578125, 0.0003026127815246582, 0.00033342838287353516, 0.0003642439842224121, 0.00039505958557128906, 0.000425875186920166, 0.00045669078826904297, 0.0004875063896179199, 0.0005183219909667969, 0.0005491375923156738, 0.0005799531936645508, 0.0006107687950134277, 0.0006415843963623047, 0.0006723999977111816, 0.0007032155990600586, 0.0007340312004089355, 0.0007648468017578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 9.0, 15.0, 22.0, 42.0, 55.0, 68.0, 118.0, 184.0, 338.0, 566.0, 1090.0, 2296.0, 6262.0, 26558.0, 156065.0, 559748.0, 240398.0, 40216.0, 8714.0, 2849.0, 1240.0, 651.0, 378.0, 232.0, 140.0, 83.0, 78.0, 31.0, 22.0, 14.0, 14.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.1640625, -5.99102783203125, -5.8179931640625, -5.64495849609375, -5.471923828125, -5.29888916015625, -5.1258544921875, -4.95281982421875, -4.77978515625, -4.60675048828125, -4.4337158203125, -4.26068115234375, -4.087646484375, -3.91461181640625, -3.7415771484375, -3.56854248046875, -3.3955078125, -3.22247314453125, -3.0494384765625, -2.87640380859375, -2.703369140625, -2.53033447265625, -2.3572998046875, -2.18426513671875, -2.01123046875, -1.83819580078125, -1.6651611328125, -1.49212646484375, -1.319091796875, -1.14605712890625, -0.9730224609375, -0.79998779296875, -0.626953125, -0.45391845703125, -0.2808837890625, -0.10784912109375, 0.065185546875, 0.23822021484375, 0.4112548828125, 0.58428955078125, 0.75732421875, 0.93035888671875, 1.1033935546875, 1.27642822265625, 1.449462890625, 1.62249755859375, 1.7955322265625, 1.96856689453125, 2.1416015625, 2.31463623046875, 2.4876708984375, 2.66070556640625, 2.833740234375, 3.00677490234375, 3.1798095703125, 3.35284423828125, 3.52587890625, 3.69891357421875, 3.8719482421875, 4.04498291015625, 4.218017578125, 4.39105224609375, 4.5640869140625, 4.73712158203125, 4.91015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 12.0, 12.0, 24.0, 29.0, 32.0, 61.0, 54.0, 76.0, 80.0, 84.0, 87.0, 73.0, 81.0, 68.0, 55.0, 35.0, 34.0, 20.0, 16.0, 21.0, 6.0, 8.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.515380859375, -4.37451171875, -4.233642578125, -4.0927734375, -3.951904296875, -3.81103515625, -3.670166015625, -3.529296875, -3.388427734375, -3.24755859375, -3.106689453125, -2.9658203125, -2.824951171875, -2.68408203125, -2.543212890625, -2.40234375, -2.261474609375, -2.12060546875, -1.979736328125, -1.8388671875, -1.697998046875, -1.55712890625, -1.416259765625, -1.275390625, -1.134521484375, -0.99365234375, -0.852783203125, -0.7119140625, -0.571044921875, -0.43017578125, -0.289306640625, -0.1484375, -0.007568359375, 0.13330078125, 0.274169921875, 0.4150390625, 0.555908203125, 0.69677734375, 0.837646484375, 0.978515625, 1.119384765625, 1.26025390625, 1.401123046875, 1.5419921875, 1.682861328125, 1.82373046875, 1.964599609375, 2.10546875, 2.246337890625, 2.38720703125, 2.528076171875, 2.6689453125, 2.809814453125, 2.95068359375, 3.091552734375, 3.232421875, 3.373291015625, 3.51416015625, 3.655029296875, 3.7958984375, 3.936767578125, 4.07763671875, 4.218505859375, 4.359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 44.0, 114.0, 212.0, 261.0, 204.0, 113.0, 35.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.90145874023438, -152.48587036132812, -148.07029724121094, -143.6547088623047, -139.2391357421875, -134.82354736328125, -130.407958984375, -125.99237823486328, -121.57679748535156, -117.16121673583984, -112.74563598632812, -108.33004760742188, -103.91446685791016, -99.49888610839844, -95.08329772949219, -90.66771697998047, -86.25213623046875, -81.83655548095703, -77.42097473144531, -73.00538635253906, -68.58980560302734, -64.17422485351562, -59.75864028930664, -55.343055725097656, -50.92747497558594, -46.51189422607422, -42.096309661865234, -37.68072509765625, -33.26514434814453, -28.84956169128418, -24.433979034423828, -20.018396377563477, -15.602813720703125, -11.187231063842773, -6.771648406982422, -2.3560657501220703, 2.0595169067382812, 6.475099563598633, 10.890682220458984, 15.306264877319336, 19.721847534179688, 24.13743019104004, 28.55301284790039, 32.968597412109375, 37.384178161621094, 41.79975891113281, 46.2153434753418, 50.63092803955078, 55.0465087890625, 59.46208953857422, 63.8776741027832, 68.29325866699219, 72.7088394165039, 77.12442016601562, 81.54000854492188, 85.9555892944336, 90.37117004394531, 94.78675079345703, 99.20233154296875, 103.617919921875, 108.03350067138672, 112.44908142089844, 116.86466979980469, 121.2802505493164, 125.69583129882812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 6.0, 6.0, 8.0, 12.0, 7.0, 10.0, 9.0, 18.0, 16.0, 22.0, 27.0, 23.0, 38.0, 33.0, 34.0, 37.0, 44.0, 50.0, 46.0, 35.0, 46.0, 54.0, 50.0, 40.0, 49.0, 32.0, 36.0, 25.0, 21.0, 29.0, 16.0, 26.0, 17.0, 11.0, 11.0, 12.0, 12.0, 3.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-51.0140380859375, -49.59974670410156, -48.18545150756836, -46.77116012573242, -45.35686492919922, -43.94257354736328, -42.528282165527344, -41.11398696899414, -39.69969177246094, -38.285400390625, -36.8711051940918, -35.45681381225586, -34.042518615722656, -32.62822723388672, -31.21393394470215, -29.799640655517578, -28.38534927368164, -26.97105598449707, -25.5567626953125, -24.142471313476562, -22.72817611694336, -21.313884735107422, -19.89959144592285, -18.48529815673828, -17.07100486755371, -15.65671157836914, -14.24241828918457, -12.828125953674316, -11.413832664489746, -9.999539375305176, -8.585247039794922, -7.170953750610352, -5.756660461425781, -4.342367172241211, -2.928074359893799, -1.5137815475463867, -0.0994882583618164, 1.314805030822754, 2.729097366333008, 4.143390655517578, 5.557683944702148, 6.971977233886719, 8.386270523071289, 9.800562858581543, 11.214856147766113, 12.629149436950684, 14.043441772460938, 15.457735061645508, 16.872028350830078, 18.28632164001465, 19.70061492919922, 21.114906311035156, 22.52920150756836, 23.943492889404297, 25.357786178588867, 26.772079467773438, 28.186372756958008, 29.600666046142578, 31.01495933532715, 32.42925262451172, 33.843544006347656, 35.25783920288086, 36.6721305847168, 38.08642578125, 39.50071716308594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 6.0, 5.0, 5.0, 10.0, 18.0, 23.0, 26.0, 33.0, 37.0, 47.0, 68.0, 98.0, 149.0, 189.0, 298.0, 496.0, 995.0, 2139.0, 5790.0, 29592.0, 3968563.0, 164557.0, 13992.0, 3625.0, 1502.0, 779.0, 395.0, 232.0, 165.0, 104.0, 90.0, 47.0, 52.0, 35.0, 22.0, 19.0, 23.0, 18.0, 9.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.616943359375, -13.10888671875, -12.600830078125, -12.0927734375, -11.584716796875, -11.07666015625, -10.568603515625, -10.060546875, -9.552490234375, -9.04443359375, -8.536376953125, -8.0283203125, -7.520263671875, -7.01220703125, -6.504150390625, -5.99609375, -5.488037109375, -4.97998046875, -4.471923828125, -3.9638671875, -3.455810546875, -2.94775390625, -2.439697265625, -1.931640625, -1.423583984375, -0.91552734375, -0.407470703125, 0.1005859375, 0.608642578125, 1.11669921875, 1.624755859375, 2.1328125, 2.640869140625, 3.14892578125, 3.656982421875, 4.1650390625, 4.673095703125, 5.18115234375, 5.689208984375, 6.197265625, 6.705322265625, 7.21337890625, 7.721435546875, 8.2294921875, 8.737548828125, 9.24560546875, 9.753662109375, 10.26171875, 10.769775390625, 11.27783203125, 11.785888671875, 12.2939453125, 12.802001953125, 13.31005859375, 13.818115234375, 14.326171875, 14.834228515625, 15.34228515625, 15.850341796875, 16.3583984375, 16.866455078125, 17.37451171875, 17.882568359375, 18.390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 11.0, 9.0, 13.0, 17.0, 17.0, 17.0, 22.0, 32.0, 35.0, 38.0, 32.0, 39.0, 45.0, 50.0, 44.0, 49.0, 40.0, 39.0, 34.0, 51.0, 33.0, 37.0, 37.0, 42.0, 33.0, 30.0, 16.0, 21.0, 21.0, 16.0, 5.0, 15.0, 10.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.751953125, -1.6958160400390625, -1.639678955078125, -1.5835418701171875, -1.52740478515625, -1.4712677001953125, -1.415130615234375, -1.3589935302734375, -1.3028564453125, -1.2467193603515625, -1.190582275390625, -1.1344451904296875, -1.07830810546875, -1.0221710205078125, -0.966033935546875, -0.9098968505859375, -0.853759765625, -0.7976226806640625, -0.741485595703125, -0.6853485107421875, -0.62921142578125, -0.5730743408203125, -0.516937255859375, -0.4608001708984375, -0.4046630859375, -0.3485260009765625, -0.292388916015625, -0.2362518310546875, -0.18011474609375, -0.1239776611328125, -0.067840576171875, -0.0117034912109375, 0.04443359375, 0.1005706787109375, 0.156707763671875, 0.2128448486328125, 0.26898193359375, 0.3251190185546875, 0.381256103515625, 0.4373931884765625, 0.4935302734375, 0.5496673583984375, 0.605804443359375, 0.6619415283203125, 0.71807861328125, 0.7742156982421875, 0.830352783203125, 0.8864898681640625, 0.942626953125, 0.9987640380859375, 1.054901123046875, 1.1110382080078125, 1.16717529296875, 1.2233123779296875, 1.279449462890625, 1.3355865478515625, 1.3917236328125, 1.4478607177734375, 1.503997802734375, 1.5601348876953125, 1.61627197265625, 1.6724090576171875, 1.728546142578125, 1.7846832275390625, 1.8408203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 5.0, 10.0, 10.0, 15.0, 14.0, 22.0, 32.0, 45.0, 51.0, 78.0, 116.0, 172.0, 271.0, 454.0, 903.0, 2026.0, 6745.0, 56093.0, 4082111.0, 35922.0, 5416.0, 1752.0, 795.0, 407.0, 243.0, 154.0, 117.0, 90.0, 56.0, 39.0, 24.0, 25.0, 16.0, 15.0, 12.0, 1.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.095703125, -26.28515625, -25.474609375, -24.6640625, -23.853515625, -23.04296875, -22.232421875, -21.421875, -20.611328125, -19.80078125, -18.990234375, -18.1796875, -17.369140625, -16.55859375, -15.748046875, -14.9375, -14.126953125, -13.31640625, -12.505859375, -11.6953125, -10.884765625, -10.07421875, -9.263671875, -8.453125, -7.642578125, -6.83203125, -6.021484375, -5.2109375, -4.400390625, -3.58984375, -2.779296875, -1.96875, -1.158203125, -0.34765625, 0.462890625, 1.2734375, 2.083984375, 2.89453125, 3.705078125, 4.515625, 5.326171875, 6.13671875, 6.947265625, 7.7578125, 8.568359375, 9.37890625, 10.189453125, 11.0, 11.810546875, 12.62109375, 13.431640625, 14.2421875, 15.052734375, 15.86328125, 16.673828125, 17.484375, 18.294921875, 19.10546875, 19.916015625, 20.7265625, 21.537109375, 22.34765625, 23.158203125, 23.96875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 9.0, 4.0, 12.0, 19.0, 33.0, 85.0, 586.0, 3103.0, 143.0, 38.0, 15.0, 13.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.46875, -5.3323974609375, -5.196044921875, -5.0596923828125, -4.92333984375, -4.7869873046875, -4.650634765625, -4.5142822265625, -4.3779296875, -4.2415771484375, -4.105224609375, -3.9688720703125, -3.83251953125, -3.6961669921875, -3.559814453125, -3.4234619140625, -3.287109375, -3.1507568359375, -3.014404296875, -2.8780517578125, -2.74169921875, -2.6053466796875, -2.468994140625, -2.3326416015625, -2.1962890625, -2.0599365234375, -1.923583984375, -1.7872314453125, -1.65087890625, -1.5145263671875, -1.378173828125, -1.2418212890625, -1.10546875, -0.9691162109375, -0.832763671875, -0.6964111328125, -0.56005859375, -0.4237060546875, -0.287353515625, -0.1510009765625, -0.0146484375, 0.1217041015625, 0.258056640625, 0.3944091796875, 0.53076171875, 0.6671142578125, 0.803466796875, 0.9398193359375, 1.076171875, 1.2125244140625, 1.348876953125, 1.4852294921875, 1.62158203125, 1.7579345703125, 1.894287109375, 2.0306396484375, 2.1669921875, 2.3033447265625, 2.439697265625, 2.5760498046875, 2.71240234375, 2.8487548828125, 2.985107421875, 3.1214599609375, 3.2578125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 4.0, 5.0, 9.0, 7.0, 12.0, 16.0, 11.0, 28.0, 33.0, 64.0, 67.0, 92.0, 102.0, 120.0, 107.0, 95.0, 74.0, 38.0, 37.0, 28.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.764802932739258, -12.39647102355957, -12.028138160705566, -11.659806251525879, -11.291474342346191, -10.923141479492188, -10.5548095703125, -10.186477661132812, -9.818144798278809, -9.449812889099121, -9.081480026245117, -8.71314811706543, -8.344816207885742, -7.976483345031738, -7.608151435852051, -7.239819049835205, -6.871487140655518, -6.503154754638672, -6.134822845458984, -5.766490459442139, -5.398158073425293, -5.0298261642456055, -4.66149377822876, -4.293161392211914, -3.9248292446136475, -3.556497097015381, -3.188164710998535, -2.8198325634002686, -2.451500415802002, -2.0831680297851562, -1.7148358821868896, -1.346503496170044, -0.9781713485717773, -0.6098390817642212, -0.24150687456130981, 0.12682533264160156, 0.4951575994491577, 0.8634898662567139, 1.2318220138549805, 1.6001543998718262, 1.9684865474700928, 2.3368186950683594, 2.705151081085205, 3.0734832286834717, 3.4418153762817383, 3.810147762298584, 4.17848014831543, 4.546812057495117, 4.915144443511963, 5.283476829528809, 5.651808738708496, 6.020141124725342, 6.3884735107421875, 6.756805419921875, 7.125137805938721, 7.493470191955566, 7.861802101135254, 8.230134010314941, 8.598466873168945, 8.966798782348633, 9.33513069152832, 9.703463554382324, 10.071795463562012, 10.440128326416016, 10.808460235595703]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 12.0, 8.0, 6.0, 16.0, 14.0, 12.0, 11.0, 24.0, 23.0, 30.0, 27.0, 38.0, 44.0, 47.0, 49.0, 43.0, 50.0, 41.0, 42.0, 53.0, 52.0, 51.0, 35.0, 40.0, 38.0, 39.0, 11.0, 28.0, 22.0, 13.0, 19.0, 4.0, 12.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.845468521118164, -8.60477066040039, -8.364072799682617, -8.123374938964844, -7.882676601409912, -7.6419782638549805, -7.401280403137207, -7.160582542419434, -6.91988468170166, -6.679186820983887, -6.438488483428955, -6.197790622711182, -5.957092761993408, -5.716394424438477, -5.475696563720703, -5.23499870300293, -4.994300365447998, -4.753602504730225, -4.512904167175293, -4.2722063064575195, -4.031508445739746, -3.7908103466033936, -3.550112247467041, -3.3094143867492676, -3.068716287612915, -2.8280181884765625, -2.587320327758789, -2.3466222286224365, -2.105924129486084, -1.8652262687683105, -1.624528169631958, -1.383830189704895, -1.1431326866149902, -0.9024347066879272, -0.6617366671562195, -0.4210386276245117, -0.18034064769744873, 0.06035733222961426, 0.3010554313659668, 0.5417534112930298, 0.7824513912200928, 1.0231493711471558, 1.2638473510742188, 1.5045454502105713, 1.7452434301376343, 1.9859414100646973, 2.22663950920105, 2.4673376083374023, 2.708035469055176, 2.9487335681915283, 3.1894314289093018, 3.4301295280456543, 3.6708273887634277, 3.9115254878997803, 4.152223587036133, 4.392921447753906, 4.63361930847168, 4.874317169189453, 5.115015506744385, 5.355713367462158, 5.596411228179932, 5.837109565734863, 6.077807426452637, 6.31850528717041, 6.559203624725342]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 21.0, 18.0, 17.0, 38.0, 54.0, 66.0, 102.0, 215.0, 409.0, 888.0, 1923.0, 4656.0, 12158.0, 32324.0, 85912.0, 206074.0, 326035.0, 222988.0, 95473.0, 36137.0, 13625.0, 5288.0, 2116.0, 917.0, 466.0, 224.0, 125.0, 76.0, 47.0, 38.0, 30.0, 16.0, 15.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6396484375, -5.455078125, -5.2705078125, -5.0859375, -4.9013671875, -4.716796875, -4.5322265625, -4.34765625, -4.1630859375, -3.978515625, -3.7939453125, -3.609375, -3.4248046875, -3.240234375, -3.0556640625, -2.87109375, -2.6865234375, -2.501953125, -2.3173828125, -2.1328125, -1.9482421875, -1.763671875, -1.5791015625, -1.39453125, -1.2099609375, -1.025390625, -0.8408203125, -0.65625, -0.4716796875, -0.287109375, -0.1025390625, 0.08203125, 0.2666015625, 0.451171875, 0.6357421875, 0.8203125, 1.0048828125, 1.189453125, 1.3740234375, 1.55859375, 1.7431640625, 1.927734375, 2.1123046875, 2.296875, 2.4814453125, 2.666015625, 2.8505859375, 3.03515625, 3.2197265625, 3.404296875, 3.5888671875, 3.7734375, 3.9580078125, 4.142578125, 4.3271484375, 4.51171875, 4.6962890625, 4.880859375, 5.0654296875, 5.25, 5.4345703125, 5.619140625, 5.8037109375, 5.98828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 14.0, 18.0, 22.0, 22.0, 25.0, 37.0, 44.0, 37.0, 45.0, 51.0, 45.0, 43.0, 46.0, 52.0, 47.0, 53.0, 43.0, 39.0, 41.0, 38.0, 26.0, 32.0, 20.0, 24.0, 17.0, 15.0, 10.0, 11.0, 6.0, 2.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1846923828125, -2.115478515625, -2.0462646484375, -1.97705078125, -1.9078369140625, -1.838623046875, -1.7694091796875, -1.7001953125, -1.6309814453125, -1.561767578125, -1.4925537109375, -1.42333984375, -1.3541259765625, -1.284912109375, -1.2156982421875, -1.146484375, -1.0772705078125, -1.008056640625, -0.9388427734375, -0.86962890625, -0.8004150390625, -0.731201171875, -0.6619873046875, -0.5927734375, -0.5235595703125, -0.454345703125, -0.3851318359375, -0.31591796875, -0.2467041015625, -0.177490234375, -0.1082763671875, -0.0390625, 0.0301513671875, 0.099365234375, 0.1685791015625, 0.23779296875, 0.3070068359375, 0.376220703125, 0.4454345703125, 0.5146484375, 0.5838623046875, 0.653076171875, 0.7222900390625, 0.79150390625, 0.8607177734375, 0.929931640625, 0.9991455078125, 1.068359375, 1.1375732421875, 1.206787109375, 1.2760009765625, 1.34521484375, 1.4144287109375, 1.483642578125, 1.5528564453125, 1.6220703125, 1.6912841796875, 1.760498046875, 1.8297119140625, 1.89892578125, 1.9681396484375, 2.037353515625, 2.1065673828125, 2.17578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 9.0, 8.0, 17.0, 16.0, 33.0, 29.0, 56.0, 80.0, 123.0, 187.0, 275.0, 435.0, 809.0, 1753.0, 5829.0, 48308.0, 611235.0, 347237.0, 25164.0, 3858.0, 1328.0, 630.0, 403.0, 245.0, 173.0, 91.0, 71.0, 45.0, 28.0, 16.0, 15.0, 16.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.8046875, -15.3087158203125, -14.812744140625, -14.3167724609375, -13.82080078125, -13.3248291015625, -12.828857421875, -12.3328857421875, -11.8369140625, -11.3409423828125, -10.844970703125, -10.3489990234375, -9.85302734375, -9.3570556640625, -8.861083984375, -8.3651123046875, -7.869140625, -7.3731689453125, -6.877197265625, -6.3812255859375, -5.88525390625, -5.3892822265625, -4.893310546875, -4.3973388671875, -3.9013671875, -3.4053955078125, -2.909423828125, -2.4134521484375, -1.91748046875, -1.4215087890625, -0.925537109375, -0.4295654296875, 0.06640625, 0.5623779296875, 1.058349609375, 1.5543212890625, 2.05029296875, 2.5462646484375, 3.042236328125, 3.5382080078125, 4.0341796875, 4.5301513671875, 5.026123046875, 5.5220947265625, 6.01806640625, 6.5140380859375, 7.010009765625, 7.5059814453125, 8.001953125, 8.4979248046875, 8.993896484375, 9.4898681640625, 9.98583984375, 10.4818115234375, 10.977783203125, 11.4737548828125, 11.9697265625, 12.4656982421875, 12.961669921875, 13.4576416015625, 13.95361328125, 14.4495849609375, 14.945556640625, 15.4415283203125, 15.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 12.0, 8.0, 9.0, 16.0, 15.0, 27.0, 26.0, 30.0, 30.0, 35.0, 38.0, 45.0, 34.0, 57.0, 50.0, 56.0, 56.0, 45.0, 49.0, 54.0, 43.0, 40.0, 42.0, 30.0, 25.0, 24.0, 15.0, 22.0, 12.0, 14.0, 4.0, 6.0, 7.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -14.0411376953125, -13.644775390625, -13.2484130859375, -12.85205078125, -12.4556884765625, -12.059326171875, -11.6629638671875, -11.2666015625, -10.8702392578125, -10.473876953125, -10.0775146484375, -9.68115234375, -9.2847900390625, -8.888427734375, -8.4920654296875, -8.095703125, -7.6993408203125, -7.302978515625, -6.9066162109375, -6.51025390625, -6.1138916015625, -5.717529296875, -5.3211669921875, -4.9248046875, -4.5284423828125, -4.132080078125, -3.7357177734375, -3.33935546875, -2.9429931640625, -2.546630859375, -2.1502685546875, -1.75390625, -1.3575439453125, -0.961181640625, -0.5648193359375, -0.16845703125, 0.2279052734375, 0.624267578125, 1.0206298828125, 1.4169921875, 1.8133544921875, 2.209716796875, 2.6060791015625, 3.00244140625, 3.3988037109375, 3.795166015625, 4.1915283203125, 4.587890625, 4.9842529296875, 5.380615234375, 5.7769775390625, 6.17333984375, 6.5697021484375, 6.966064453125, 7.3624267578125, 7.7587890625, 8.1551513671875, 8.551513671875, 8.9478759765625, 9.34423828125, 9.7406005859375, 10.136962890625, 10.5333251953125, 10.9296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 7.0, 12.0, 7.0, 27.0, 49.0, 121.0, 169.0, 336.0, 774.0, 1882.0, 5900.0, 25663.0, 167466.0, 623996.0, 184106.0, 28100.0, 6330.0, 2014.0, 797.0, 365.0, 176.0, 107.0, 64.0, 30.0, 21.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.91558837890625, -3.7491455078125, -3.58270263671875, -3.416259765625, -3.24981689453125, -3.0833740234375, -2.91693115234375, -2.75048828125, -2.58404541015625, -2.4176025390625, -2.25115966796875, -2.084716796875, -1.91827392578125, -1.7518310546875, -1.58538818359375, -1.4189453125, -1.25250244140625, -1.0860595703125, -0.91961669921875, -0.753173828125, -0.58673095703125, -0.4202880859375, -0.25384521484375, -0.08740234375, 0.07904052734375, 0.2454833984375, 0.41192626953125, 0.578369140625, 0.74481201171875, 0.9112548828125, 1.07769775390625, 1.244140625, 1.41058349609375, 1.5770263671875, 1.74346923828125, 1.909912109375, 2.07635498046875, 2.2427978515625, 2.40924072265625, 2.57568359375, 2.74212646484375, 2.9085693359375, 3.07501220703125, 3.241455078125, 3.40789794921875, 3.5743408203125, 3.74078369140625, 3.9072265625, 4.07366943359375, 4.2401123046875, 4.40655517578125, 4.572998046875, 4.73944091796875, 4.9058837890625, 5.07232666015625, 5.23876953125, 5.40521240234375, 5.5716552734375, 5.73809814453125, 5.904541015625, 6.07098388671875, 6.2374267578125, 6.40386962890625, 6.5703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 7.0, 15.0, 10.0, 12.0, 25.0, 30.0, 33.0, 39.0, 47.0, 56.0, 66.0, 65.0, 69.0, 64.0, 50.0, 51.0, 49.0, 39.0, 37.0, 40.0, 32.0, 34.0, 24.0, 19.0, 12.0, 13.0, 7.0, 7.0, 9.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0006237030029296875, -0.0006044954061508179, -0.0005852878093719482, -0.0005660802125930786, -0.000546872615814209, -0.0005276650190353394, -0.0005084574222564697, -0.0004892498254776001, -0.00047004222869873047, -0.00045083463191986084, -0.0004316270351409912, -0.0004124194383621216, -0.00039321184158325195, -0.0003740042448043823, -0.0003547966480255127, -0.00033558905124664307, -0.00031638145446777344, -0.0002971738576889038, -0.0002779662609100342, -0.00025875866413116455, -0.00023955106735229492, -0.0002203434705734253, -0.00020113587379455566, -0.00018192827701568604, -0.0001627206802368164, -0.00014351308345794678, -0.00012430548667907715, -0.00010509788990020752, -8.589029312133789e-05, -6.668269634246826e-05, -4.747509956359863e-05, -2.8267502784729004e-05, -9.059906005859375e-06, 1.0147690773010254e-05, 2.9355287551879883e-05, 4.856288433074951e-05, 6.777048110961914e-05, 8.697807788848877e-05, 0.0001061856746673584, 0.00012539327144622803, 0.00014460086822509766, 0.00016380846500396729, 0.00018301606178283691, 0.00020222365856170654, 0.00022143125534057617, 0.0002406388521194458, 0.00025984644889831543, 0.00027905404567718506, 0.0002982616424560547, 0.0003174692392349243, 0.00033667683601379395, 0.0003558844327926636, 0.0003750920295715332, 0.00039429962635040283, 0.00041350722312927246, 0.0004327148199081421, 0.0004519224166870117, 0.00047113001346588135, 0.000490337610244751, 0.0005095452070236206, 0.0005287528038024902, 0.0005479604005813599, 0.0005671679973602295, 0.0005863755941390991, 0.0006055831909179688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 11.0, 12.0, 16.0, 27.0, 48.0, 64.0, 106.0, 188.0, 340.0, 684.0, 1840.0, 5515.0, 34148.0, 451007.0, 506532.0, 38616.0, 5961.0, 1827.0, 734.0, 370.0, 201.0, 109.0, 62.0, 46.0, 30.0, 18.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.8297119140625, -6.616455078125, -6.4031982421875, -6.18994140625, -5.9766845703125, -5.763427734375, -5.5501708984375, -5.3369140625, -5.1236572265625, -4.910400390625, -4.6971435546875, -4.48388671875, -4.2706298828125, -4.057373046875, -3.8441162109375, -3.630859375, -3.4176025390625, -3.204345703125, -2.9910888671875, -2.77783203125, -2.5645751953125, -2.351318359375, -2.1380615234375, -1.9248046875, -1.7115478515625, -1.498291015625, -1.2850341796875, -1.07177734375, -0.8585205078125, -0.645263671875, -0.4320068359375, -0.21875, -0.0054931640625, 0.207763671875, 0.4210205078125, 0.63427734375, 0.8475341796875, 1.060791015625, 1.2740478515625, 1.4873046875, 1.7005615234375, 1.913818359375, 2.1270751953125, 2.34033203125, 2.5535888671875, 2.766845703125, 2.9801025390625, 3.193359375, 3.4066162109375, 3.619873046875, 3.8331298828125, 4.04638671875, 4.2596435546875, 4.472900390625, 4.6861572265625, 4.8994140625, 5.1126708984375, 5.325927734375, 5.5391845703125, 5.75244140625, 5.9656982421875, 6.178955078125, 6.3922119140625, 6.60546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 15.0, 9.0, 21.0, 23.0, 22.0, 42.0, 59.0, 67.0, 68.0, 90.0, 97.0, 89.0, 66.0, 71.0, 52.0, 43.0, 30.0, 32.0, 29.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.580535888671875, -3.44036865234375, -3.300201416015625, -3.1600341796875, -3.019866943359375, -2.87969970703125, -2.739532470703125, -2.599365234375, -2.459197998046875, -2.31903076171875, -2.178863525390625, -2.0386962890625, -1.898529052734375, -1.75836181640625, -1.618194580078125, -1.47802734375, -1.337860107421875, -1.19769287109375, -1.057525634765625, -0.9173583984375, -0.777191162109375, -0.63702392578125, -0.496856689453125, -0.356689453125, -0.216522216796875, -0.07635498046875, 0.063812255859375, 0.2039794921875, 0.344146728515625, 0.48431396484375, 0.624481201171875, 0.7646484375, 0.904815673828125, 1.04498291015625, 1.185150146484375, 1.3253173828125, 1.465484619140625, 1.60565185546875, 1.745819091796875, 1.885986328125, 2.026153564453125, 2.16632080078125, 2.306488037109375, 2.4466552734375, 2.586822509765625, 2.72698974609375, 2.867156982421875, 3.00732421875, 3.147491455078125, 3.28765869140625, 3.427825927734375, 3.5679931640625, 3.708160400390625, 3.84832763671875, 3.988494873046875, 4.128662109375, 4.268829345703125, 4.40899658203125, 4.549163818359375, 4.6893310546875, 4.829498291015625, 4.96966552734375, 5.109832763671875, 5.25]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 10.0, 13.0, 42.0, 117.0, 157.0, 193.0, 209.0, 137.0, 77.0, 25.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.56956481933594, -191.56192016601562, -187.55426025390625, -183.54661560058594, -179.53897094726562, -175.53131103515625, -171.52366638183594, -167.51600646972656, -163.50836181640625, -159.50071716308594, -155.49305725097656, -151.48541259765625, -147.47775268554688, -143.47010803222656, -139.46246337890625, -135.45480346679688, -131.44715881347656, -127.43950653076172, -123.43185424804688, -119.42420959472656, -115.41655731201172, -111.40890502929688, -107.40126037597656, -103.39360809326172, -99.38595581054688, -95.37830352783203, -91.37065124511719, -87.36300659179688, -83.35535430908203, -79.34770202636719, -75.34005737304688, -71.33240509033203, -67.32474517822266, -63.31709289550781, -59.309444427490234, -55.301795959472656, -51.29414367675781, -47.28649139404297, -43.27884292602539, -39.27119445800781, -35.26354217529297, -31.255891799926758, -27.248241424560547, -23.240591049194336, -19.232940673828125, -15.225290298461914, -11.217639923095703, -7.209989547729492, -3.2023391723632812, 0.8053112030029297, 4.812961578369141, 8.820611953735352, 12.828262329101562, 16.835912704467773, 20.843563079833984, 24.851213455200195, 28.858863830566406, 32.86651611328125, 36.87416458129883, 40.881813049316406, 44.88946533203125, 48.897117614746094, 52.90476608276367, 56.91241455078125, 60.920066833496094]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 8.0, 10.0, 14.0, 11.0, 15.0, 13.0, 23.0, 21.0, 26.0, 32.0, 26.0, 36.0, 40.0, 39.0, 59.0, 52.0, 51.0, 41.0, 45.0, 58.0, 43.0, 45.0, 34.0, 37.0, 37.0, 24.0, 32.0, 19.0, 23.0, 14.0, 14.0, 9.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-63.24349594116211, -61.334815979003906, -59.4261360168457, -57.517452239990234, -55.60877227783203, -53.70009231567383, -51.791412353515625, -49.882728576660156, -47.97404861450195, -46.06536865234375, -44.15668869018555, -42.24800491333008, -40.339324951171875, -38.43064498901367, -36.52196502685547, -34.61328125, -32.70460510253906, -30.79592514038086, -28.887243270874023, -26.97856330871582, -25.069881439208984, -23.16120147705078, -21.252521514892578, -19.343839645385742, -17.435157775878906, -15.526476860046387, -13.617795944213867, -11.709115982055664, -9.800434112548828, -7.891754150390625, -5.9830732345581055, -4.074392318725586, -2.16571044921875, -0.25702965259552, 1.65165114402771, 3.5603318214416504, 5.46901273727417, 7.377693176269531, 9.28637409210205, 11.19505500793457, 13.10373592376709, 15.01241683959961, 16.921096801757812, 18.82977867126465, 20.73845863342285, 22.647140502929688, 24.55582046508789, 26.464500427246094, 28.37318229675293, 30.281862258911133, 32.19054412841797, 34.09922409057617, 36.007904052734375, 37.916587829589844, 39.82526779174805, 41.73394775390625, 43.64262771606445, 45.551307678222656, 47.45998764038086, 49.36867141723633, 51.27735137939453, 53.186031341552734, 55.09471130371094, 57.003395080566406, 58.91207504272461]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 10.0, 12.0, 15.0, 14.0, 20.0, 31.0, 32.0, 51.0, 50.0, 105.0, 121.0, 151.0, 210.0, 323.0, 521.0, 789.0, 1240.0, 2353.0, 4933.0, 13878.0, 66065.0, 3908739.0, 158010.0, 22304.0, 6869.0, 2957.0, 1553.0, 946.0, 588.0, 381.0, 231.0, 215.0, 148.0, 94.0, 86.0, 39.0, 44.0, 43.0, 19.0, 21.0, 16.0, 11.0, 11.0, 5.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.984375, -9.6788330078125, -9.373291015625, -9.0677490234375, -8.76220703125, -8.4566650390625, -8.151123046875, -7.8455810546875, -7.5400390625, -7.2344970703125, -6.928955078125, -6.6234130859375, -6.31787109375, -6.0123291015625, -5.706787109375, -5.4012451171875, -5.095703125, -4.7901611328125, -4.484619140625, -4.1790771484375, -3.87353515625, -3.5679931640625, -3.262451171875, -2.9569091796875, -2.6513671875, -2.3458251953125, -2.040283203125, -1.7347412109375, -1.42919921875, -1.1236572265625, -0.818115234375, -0.5125732421875, -0.20703125, 0.0985107421875, 0.404052734375, 0.7095947265625, 1.01513671875, 1.3206787109375, 1.626220703125, 1.9317626953125, 2.2373046875, 2.5428466796875, 2.848388671875, 3.1539306640625, 3.45947265625, 3.7650146484375, 4.070556640625, 4.3760986328125, 4.681640625, 4.9871826171875, 5.292724609375, 5.5982666015625, 5.90380859375, 6.2093505859375, 6.514892578125, 6.8204345703125, 7.1259765625, 7.4315185546875, 7.737060546875, 8.0426025390625, 8.34814453125, 8.6536865234375, 8.959228515625, 9.2647705078125, 9.5703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 8.0, 6.0, 8.0, 12.0, 11.0, 15.0, 17.0, 21.0, 16.0, 28.0, 34.0, 31.0, 46.0, 41.0, 55.0, 54.0, 62.0, 50.0, 55.0, 35.0, 45.0, 52.0, 37.0, 36.0, 48.0, 33.0, 38.0, 19.0, 12.0, 14.0, 9.0, 8.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.02862548828125, -1.9576416015625, -1.88665771484375, -1.815673828125, -1.74468994140625, -1.6737060546875, -1.60272216796875, -1.53173828125, -1.46075439453125, -1.3897705078125, -1.31878662109375, -1.247802734375, -1.17681884765625, -1.1058349609375, -1.03485107421875, -0.9638671875, -0.89288330078125, -0.8218994140625, -0.75091552734375, -0.679931640625, -0.60894775390625, -0.5379638671875, -0.46697998046875, -0.39599609375, -0.32501220703125, -0.2540283203125, -0.18304443359375, -0.112060546875, -0.04107666015625, 0.0299072265625, 0.10089111328125, 0.171875, 0.24285888671875, 0.3138427734375, 0.38482666015625, 0.455810546875, 0.52679443359375, 0.5977783203125, 0.66876220703125, 0.73974609375, 0.81072998046875, 0.8817138671875, 0.95269775390625, 1.023681640625, 1.09466552734375, 1.1656494140625, 1.23663330078125, 1.3076171875, 1.37860107421875, 1.4495849609375, 1.52056884765625, 1.591552734375, 1.66253662109375, 1.7335205078125, 1.80450439453125, 1.87548828125, 1.94647216796875, 2.0174560546875, 2.08843994140625, 2.159423828125, 2.23040771484375, 2.3013916015625, 2.37237548828125, 2.443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 12.0, 13.0, 19.0, 31.0, 34.0, 49.0, 61.0, 107.0, 114.0, 167.0, 208.0, 316.0, 438.0, 636.0, 921.0, 1553.0, 2748.0, 5291.0, 12994.0, 48045.0, 855638.0, 3185841.0, 52206.0, 13578.0, 5548.0, 2789.0, 1584.0, 1050.0, 667.0, 418.0, 313.0, 224.0, 158.0, 137.0, 96.0, 79.0, 46.0, 34.0, 26.0, 18.0, 13.0, 11.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9609375, -9.64990234375, -9.3388671875, -9.02783203125, -8.716796875, -8.40576171875, -8.0947265625, -7.78369140625, -7.47265625, -7.16162109375, -6.8505859375, -6.53955078125, -6.228515625, -5.91748046875, -5.6064453125, -5.29541015625, -4.984375, -4.67333984375, -4.3623046875, -4.05126953125, -3.740234375, -3.42919921875, -3.1181640625, -2.80712890625, -2.49609375, -2.18505859375, -1.8740234375, -1.56298828125, -1.251953125, -0.94091796875, -0.6298828125, -0.31884765625, -0.0078125, 0.30322265625, 0.6142578125, 0.92529296875, 1.236328125, 1.54736328125, 1.8583984375, 2.16943359375, 2.48046875, 2.79150390625, 3.1025390625, 3.41357421875, 3.724609375, 4.03564453125, 4.3466796875, 4.65771484375, 4.96875, 5.27978515625, 5.5908203125, 5.90185546875, 6.212890625, 6.52392578125, 6.8349609375, 7.14599609375, 7.45703125, 7.76806640625, 8.0791015625, 8.39013671875, 8.701171875, 9.01220703125, 9.3232421875, 9.63427734375, 9.9453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 1.0, 4.0, 7.0, 14.0, 22.0, 37.0, 72.0, 163.0, 2689.0, 710.0, 156.0, 79.0, 33.0, 21.0, 17.0, 9.0, 6.0, 9.0, 1.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.663787841796875, -2.57171630859375, -2.479644775390625, -2.3875732421875, -2.295501708984375, -2.20343017578125, -2.111358642578125, -2.019287109375, -1.927215576171875, -1.83514404296875, -1.743072509765625, -1.6510009765625, -1.558929443359375, -1.46685791015625, -1.374786376953125, -1.28271484375, -1.190643310546875, -1.09857177734375, -1.006500244140625, -0.9144287109375, -0.822357177734375, -0.73028564453125, -0.638214111328125, -0.546142578125, -0.454071044921875, -0.36199951171875, -0.269927978515625, -0.1778564453125, -0.085784912109375, 0.00628662109375, 0.098358154296875, 0.1904296875, 0.282501220703125, 0.37457275390625, 0.466644287109375, 0.5587158203125, 0.650787353515625, 0.74285888671875, 0.834930419921875, 0.927001953125, 1.019073486328125, 1.11114501953125, 1.203216552734375, 1.2952880859375, 1.387359619140625, 1.47943115234375, 1.571502685546875, 1.66357421875, 1.755645751953125, 1.84771728515625, 1.939788818359375, 2.0318603515625, 2.123931884765625, 2.21600341796875, 2.308074951171875, 2.400146484375, 2.492218017578125, 2.58428955078125, 2.676361083984375, 2.7684326171875, 2.860504150390625, 2.95257568359375, 3.044647216796875, 3.13671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 24.0, 24.0, 18.0, 36.0, 65.0, 63.0, 63.0, 74.0, 72.0, 72.0, 66.0, 73.0, 59.0, 60.0, 43.0, 50.0, 26.0, 18.0, 15.0, 12.0, 8.0, 5.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.847022533416748, -6.5972065925598145, -6.347391128540039, -6.0975751876831055, -5.84775972366333, -5.5979437828063965, -5.348128318786621, -5.0983123779296875, -4.848496437072754, -4.59868049621582, -4.348865032196045, -4.099049091339111, -3.849233627319336, -3.5994176864624023, -3.349601984024048, -3.0997862815856934, -2.849970817565918, -2.6001551151275635, -2.350339412689209, -2.1005234718322754, -1.8507078886032104, -1.600892186164856, -1.351076364517212, -1.1012606620788574, -0.8514449596405029, -0.6016292572021484, -0.35181349515914917, -0.1019977331161499, 0.1478179693222046, 0.3976336717605591, 0.6474494934082031, 0.8972651958465576, 1.147080421447754, 1.3968961238861084, 1.646711826324463, 1.896527647972107, 2.146343231201172, 2.3961591720581055, 2.64597487449646, 2.8957905769348145, 3.145606279373169, 3.3954219818115234, 3.645237684249878, 3.8950533866882324, 4.144869327545166, 4.394684791564941, 4.644500732421875, 4.894316673278809, 5.144132137298584, 5.393948078155518, 5.643763542175293, 5.893579483032227, 6.143394947052002, 6.3932108879089355, 6.643026351928711, 6.8928422927856445, 7.142658233642578, 7.392474174499512, 7.642289638519287, 7.892105579376221, 8.141921043395996, 8.39173698425293, 8.641552925109863, 8.891368865966797, 9.141183853149414]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 9.0, 6.0, 11.0, 6.0, 13.0, 10.0, 13.0, 13.0, 22.0, 22.0, 12.0, 20.0, 35.0, 29.0, 46.0, 31.0, 35.0, 33.0, 46.0, 44.0, 37.0, 51.0, 42.0, 43.0, 44.0, 28.0, 32.0, 37.0, 36.0, 32.0, 25.0, 25.0, 15.0, 12.0, 14.0, 10.0, 11.0, 8.0, 7.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.495150566101074, -5.3013596534729, -5.107568740844727, -4.913777828216553, -4.719986915588379, -4.526196002960205, -4.332405090332031, -4.138614177703857, -3.9448232650756836, -3.7510323524475098, -3.557241439819336, -3.363450527191162, -3.1696596145629883, -2.9758687019348145, -2.7820777893066406, -2.588286876678467, -2.394496202468872, -2.2007052898406982, -2.0069143772125244, -1.8131234645843506, -1.6193325519561768, -1.425541639328003, -1.2317508459091187, -1.0379599332809448, -0.844169020652771, -0.6503781080245972, -0.4565872251987457, -0.2627963423728943, -0.06900542974472046, 0.12478548288345337, 0.3185763359069824, 0.5123672485351562, 0.7061581611633301, 0.8999490737915039, 1.0937399864196777, 1.2875308990478516, 1.4813218116760254, 1.6751127243041992, 1.8689035177230835, 2.062694549560547, 2.2564854621887207, 2.4502763748168945, 2.6440672874450684, 2.837858200073242, 3.031649112701416, 3.22544002532959, 3.4192309379577637, 3.6130218505859375, 3.8068125247955322, 4.000603199005127, 4.194394111633301, 4.388185024261475, 4.581975936889648, 4.775766849517822, 4.969557762145996, 5.16334867477417, 5.357139587402344, 5.550930500030518, 5.744721412658691, 5.938512325286865, 6.132303237915039, 6.326094150543213, 6.519885063171387, 6.7136759757995605, 6.907466888427734]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 8.0, 29.0, 42.0, 56.0, 80.0, 143.0, 200.0, 350.0, 590.0, 1028.0, 1968.0, 3638.0, 7057.0, 14257.0, 29514.0, 59607.0, 116387.0, 195707.0, 235772.0, 178090.0, 101864.0, 51479.0, 25041.0, 12424.0, 6113.0, 3066.0, 1765.0, 920.0, 517.0, 274.0, 193.0, 122.0, 68.0, 46.0, 34.0, 21.0, 13.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.167724609375, -3.05615234375, -2.944580078125, -2.8330078125, -2.721435546875, -2.60986328125, -2.498291015625, -2.38671875, -2.275146484375, -2.16357421875, -2.052001953125, -1.9404296875, -1.828857421875, -1.71728515625, -1.605712890625, -1.494140625, -1.382568359375, -1.27099609375, -1.159423828125, -1.0478515625, -0.936279296875, -0.82470703125, -0.713134765625, -0.6015625, -0.489990234375, -0.37841796875, -0.266845703125, -0.1552734375, -0.043701171875, 0.06787109375, 0.179443359375, 0.291015625, 0.402587890625, 0.51416015625, 0.625732421875, 0.7373046875, 0.848876953125, 0.96044921875, 1.072021484375, 1.18359375, 1.295166015625, 1.40673828125, 1.518310546875, 1.6298828125, 1.741455078125, 1.85302734375, 1.964599609375, 2.076171875, 2.187744140625, 2.29931640625, 2.410888671875, 2.5224609375, 2.634033203125, 2.74560546875, 2.857177734375, 2.96875, 3.080322265625, 3.19189453125, 3.303466796875, 3.4150390625, 3.526611328125, 3.63818359375, 3.749755859375, 3.861328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 6.0, 8.0, 7.0, 7.0, 11.0, 8.0, 18.0, 30.0, 26.0, 25.0, 47.0, 41.0, 50.0, 52.0, 54.0, 64.0, 52.0, 58.0, 53.0, 62.0, 47.0, 46.0, 33.0, 37.0, 31.0, 22.0, 21.0, 18.0, 13.0, 9.0, 3.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.552734375, -2.471893310546875, -2.39105224609375, -2.310211181640625, -2.2293701171875, -2.148529052734375, -2.06768798828125, -1.986846923828125, -1.906005859375, -1.825164794921875, -1.74432373046875, -1.663482666015625, -1.5826416015625, -1.501800537109375, -1.42095947265625, -1.340118408203125, -1.25927734375, -1.178436279296875, -1.09759521484375, -1.016754150390625, -0.9359130859375, -0.855072021484375, -0.77423095703125, -0.693389892578125, -0.612548828125, -0.531707763671875, -0.45086669921875, -0.370025634765625, -0.2891845703125, -0.208343505859375, -0.12750244140625, -0.046661376953125, 0.0341796875, 0.115020751953125, 0.19586181640625, 0.276702880859375, 0.3575439453125, 0.438385009765625, 0.51922607421875, 0.600067138671875, 0.680908203125, 0.761749267578125, 0.84259033203125, 0.923431396484375, 1.0042724609375, 1.085113525390625, 1.16595458984375, 1.246795654296875, 1.32763671875, 1.408477783203125, 1.48931884765625, 1.570159912109375, 1.6510009765625, 1.731842041015625, 1.81268310546875, 1.893524169921875, 1.974365234375, 2.055206298828125, 2.13604736328125, 2.216888427734375, 2.2977294921875, 2.378570556640625, 2.45941162109375, 2.540252685546875, 2.62109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 3.0, 12.0, 9.0, 10.0, 31.0, 34.0, 55.0, 62.0, 79.0, 137.0, 177.0, 298.0, 479.0, 774.0, 1549.0, 3642.0, 17898.0, 228068.0, 707991.0, 73425.0, 8429.0, 2423.0, 1149.0, 616.0, 387.0, 264.0, 164.0, 126.0, 63.0, 59.0, 38.0, 24.0, 19.0, 15.0, 14.0, 4.0, 7.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0675048828125, -10.689697265625, -10.3118896484375, -9.93408203125, -9.5562744140625, -9.178466796875, -8.8006591796875, -8.4228515625, -8.0450439453125, -7.667236328125, -7.2894287109375, -6.91162109375, -6.5338134765625, -6.156005859375, -5.7781982421875, -5.400390625, -5.0225830078125, -4.644775390625, -4.2669677734375, -3.88916015625, -3.5113525390625, -3.133544921875, -2.7557373046875, -2.3779296875, -2.0001220703125, -1.622314453125, -1.2445068359375, -0.86669921875, -0.4888916015625, -0.111083984375, 0.2667236328125, 0.64453125, 1.0223388671875, 1.400146484375, 1.7779541015625, 2.15576171875, 2.5335693359375, 2.911376953125, 3.2891845703125, 3.6669921875, 4.0447998046875, 4.422607421875, 4.8004150390625, 5.17822265625, 5.5560302734375, 5.933837890625, 6.3116455078125, 6.689453125, 7.0672607421875, 7.445068359375, 7.8228759765625, 8.20068359375, 8.5784912109375, 8.956298828125, 9.3341064453125, 9.7119140625, 10.0897216796875, 10.467529296875, 10.8453369140625, 11.22314453125, 11.6009521484375, 11.978759765625, 12.3565673828125, 12.734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 8.0, 17.0, 20.0, 20.0, 19.0, 30.0, 33.0, 38.0, 37.0, 38.0, 44.0, 54.0, 56.0, 48.0, 58.0, 45.0, 51.0, 38.0, 59.0, 52.0, 25.0, 30.0, 21.0, 25.0, 29.0, 19.0, 19.0, 9.0, 4.0, 12.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.6676025390625, -10.272705078125, -9.8778076171875, -9.48291015625, -9.0880126953125, -8.693115234375, -8.2982177734375, -7.9033203125, -7.5084228515625, -7.113525390625, -6.7186279296875, -6.32373046875, -5.9288330078125, -5.533935546875, -5.1390380859375, -4.744140625, -4.3492431640625, -3.954345703125, -3.5594482421875, -3.16455078125, -2.7696533203125, -2.374755859375, -1.9798583984375, -1.5849609375, -1.1900634765625, -0.795166015625, -0.4002685546875, -0.00537109375, 0.3895263671875, 0.784423828125, 1.1793212890625, 1.57421875, 1.9691162109375, 2.364013671875, 2.7589111328125, 3.15380859375, 3.5487060546875, 3.943603515625, 4.3385009765625, 4.7333984375, 5.1282958984375, 5.523193359375, 5.9180908203125, 6.31298828125, 6.7078857421875, 7.102783203125, 7.4976806640625, 7.892578125, 8.2874755859375, 8.682373046875, 9.0772705078125, 9.47216796875, 9.8670654296875, 10.261962890625, 10.6568603515625, 11.0517578125, 11.4466552734375, 11.841552734375, 12.2364501953125, 12.63134765625, 13.0262451171875, 13.421142578125, 13.8160400390625, 14.2109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 12.0, 13.0, 34.0, 78.0, 168.0, 400.0, 1144.0, 5026.0, 84291.0, 869117.0, 81401.0, 5062.0, 1116.0, 353.0, 154.0, 78.0, 37.0, 30.0, 9.0, 6.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.67840576171875, -8.4193115234375, -8.16021728515625, -7.901123046875, -7.64202880859375, -7.3829345703125, -7.12384033203125, -6.86474609375, -6.60565185546875, -6.3465576171875, -6.08746337890625, -5.828369140625, -5.56927490234375, -5.3101806640625, -5.05108642578125, -4.7919921875, -4.53289794921875, -4.2738037109375, -4.01470947265625, -3.755615234375, -3.49652099609375, -3.2374267578125, -2.97833251953125, -2.71923828125, -2.46014404296875, -2.2010498046875, -1.94195556640625, -1.682861328125, -1.42376708984375, -1.1646728515625, -0.90557861328125, -0.646484375, -0.38739013671875, -0.1282958984375, 0.13079833984375, 0.389892578125, 0.64898681640625, 0.9080810546875, 1.16717529296875, 1.42626953125, 1.68536376953125, 1.9444580078125, 2.20355224609375, 2.462646484375, 2.72174072265625, 2.9808349609375, 3.23992919921875, 3.4990234375, 3.75811767578125, 4.0172119140625, 4.27630615234375, 4.535400390625, 4.79449462890625, 5.0535888671875, 5.31268310546875, 5.57177734375, 5.83087158203125, 6.0899658203125, 6.34906005859375, 6.608154296875, 6.86724853515625, 7.1263427734375, 7.38543701171875, 7.64453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 10.0, 17.0, 13.0, 17.0, 16.0, 30.0, 41.0, 48.0, 47.0, 51.0, 76.0, 62.0, 66.0, 71.0, 66.0, 66.0, 55.0, 32.0, 40.0, 29.0, 35.0, 22.0, 17.0, 14.0, 9.0, 9.0, 5.0, 6.0, 8.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005311965942382812, -0.0005119740962982178, -0.0004927515983581543, -0.0004735291004180908, -0.00045430660247802734, -0.00043508410453796387, -0.0004158616065979004, -0.0003966391086578369, -0.00037741661071777344, -0.00035819411277770996, -0.0003389716148376465, -0.000319749116897583, -0.00030052661895751953, -0.00028130412101745605, -0.0002620816230773926, -0.0002428591251373291, -0.00022363662719726562, -0.00020441412925720215, -0.00018519163131713867, -0.0001659691333770752, -0.00014674663543701172, -0.00012752413749694824, -0.00010830163955688477, -8.907914161682129e-05, -6.985664367675781e-05, -5.0634145736694336e-05, -3.141164779663086e-05, -1.2189149856567383e-05, 7.033348083496094e-06, 2.625584602355957e-05, 4.547834396362305e-05, 6.470084190368652e-05, 8.392333984375e-05, 0.00010314583778381348, 0.00012236833572387695, 0.00014159083366394043, 0.0001608133316040039, 0.00018003582954406738, 0.00019925832748413086, 0.00021848082542419434, 0.0002377033233642578, 0.0002569258213043213, 0.00027614831924438477, 0.00029537081718444824, 0.0003145933151245117, 0.0003338158130645752, 0.00035303831100463867, 0.00037226080894470215, 0.0003914833068847656, 0.0004107058048248291, 0.0004299283027648926, 0.00044915080070495605, 0.00046837329864501953, 0.000487595796585083, 0.0005068182945251465, 0.00052604079246521, 0.0005452632904052734, 0.0005644857883453369, 0.0005837082862854004, 0.0006029307842254639, 0.0006221532821655273, 0.0006413757801055908, 0.0006605982780456543, 0.0006798207759857178, 0.0006990432739257812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 20.0, 21.0, 24.0, 64.0, 116.0, 267.0, 667.0, 2124.0, 11219.0, 274633.0, 724976.0, 29257.0, 3449.0, 997.0, 385.0, 148.0, 74.0, 34.0, 22.0, 18.0, 7.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.08514404296875, -5.8226318359375, -5.56011962890625, -5.297607421875, -5.03509521484375, -4.7725830078125, -4.51007080078125, -4.24755859375, -3.98504638671875, -3.7225341796875, -3.46002197265625, -3.197509765625, -2.93499755859375, -2.6724853515625, -2.40997314453125, -2.1474609375, -1.88494873046875, -1.6224365234375, -1.35992431640625, -1.097412109375, -0.83489990234375, -0.5723876953125, -0.30987548828125, -0.04736328125, 0.21514892578125, 0.4776611328125, 0.74017333984375, 1.002685546875, 1.26519775390625, 1.5277099609375, 1.79022216796875, 2.052734375, 2.31524658203125, 2.5777587890625, 2.84027099609375, 3.102783203125, 3.36529541015625, 3.6278076171875, 3.89031982421875, 4.15283203125, 4.41534423828125, 4.6778564453125, 4.94036865234375, 5.202880859375, 5.46539306640625, 5.7279052734375, 5.99041748046875, 6.2529296875, 6.51544189453125, 6.7779541015625, 7.04046630859375, 7.302978515625, 7.56549072265625, 7.8280029296875, 8.09051513671875, 8.35302734375, 8.61553955078125, 8.8780517578125, 9.14056396484375, 9.403076171875, 9.66558837890625, 9.9281005859375, 10.19061279296875, 10.453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 20.0, 41.0, 63.0, 93.0, 135.0, 135.0, 131.0, 99.0, 96.0, 62.0, 39.0, 26.0, 17.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.92816162109375, -7.7078857421875, -7.48760986328125, -7.267333984375, -7.04705810546875, -6.8267822265625, -6.60650634765625, -6.38623046875, -6.16595458984375, -5.9456787109375, -5.72540283203125, -5.505126953125, -5.28485107421875, -5.0645751953125, -4.84429931640625, -4.6240234375, -4.40374755859375, -4.1834716796875, -3.96319580078125, -3.742919921875, -3.52264404296875, -3.3023681640625, -3.08209228515625, -2.86181640625, -2.64154052734375, -2.4212646484375, -2.20098876953125, -1.980712890625, -1.76043701171875, -1.5401611328125, -1.31988525390625, -1.099609375, -0.87933349609375, -0.6590576171875, -0.43878173828125, -0.218505859375, 0.00177001953125, 0.2220458984375, 0.44232177734375, 0.66259765625, 0.88287353515625, 1.1031494140625, 1.32342529296875, 1.543701171875, 1.76397705078125, 1.9842529296875, 2.20452880859375, 2.4248046875, 2.64508056640625, 2.8653564453125, 3.08563232421875, 3.305908203125, 3.52618408203125, 3.7464599609375, 3.96673583984375, 4.18701171875, 4.40728759765625, 4.6275634765625, 4.84783935546875, 5.068115234375, 5.28839111328125, 5.5086669921875, 5.72894287109375, 5.94921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 13.0, 18.0, 95.0, 258.0, 319.0, 206.0, 67.0, 22.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.9571762084961, -115.7615966796875, -110.5660171508789, -105.37043762207031, -100.17485046386719, -94.97927856445312, -89.78369140625, -84.5881118774414, -79.39253234863281, -74.19695281982422, -69.00137329101562, -63.805789947509766, -58.61021041870117, -53.41463088989258, -48.21904754638672, -43.023468017578125, -37.82788848876953, -32.63230895996094, -27.43672752380371, -22.241146087646484, -17.04556655883789, -11.849987030029297, -6.65440559387207, -1.4588241577148438, 3.73675537109375, 8.93233585357666, 14.12791633605957, 19.323497772216797, 24.51907730102539, 29.714656829833984, 34.910240173339844, 40.10581970214844, 45.3013916015625, 50.496971130371094, 55.69255065917969, 60.88813400268555, 66.08370971679688, 71.279296875, 76.4748764038086, 81.67045593261719, 86.86603546142578, 92.06161499023438, 97.25719451904297, 102.45277404785156, 107.64836120605469, 112.84393310546875, 118.03952026367188, 123.23509979248047, 128.43067932128906, 133.6262664794922, 138.82183837890625, 144.01742553710938, 149.21299743652344, 154.40858459472656, 159.60415649414062, 164.79974365234375, 169.99533081054688, 175.19091796875, 180.38648986816406, 185.5820770263672, 190.77764892578125, 195.97323608398438, 201.16880798339844, 206.36439514160156, 211.55996704101562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 6.0, 9.0, 9.0, 17.0, 23.0, 17.0, 21.0, 20.0, 34.0, 27.0, 36.0, 42.0, 38.0, 40.0, 55.0, 43.0, 49.0, 49.0, 53.0, 67.0, 36.0, 45.0, 35.0, 39.0, 32.0, 24.0, 17.0, 18.0, 16.0, 17.0, 11.0, 13.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.229698181152344, -54.52511978149414, -52.82054138183594, -51.115962982177734, -49.41138458251953, -47.70680618286133, -46.002227783203125, -44.29765319824219, -42.59307098388672, -40.888492584228516, -39.18391418457031, -37.47933578491211, -35.774757385253906, -34.0701789855957, -32.3656005859375, -30.66102409362793, -28.95644760131836, -27.251869201660156, -25.547290802001953, -23.84271240234375, -22.138134002685547, -20.433555603027344, -18.728979110717773, -17.02440071105957, -15.319822311401367, -13.615243911743164, -11.910665512084961, -10.206088066101074, -8.501509666442871, -6.796931266784668, -5.092353820800781, -3.387775421142578, -1.683197021484375, 0.021381139755249023, 1.725959300994873, 3.430537223815918, 5.135115623474121, 6.839694023132324, 8.544271469116211, 10.248849868774414, 11.953428268432617, 13.65800666809082, 15.362585067749023, 17.067161560058594, 18.771739959716797, 20.476318359375, 22.180896759033203, 23.885475158691406, 25.59005355834961, 27.294631958007812, 28.999210357666016, 30.70378875732422, 32.40836715698242, 34.112945556640625, 35.81752014160156, 37.52210235595703, 39.22667694091797, 40.93125534057617, 42.635833740234375, 44.34041213989258, 46.04499053955078, 47.749568939208984, 49.45414733886719, 51.158721923828125, 52.863304138183594]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 16.0, 21.0, 36.0, 35.0, 64.0, 74.0, 95.0, 111.0, 166.0, 340.0, 699.0, 1876.0, 6646.0, 49203.0, 4097653.0, 29279.0, 4956.0, 1446.0, 645.0, 291.0, 138.0, 109.0, 81.0, 88.0, 33.0, 38.0, 28.0, 23.0, 18.0, 11.0, 8.0, 11.0, 2.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.8125, -18.23193359375, -17.6513671875, -17.07080078125, -16.490234375, -15.90966796875, -15.3291015625, -14.74853515625, -14.16796875, -13.58740234375, -13.0068359375, -12.42626953125, -11.845703125, -11.26513671875, -10.6845703125, -10.10400390625, -9.5234375, -8.94287109375, -8.3623046875, -7.78173828125, -7.201171875, -6.62060546875, -6.0400390625, -5.45947265625, -4.87890625, -4.29833984375, -3.7177734375, -3.13720703125, -2.556640625, -1.97607421875, -1.3955078125, -0.81494140625, -0.234375, 0.34619140625, 0.9267578125, 1.50732421875, 2.087890625, 2.66845703125, 3.2490234375, 3.82958984375, 4.41015625, 4.99072265625, 5.5712890625, 6.15185546875, 6.732421875, 7.31298828125, 7.8935546875, 8.47412109375, 9.0546875, 9.63525390625, 10.2158203125, 10.79638671875, 11.376953125, 11.95751953125, 12.5380859375, 13.11865234375, 13.69921875, 14.27978515625, 14.8603515625, 15.44091796875, 16.021484375, 16.60205078125, 17.1826171875, 17.76318359375, 18.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 18.0, 23.0, 17.0, 38.0, 25.0, 41.0, 48.0, 60.0, 63.0, 67.0, 54.0, 75.0, 59.0, 57.0, 45.0, 55.0, 50.0, 34.0, 35.0, 28.0, 16.0, 23.0, 7.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.15625, -3.06396484375, -2.9716796875, -2.87939453125, -2.787109375, -2.69482421875, -2.6025390625, -2.51025390625, -2.41796875, -2.32568359375, -2.2333984375, -2.14111328125, -2.048828125, -1.95654296875, -1.8642578125, -1.77197265625, -1.6796875, -1.58740234375, -1.4951171875, -1.40283203125, -1.310546875, -1.21826171875, -1.1259765625, -1.03369140625, -0.94140625, -0.84912109375, -0.7568359375, -0.66455078125, -0.572265625, -0.47998046875, -0.3876953125, -0.29541015625, -0.203125, -0.11083984375, -0.0185546875, 0.07373046875, 0.166015625, 0.25830078125, 0.3505859375, 0.44287109375, 0.53515625, 0.62744140625, 0.7197265625, 0.81201171875, 0.904296875, 0.99658203125, 1.0888671875, 1.18115234375, 1.2734375, 1.36572265625, 1.4580078125, 1.55029296875, 1.642578125, 1.73486328125, 1.8271484375, 1.91943359375, 2.01171875, 2.10400390625, 2.1962890625, 2.28857421875, 2.380859375, 2.47314453125, 2.5654296875, 2.65771484375, 2.75]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 11.0, 16.0, 16.0, 35.0, 38.0, 58.0, 71.0, 127.0, 175.0, 282.0, 524.0, 1433.0, 5554.0, 48256.0, 4087979.0, 41639.0, 5240.0, 1316.0, 580.0, 284.0, 197.0, 130.0, 93.0, 59.0, 42.0, 29.0, 16.0, 15.0, 13.0, 5.0, 6.0, 3.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.4375, -17.83251953125, -17.2275390625, -16.62255859375, -16.017578125, -15.41259765625, -14.8076171875, -14.20263671875, -13.59765625, -12.99267578125, -12.3876953125, -11.78271484375, -11.177734375, -10.57275390625, -9.9677734375, -9.36279296875, -8.7578125, -8.15283203125, -7.5478515625, -6.94287109375, -6.337890625, -5.73291015625, -5.1279296875, -4.52294921875, -3.91796875, -3.31298828125, -2.7080078125, -2.10302734375, -1.498046875, -0.89306640625, -0.2880859375, 0.31689453125, 0.921875, 1.52685546875, 2.1318359375, 2.73681640625, 3.341796875, 3.94677734375, 4.5517578125, 5.15673828125, 5.76171875, 6.36669921875, 6.9716796875, 7.57666015625, 8.181640625, 8.78662109375, 9.3916015625, 9.99658203125, 10.6015625, 11.20654296875, 11.8115234375, 12.41650390625, 13.021484375, 13.62646484375, 14.2314453125, 14.83642578125, 15.44140625, 16.04638671875, 16.6513671875, 17.25634765625, 17.861328125, 18.46630859375, 19.0712890625, 19.67626953125, 20.28125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 15.0, 24.0, 38.0, 85.0, 526.0, 3173.0, 99.0, 52.0, 14.0, 15.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8443145751953125, -1.736480712890625, -1.6286468505859375, -1.52081298828125, -1.4129791259765625, -1.305145263671875, -1.1973114013671875, -1.0894775390625, -0.9816436767578125, -0.873809814453125, -0.7659759521484375, -0.65814208984375, -0.5503082275390625, -0.442474365234375, -0.3346405029296875, -0.226806640625, -0.1189727783203125, -0.011138916015625, 0.0966949462890625, 0.20452880859375, 0.3123626708984375, 0.420196533203125, 0.5280303955078125, 0.6358642578125, 0.7436981201171875, 0.851531982421875, 0.9593658447265625, 1.06719970703125, 1.1750335693359375, 1.282867431640625, 1.3907012939453125, 1.49853515625, 1.6063690185546875, 1.714202880859375, 1.8220367431640625, 1.92987060546875, 2.0377044677734375, 2.145538330078125, 2.2533721923828125, 2.3612060546875, 2.4690399169921875, 2.576873779296875, 2.6847076416015625, 2.79254150390625, 2.9003753662109375, 3.008209228515625, 3.1160430908203125, 3.223876953125, 3.3317108154296875, 3.439544677734375, 3.5473785400390625, 3.65521240234375, 3.7630462646484375, 3.870880126953125, 3.9787139892578125, 4.0865478515625, 4.1943817138671875, 4.302215576171875, 4.4100494384765625, 4.51788330078125, 4.6257171630859375, 4.733551025390625, 4.8413848876953125, 4.94921875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 7.0, 30.0, 33.0, 36.0, 54.0, 75.0, 83.0, 113.0, 108.0, 79.0, 87.0, 65.0, 54.0, 40.0, 29.0, 23.0, 19.0, 10.0, 6.0, 3.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.107322692871094, -9.82966136932373, -9.55199909210205, -9.274337768554688, -8.996676445007324, -8.719014167785645, -8.441352844238281, -8.163691520690918, -7.886029243469238, -7.608367443084717, -7.3307061195373535, -7.053044319152832, -6.7753825187683105, -6.497720718383789, -6.220059394836426, -5.942397594451904, -5.664736270904541, -5.3870744705200195, -5.109413146972656, -4.831751346588135, -4.554089546203613, -4.27642822265625, -3.9987664222717285, -3.721104621887207, -3.4434430599212646, -3.1657814979553223, -2.888119697570801, -2.6104581356048584, -2.332796573638916, -2.0551347732543945, -1.7774732112884521, -1.4998115301132202, -1.22214937210083, -0.9444876909255981, -0.666826069355011, -0.38916444778442383, -0.1115027666091919, 0.16615891456604004, 0.4438204765319824, 0.7214821577072144, 0.9991438388824463, 1.2768055200576782, 1.5544672012329102, 1.8321287631988525, 2.109790325164795, 2.3874521255493164, 2.665113687515259, 2.942775249481201, 3.2204370498657227, 3.498098611831665, 3.7757604122161865, 4.053421974182129, 4.33108377456665, 4.608745574951172, 4.886406898498535, 5.164068698883057, 5.441730499267578, 5.7193922996521, 5.997053623199463, 6.274715423583984, 6.552377223968506, 6.830039024353027, 7.107700347900391, 7.385362148284912, 7.663023471832275]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 2.0, 10.0, 11.0, 12.0, 19.0, 15.0, 17.0, 18.0, 27.0, 18.0, 19.0, 30.0, 29.0, 33.0, 43.0, 45.0, 38.0, 37.0, 42.0, 39.0, 41.0, 38.0, 43.0, 40.0, 32.0, 37.0, 31.0, 29.0, 24.0, 28.0, 16.0, 17.0, 22.0, 16.0, 12.0, 9.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.144894123077393, -4.985811710357666, -4.8267292976379395, -4.667646408081055, -4.508563995361328, -4.349481582641602, -4.190399169921875, -4.031316757202148, -3.8722341060638428, -3.713151693344116, -3.5540690422058105, -3.394986629486084, -3.2359042167663574, -3.0768215656280518, -2.917739152908325, -2.7586565017700195, -2.599574089050293, -2.4404916763305664, -2.2814090251922607, -2.122326612472534, -1.963244080543518, -1.804161548614502, -1.6450791358947754, -1.4859966039657593, -1.3269140720367432, -1.167831540107727, -1.008749008178711, -0.8496665954589844, -0.6905840635299683, -0.5315015316009521, -0.3724190592765808, -0.21333658695220947, -0.054253578186035156, 0.10482892394065857, 0.2639114260673523, 0.422993928194046, 0.5820764303207397, 0.7411589622497559, 0.9002414345741272, 1.0593239068984985, 1.2184064388275146, 1.3774889707565308, 1.5365715026855469, 1.6956539154052734, 1.8547364473342896, 2.0138189792633057, 2.1729013919830322, 2.331984043121338, 2.4910664558410645, 2.650148868560791, 2.8092315196990967, 2.9683139324188232, 3.127396583557129, 3.2864789962768555, 3.445561408996582, 3.6046438217163086, 3.7637264728546143, 3.922808885574341, 4.0818915367126465, 4.240973949432373, 4.4000563621521, 4.559139251708984, 4.718221664428711, 4.8773040771484375, 5.036386489868164]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 11.0, 16.0, 33.0, 39.0, 66.0, 159.0, 234.0, 376.0, 677.0, 1376.0, 2826.0, 6547.0, 17018.0, 48810.0, 144522.0, 368967.0, 294414.0, 104473.0, 35726.0, 12553.0, 5117.0, 2139.0, 1068.0, 587.0, 306.0, 197.0, 106.0, 61.0, 44.0, 22.0, 16.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.09375, -5.92376708984375, -5.7537841796875, -5.58380126953125, -5.413818359375, -5.24383544921875, -5.0738525390625, -4.90386962890625, -4.73388671875, -4.56390380859375, -4.3939208984375, -4.22393798828125, -4.053955078125, -3.88397216796875, -3.7139892578125, -3.54400634765625, -3.3740234375, -3.20404052734375, -3.0340576171875, -2.86407470703125, -2.694091796875, -2.52410888671875, -2.3541259765625, -2.18414306640625, -2.01416015625, -1.84417724609375, -1.6741943359375, -1.50421142578125, -1.334228515625, -1.16424560546875, -0.9942626953125, -0.82427978515625, -0.654296875, -0.48431396484375, -0.3143310546875, -0.14434814453125, 0.025634765625, 0.19561767578125, 0.3656005859375, 0.53558349609375, 0.70556640625, 0.87554931640625, 1.0455322265625, 1.21551513671875, 1.385498046875, 1.55548095703125, 1.7254638671875, 1.89544677734375, 2.0654296875, 2.23541259765625, 2.4053955078125, 2.57537841796875, 2.745361328125, 2.91534423828125, 3.0853271484375, 3.25531005859375, 3.42529296875, 3.59527587890625, 3.7652587890625, 3.93524169921875, 4.105224609375, 4.27520751953125, 4.4451904296875, 4.61517333984375, 4.78515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 6.0, 15.0, 5.0, 31.0, 26.0, 30.0, 37.0, 45.0, 49.0, 61.0, 61.0, 74.0, 63.0, 67.0, 63.0, 58.0, 50.0, 49.0, 33.0, 35.0, 41.0, 19.0, 23.0, 8.0, 12.0, 11.0, 3.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.953125, -3.848724365234375, -3.74432373046875, -3.639923095703125, -3.5355224609375, -3.431121826171875, -3.32672119140625, -3.222320556640625, -3.117919921875, -3.013519287109375, -2.90911865234375, -2.804718017578125, -2.7003173828125, -2.595916748046875, -2.49151611328125, -2.387115478515625, -2.28271484375, -2.178314208984375, -2.07391357421875, -1.969512939453125, -1.8651123046875, -1.760711669921875, -1.65631103515625, -1.551910400390625, -1.447509765625, -1.343109130859375, -1.23870849609375, -1.134307861328125, -1.0299072265625, -0.925506591796875, -0.82110595703125, -0.716705322265625, -0.6123046875, -0.507904052734375, -0.40350341796875, -0.299102783203125, -0.1947021484375, -0.090301513671875, 0.01409912109375, 0.118499755859375, 0.222900390625, 0.327301025390625, 0.43170166015625, 0.536102294921875, 0.6405029296875, 0.744903564453125, 0.84930419921875, 0.953704833984375, 1.05810546875, 1.162506103515625, 1.26690673828125, 1.371307373046875, 1.4757080078125, 1.580108642578125, 1.68450927734375, 1.788909912109375, 1.893310546875, 1.997711181640625, 2.10211181640625, 2.206512451171875, 2.3109130859375, 2.415313720703125, 2.51971435546875, 2.624114990234375, 2.728515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 18.0, 18.0, 15.0, 29.0, 41.0, 55.0, 71.0, 99.0, 143.0, 206.0, 267.0, 388.0, 579.0, 927.0, 1618.0, 3942.0, 16831.0, 136294.0, 717344.0, 143325.0, 17595.0, 4152.0, 1762.0, 930.0, 590.0, 371.0, 271.0, 181.0, 110.0, 91.0, 76.0, 60.0, 36.0, 20.0, 24.0, 10.0, 16.0, 12.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.515869140625, -7.24267578125, -6.969482421875, -6.6962890625, -6.423095703125, -6.14990234375, -5.876708984375, -5.603515625, -5.330322265625, -5.05712890625, -4.783935546875, -4.5107421875, -4.237548828125, -3.96435546875, -3.691162109375, -3.41796875, -3.144775390625, -2.87158203125, -2.598388671875, -2.3251953125, -2.052001953125, -1.77880859375, -1.505615234375, -1.232421875, -0.959228515625, -0.68603515625, -0.412841796875, -0.1396484375, 0.133544921875, 0.40673828125, 0.679931640625, 0.953125, 1.226318359375, 1.49951171875, 1.772705078125, 2.0458984375, 2.319091796875, 2.59228515625, 2.865478515625, 3.138671875, 3.411865234375, 3.68505859375, 3.958251953125, 4.2314453125, 4.504638671875, 4.77783203125, 5.051025390625, 5.32421875, 5.597412109375, 5.87060546875, 6.143798828125, 6.4169921875, 6.690185546875, 6.96337890625, 7.236572265625, 7.509765625, 7.782958984375, 8.05615234375, 8.329345703125, 8.6025390625, 8.875732421875, 9.14892578125, 9.422119140625, 9.6953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 13.0, 15.0, 13.0, 18.0, 16.0, 15.0, 30.0, 28.0, 30.0, 35.0, 32.0, 34.0, 37.0, 47.0, 36.0, 40.0, 33.0, 43.0, 38.0, 41.0, 36.0, 36.0, 38.0, 27.0, 35.0, 30.0, 22.0, 24.0, 13.0, 18.0, 14.0, 16.0, 14.0, 15.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.78125, -10.46484375, -10.1484375, -9.83203125, -9.515625, -9.19921875, -8.8828125, -8.56640625, -8.25, -7.93359375, -7.6171875, -7.30078125, -6.984375, -6.66796875, -6.3515625, -6.03515625, -5.71875, -5.40234375, -5.0859375, -4.76953125, -4.453125, -4.13671875, -3.8203125, -3.50390625, -3.1875, -2.87109375, -2.5546875, -2.23828125, -1.921875, -1.60546875, -1.2890625, -0.97265625, -0.65625, -0.33984375, -0.0234375, 0.29296875, 0.609375, 0.92578125, 1.2421875, 1.55859375, 1.875, 2.19140625, 2.5078125, 2.82421875, 3.140625, 3.45703125, 3.7734375, 4.08984375, 4.40625, 4.72265625, 5.0390625, 5.35546875, 5.671875, 5.98828125, 6.3046875, 6.62109375, 6.9375, 7.25390625, 7.5703125, 7.88671875, 8.203125, 8.51953125, 8.8359375, 9.15234375, 9.46875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 11.0, 6.0, 22.0, 18.0, 34.0, 73.0, 104.0, 236.0, 461.0, 1294.0, 5228.0, 59021.0, 898215.0, 75406.0, 6000.0, 1457.0, 451.0, 213.0, 115.0, 76.0, 42.0, 21.0, 11.0, 9.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.8125, -9.557861328125, -9.30322265625, -9.048583984375, -8.7939453125, -8.539306640625, -8.28466796875, -8.030029296875, -7.775390625, -7.520751953125, -7.26611328125, -7.011474609375, -6.7568359375, -6.502197265625, -6.24755859375, -5.992919921875, -5.73828125, -5.483642578125, -5.22900390625, -4.974365234375, -4.7197265625, -4.465087890625, -4.21044921875, -3.955810546875, -3.701171875, -3.446533203125, -3.19189453125, -2.937255859375, -2.6826171875, -2.427978515625, -2.17333984375, -1.918701171875, -1.6640625, -1.409423828125, -1.15478515625, -0.900146484375, -0.6455078125, -0.390869140625, -0.13623046875, 0.118408203125, 0.373046875, 0.627685546875, 0.88232421875, 1.136962890625, 1.3916015625, 1.646240234375, 1.90087890625, 2.155517578125, 2.41015625, 2.664794921875, 2.91943359375, 3.174072265625, 3.4287109375, 3.683349609375, 3.93798828125, 4.192626953125, 4.447265625, 4.701904296875, 4.95654296875, 5.211181640625, 5.4658203125, 5.720458984375, 5.97509765625, 6.229736328125, 6.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 15.0, 15.0, 17.0, 28.0, 39.0, 47.0, 60.0, 88.0, 107.0, 120.0, 95.0, 91.0, 65.0, 43.0, 35.0, 32.0, 21.0, 17.0, 19.0, 9.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005316734313964844, -0.0005080774426460266, -0.00048448145389556885, -0.0004608854651451111, -0.0004372894763946533, -0.00041369348764419556, -0.0003900974988937378, -0.00036650151014328003, -0.00034290552139282227, -0.0003193095326423645, -0.00029571354389190674, -0.000272117555141449, -0.0002485215663909912, -0.00022492557764053345, -0.00020132958889007568, -0.00017773360013961792, -0.00015413761138916016, -0.0001305416226387024, -0.00010694563388824463, -8.334964513778687e-05, -5.97536563873291e-05, -3.615766763687134e-05, -1.2561678886413574e-05, 1.103430986404419e-05, 3.463029861450195e-05, 5.822628736495972e-05, 8.182227611541748e-05, 0.00010541826486587524, 0.000129014253616333, 0.00015261024236679077, 0.00017620623111724854, 0.0001998022198677063, 0.00022339820861816406, 0.0002469941973686218, 0.0002705901861190796, 0.00029418617486953735, 0.0003177821636199951, 0.0003413781523704529, 0.00036497414112091064, 0.0003885701298713684, 0.00041216611862182617, 0.00043576210737228394, 0.0004593580961227417, 0.00048295408487319946, 0.0005065500736236572, 0.000530146062374115, 0.0005537420511245728, 0.0005773380398750305, 0.0006009340286254883, 0.000624530017375946, 0.0006481260061264038, 0.0006717219948768616, 0.0006953179836273193, 0.0007189139723777771, 0.0007425099611282349, 0.0007661059498786926, 0.0007897019386291504, 0.0008132979273796082, 0.0008368939161300659, 0.0008604899048805237, 0.0008840858936309814, 0.0009076818823814392, 0.000931277871131897, 0.0009548738598823547, 0.0009784698486328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 13.0, 9.0, 6.0, 13.0, 21.0, 35.0, 29.0, 44.0, 71.0, 102.0, 156.0, 236.0, 414.0, 711.0, 1387.0, 3028.0, 8404.0, 36805.0, 274599.0, 609525.0, 88228.0, 15769.0, 4611.0, 1873.0, 963.0, 562.0, 317.0, 181.0, 129.0, 89.0, 57.0, 38.0, 34.0, 19.0, 16.0, 10.0, 6.0, 7.0, 4.0, 3.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.3203125, -4.186279296875, -4.05224609375, -3.918212890625, -3.7841796875, -3.650146484375, -3.51611328125, -3.382080078125, -3.248046875, -3.114013671875, -2.97998046875, -2.845947265625, -2.7119140625, -2.577880859375, -2.44384765625, -2.309814453125, -2.17578125, -2.041748046875, -1.90771484375, -1.773681640625, -1.6396484375, -1.505615234375, -1.37158203125, -1.237548828125, -1.103515625, -0.969482421875, -0.83544921875, -0.701416015625, -0.5673828125, -0.433349609375, -0.29931640625, -0.165283203125, -0.03125, 0.102783203125, 0.23681640625, 0.370849609375, 0.5048828125, 0.638916015625, 0.77294921875, 0.906982421875, 1.041015625, 1.175048828125, 1.30908203125, 1.443115234375, 1.5771484375, 1.711181640625, 1.84521484375, 1.979248046875, 2.11328125, 2.247314453125, 2.38134765625, 2.515380859375, 2.6494140625, 2.783447265625, 2.91748046875, 3.051513671875, 3.185546875, 3.319580078125, 3.45361328125, 3.587646484375, 3.7216796875, 3.855712890625, 3.98974609375, 4.123779296875, 4.2578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 14.0, 10.0, 26.0, 54.0, 49.0, 68.0, 64.0, 106.0, 98.0, 90.0, 90.0, 84.0, 72.0, 63.0, 18.0, 17.0, 9.0, 9.0, 9.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.8720703125, -5.712890625, -5.5537109375, -5.39453125, -5.2353515625, -5.076171875, -4.9169921875, -4.7578125, -4.5986328125, -4.439453125, -4.2802734375, -4.12109375, -3.9619140625, -3.802734375, -3.6435546875, -3.484375, -3.3251953125, -3.166015625, -3.0068359375, -2.84765625, -2.6884765625, -2.529296875, -2.3701171875, -2.2109375, -2.0517578125, -1.892578125, -1.7333984375, -1.57421875, -1.4150390625, -1.255859375, -1.0966796875, -0.9375, -0.7783203125, -0.619140625, -0.4599609375, -0.30078125, -0.1416015625, 0.017578125, 0.1767578125, 0.3359375, 0.4951171875, 0.654296875, 0.8134765625, 0.97265625, 1.1318359375, 1.291015625, 1.4501953125, 1.609375, 1.7685546875, 1.927734375, 2.0869140625, 2.24609375, 2.4052734375, 2.564453125, 2.7236328125, 2.8828125, 3.0419921875, 3.201171875, 3.3603515625, 3.51953125, 3.6787109375, 3.837890625, 3.9970703125, 4.15625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 19.0, 106.0, 339.0, 342.0, 137.0, 38.0, 12.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.54248046875, -155.76971435546875, -149.99693298339844, -144.2241668701172, -138.45138549804688, -132.67861938476562, -126.90584564208984, -121.13307189941406, -115.36029815673828, -109.5875244140625, -103.81475067138672, -98.04197692871094, -92.26921081542969, -86.49642944335938, -80.72366333007812, -74.95088958740234, -69.17811584472656, -63.40534210205078, -57.632568359375, -51.859798431396484, -46.0870246887207, -40.31425094604492, -34.541481018066406, -28.768707275390625, -22.995933532714844, -17.223159790039062, -11.450387954711914, -5.677616119384766, 0.09515762329101562, 5.867931365966797, 11.640701293945312, 17.413475036621094, 23.186248779296875, 28.959022521972656, 34.73179626464844, 40.50456619262695, 46.277339935302734, 52.050113677978516, 57.82288360595703, 63.59565734863281, 69.3684310913086, 75.14120483398438, 80.91397857666016, 86.68675231933594, 92.45951843261719, 98.2322998046875, 104.00506591796875, 109.77783966064453, 115.55061340332031, 121.3233871459961, 127.09616088867188, 132.86892700195312, 138.64170837402344, 144.4144744873047, 150.187255859375, 155.96002197265625, 161.7327880859375, 167.50555419921875, 173.27833557128906, 179.0511016845703, 184.82388305664062, 190.59664916992188, 196.36941528320312, 202.14219665527344, 207.91497802734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 13.0, 7.0, 10.0, 12.0, 17.0, 31.0, 25.0, 34.0, 29.0, 34.0, 42.0, 37.0, 49.0, 53.0, 55.0, 52.0, 57.0, 54.0, 59.0, 49.0, 31.0, 37.0, 34.0, 26.0, 32.0, 21.0, 19.0, 14.0, 16.0, 7.0, 10.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-64.94923400878906, -63.23587417602539, -61.522518157958984, -59.80915832519531, -58.095802307128906, -56.382442474365234, -54.66908264160156, -52.955726623535156, -51.242366790771484, -49.52900695800781, -47.815650939941406, -46.102291107177734, -44.38893508911133, -42.675575256347656, -40.96221923828125, -39.24885940551758, -37.535499572753906, -35.822139739990234, -34.10878372192383, -32.395423889160156, -30.682065963745117, -28.968708038330078, -27.25535011291504, -25.5419921875, -23.828636169433594, -22.115278244018555, -20.401920318603516, -18.688560485839844, -16.975202560424805, -15.261844635009766, -13.548486709594727, -11.835127830505371, -10.121768951416016, -8.408411026000977, -6.695052146911621, -4.981694221496582, -3.2683358192443848, -1.5549774169921875, 0.15838050842285156, 1.871739387512207, 3.585097312927246, 5.298455715179443, 7.011814117431641, 8.72517204284668, 10.438529968261719, 12.151888847351074, 13.865246772766113, 15.578605651855469, 17.291963577270508, 19.005321502685547, 20.718679428100586, 22.432037353515625, 24.145397186279297, 25.858755111694336, 27.572113037109375, 29.285472869873047, 30.998828887939453, 32.712188720703125, 34.42554473876953, 36.1389045715332, 37.85226058959961, 39.56562042236328, 41.27897644042969, 42.99233627319336, 44.70569610595703]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 14.0, 19.0, 19.0, 25.0, 38.0, 49.0, 79.0, 84.0, 188.0, 289.0, 547.0, 1215.0, 3433.0, 14126.0, 177643.0, 3953466.0, 33324.0, 6027.0, 1876.0, 809.0, 370.0, 202.0, 124.0, 82.0, 61.0, 42.0, 39.0, 25.0, 14.0, 14.0, 9.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.3203125, -14.8726806640625, -14.425048828125, -13.9774169921875, -13.52978515625, -13.0821533203125, -12.634521484375, -12.1868896484375, -11.7392578125, -11.2916259765625, -10.843994140625, -10.3963623046875, -9.94873046875, -9.5010986328125, -9.053466796875, -8.6058349609375, -8.158203125, -7.7105712890625, -7.262939453125, -6.8153076171875, -6.36767578125, -5.9200439453125, -5.472412109375, -5.0247802734375, -4.5771484375, -4.1295166015625, -3.681884765625, -3.2342529296875, -2.78662109375, -2.3389892578125, -1.891357421875, -1.4437255859375, -0.99609375, -0.5484619140625, -0.100830078125, 0.3468017578125, 0.79443359375, 1.2420654296875, 1.689697265625, 2.1373291015625, 2.5849609375, 3.0325927734375, 3.480224609375, 3.9278564453125, 4.37548828125, 4.8231201171875, 5.270751953125, 5.7183837890625, 6.166015625, 6.6136474609375, 7.061279296875, 7.5089111328125, 7.95654296875, 8.4041748046875, 8.851806640625, 9.2994384765625, 9.7470703125, 10.1947021484375, 10.642333984375, 11.0899658203125, 11.53759765625, 11.9852294921875, 12.432861328125, 12.8804931640625, 13.328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 6.0, 13.0, 17.0, 18.0, 32.0, 28.0, 29.0, 46.0, 43.0, 71.0, 57.0, 56.0, 59.0, 64.0, 68.0, 57.0, 50.0, 37.0, 45.0, 40.0, 35.0, 31.0, 25.0, 17.0, 16.0, 8.0, 4.0, 11.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.548828125, -3.455780029296875, -3.36273193359375, -3.269683837890625, -3.1766357421875, -3.083587646484375, -2.99053955078125, -2.897491455078125, -2.804443359375, -2.711395263671875, -2.61834716796875, -2.525299072265625, -2.4322509765625, -2.339202880859375, -2.24615478515625, -2.153106689453125, -2.06005859375, -1.967010498046875, -1.87396240234375, -1.780914306640625, -1.6878662109375, -1.594818115234375, -1.50177001953125, -1.408721923828125, -1.315673828125, -1.222625732421875, -1.12957763671875, -1.036529541015625, -0.9434814453125, -0.850433349609375, -0.75738525390625, -0.664337158203125, -0.5712890625, -0.478240966796875, -0.38519287109375, -0.292144775390625, -0.1990966796875, -0.106048583984375, -0.01300048828125, 0.080047607421875, 0.173095703125, 0.266143798828125, 0.35919189453125, 0.452239990234375, 0.5452880859375, 0.638336181640625, 0.73138427734375, 0.824432373046875, 0.91748046875, 1.010528564453125, 1.10357666015625, 1.196624755859375, 1.2896728515625, 1.382720947265625, 1.47576904296875, 1.568817138671875, 1.661865234375, 1.754913330078125, 1.84796142578125, 1.941009521484375, 2.0340576171875, 2.127105712890625, 2.22015380859375, 2.313201904296875, 2.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 12.0, 14.0, 14.0, 21.0, 23.0, 27.0, 55.0, 79.0, 96.0, 169.0, 214.0, 427.0, 793.0, 1702.0, 4541.0, 16407.0, 135545.0, 3925303.0, 88555.0, 13085.0, 3889.0, 1510.0, 699.0, 390.0, 219.0, 149.0, 115.0, 63.0, 41.0, 28.0, 23.0, 19.0, 14.0, 12.0, 12.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.625, -11.2664794921875, -10.907958984375, -10.5494384765625, -10.19091796875, -9.8323974609375, -9.473876953125, -9.1153564453125, -8.7568359375, -8.3983154296875, -8.039794921875, -7.6812744140625, -7.32275390625, -6.9642333984375, -6.605712890625, -6.2471923828125, -5.888671875, -5.5301513671875, -5.171630859375, -4.8131103515625, -4.45458984375, -4.0960693359375, -3.737548828125, -3.3790283203125, -3.0205078125, -2.6619873046875, -2.303466796875, -1.9449462890625, -1.58642578125, -1.2279052734375, -0.869384765625, -0.5108642578125, -0.15234375, 0.2061767578125, 0.564697265625, 0.9232177734375, 1.28173828125, 1.6402587890625, 1.998779296875, 2.3572998046875, 2.7158203125, 3.0743408203125, 3.432861328125, 3.7913818359375, 4.14990234375, 4.5084228515625, 4.866943359375, 5.2254638671875, 5.583984375, 5.9425048828125, 6.301025390625, 6.6595458984375, 7.01806640625, 7.3765869140625, 7.735107421875, 8.0936279296875, 8.4521484375, 8.8106689453125, 9.169189453125, 9.5277099609375, 9.88623046875, 10.2447509765625, 10.603271484375, 10.9617919921875, 11.3203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 28.0, 33.0, 75.0, 153.0, 1025.0, 2402.0, 184.0, 66.0, 37.0, 22.0, 9.0, 10.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.26788330078125, -5.0865478515625, -4.90521240234375, -4.723876953125, -4.54254150390625, -4.3612060546875, -4.17987060546875, -3.99853515625, -3.81719970703125, -3.6358642578125, -3.45452880859375, -3.273193359375, -3.09185791015625, -2.9105224609375, -2.72918701171875, -2.5478515625, -2.36651611328125, -2.1851806640625, -2.00384521484375, -1.822509765625, -1.64117431640625, -1.4598388671875, -1.27850341796875, -1.09716796875, -0.91583251953125, -0.7344970703125, -0.55316162109375, -0.371826171875, -0.19049072265625, -0.0091552734375, 0.17218017578125, 0.353515625, 0.53485107421875, 0.7161865234375, 0.89752197265625, 1.078857421875, 1.26019287109375, 1.4415283203125, 1.62286376953125, 1.80419921875, 1.98553466796875, 2.1668701171875, 2.34820556640625, 2.529541015625, 2.71087646484375, 2.8922119140625, 3.07354736328125, 3.2548828125, 3.43621826171875, 3.6175537109375, 3.79888916015625, 3.980224609375, 4.16156005859375, 4.3428955078125, 4.52423095703125, 4.70556640625, 4.88690185546875, 5.0682373046875, 5.24957275390625, 5.430908203125, 5.61224365234375, 5.7935791015625, 5.97491455078125, 6.15625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 17.0, 9.0, 16.0, 20.0, 39.0, 45.0, 54.0, 65.0, 85.0, 74.0, 97.0, 93.0, 90.0, 69.0, 45.0, 48.0, 31.0, 21.0, 10.0, 2.0, 7.0, 4.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.569573402404785, -10.201430320739746, -9.833288192749023, -9.465145111083984, -9.097002029418945, -8.728859901428223, -8.360716819763184, -7.992574214935303, -7.624431610107422, -7.256289005279541, -6.888145923614502, -6.520003318786621, -6.15186071395874, -5.783718109130859, -5.41557502746582, -5.0474324226379395, -4.6792893409729, -4.3111467361450195, -3.9430038928985596, -3.5748610496520996, -3.2067184448242188, -2.838575601577759, -2.470432758331299, -2.102290153503418, -1.734147310256958, -1.3660045862197876, -0.9978618025779724, -0.6297190189361572, -0.2615762948989868, 0.1065664291381836, 0.47470927238464355, 0.8428518772125244, 1.2109947204589844, 1.5791374444961548, 1.9472801685333252, 2.315423011779785, 2.683565616607666, 3.051708459854126, 3.419851303100586, 3.787993907928467, 4.156136512756348, 4.5242791175842285, 4.892422199249268, 5.260564804077148, 5.628707408905029, 5.99685001373291, 6.364993095397949, 6.73313570022583, 7.101278781890869, 7.46942138671875, 7.837564468383789, 8.205707550048828, 8.57384967803955, 8.94199275970459, 9.310134887695312, 9.678277969360352, 10.04642105102539, 10.41456413269043, 10.782706260681152, 11.150849342346191, 11.51899242401123, 11.887134552001953, 12.255277633666992, 12.623420715332031, 12.991562843322754]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 2.0, 7.0, 12.0, 10.0, 14.0, 17.0, 12.0, 31.0, 18.0, 31.0, 22.0, 24.0, 30.0, 35.0, 36.0, 32.0, 39.0, 44.0, 32.0, 38.0, 36.0, 46.0, 46.0, 40.0, 29.0, 23.0, 33.0, 25.0, 28.0, 26.0, 17.0, 20.0, 18.0, 26.0, 17.0, 13.0, 4.0, 11.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-10.026663780212402, -9.740232467651367, -9.453801155090332, -9.167369842529297, -8.880938529968262, -8.594507217407227, -8.308075904846191, -8.021644592285156, -7.735213756561279, -7.448782444000244, -7.162351131439209, -6.875919818878174, -6.589488983154297, -6.303057670593262, -6.016626358032227, -5.730195045471191, -5.443763732910156, -5.157332420349121, -4.870901107788086, -4.584469795227051, -4.298038482666016, -4.0116071701049805, -3.7251763343811035, -3.4387450218200684, -3.152313709259033, -2.865882396697998, -2.579451084136963, -2.293020009994507, -2.0065886974334717, -1.7201573848724365, -1.433726191520691, -1.1472949981689453, -0.8608627319335938, -0.5744314789772034, -0.288000226020813, -0.0015689730644226074, 0.2848622798919678, 0.5712935924530029, 0.8577247858047485, 1.1441559791564941, 1.4305872917175293, 1.7170186042785645, 2.0034499168395996, 2.2898809909820557, 2.576312303543091, 2.862743616104126, 3.149174690246582, 3.435606002807617, 3.7220373153686523, 4.0084686279296875, 4.294899940490723, 4.581331253051758, 4.867762565612793, 5.154193878173828, 5.440624713897705, 5.72705602645874, 6.013487339019775, 6.2999186515808105, 6.586349964141846, 6.872781276702881, 7.159212112426758, 7.445643424987793, 7.732074737548828, 8.018506050109863, 8.304937362670898]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 13.0, 11.0, 16.0, 24.0, 29.0, 35.0, 53.0, 87.0, 107.0, 157.0, 267.0, 383.0, 648.0, 1114.0, 2193.0, 4545.0, 10869.0, 28020.0, 75785.0, 213372.0, 429625.0, 175640.0, 64363.0, 23455.0, 9074.0, 3993.0, 1942.0, 1042.0, 629.0, 319.0, 217.0, 149.0, 110.0, 73.0, 59.0, 33.0, 27.0, 21.0, 17.0, 14.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -6.0029296875, -5.798828125, -5.5947265625, -5.390625, -5.1865234375, -4.982421875, -4.7783203125, -4.57421875, -4.3701171875, -4.166015625, -3.9619140625, -3.7578125, -3.5537109375, -3.349609375, -3.1455078125, -2.94140625, -2.7373046875, -2.533203125, -2.3291015625, -2.125, -1.9208984375, -1.716796875, -1.5126953125, -1.30859375, -1.1044921875, -0.900390625, -0.6962890625, -0.4921875, -0.2880859375, -0.083984375, 0.1201171875, 0.32421875, 0.5283203125, 0.732421875, 0.9365234375, 1.140625, 1.3447265625, 1.548828125, 1.7529296875, 1.95703125, 2.1611328125, 2.365234375, 2.5693359375, 2.7734375, 2.9775390625, 3.181640625, 3.3857421875, 3.58984375, 3.7939453125, 3.998046875, 4.2021484375, 4.40625, 4.6103515625, 4.814453125, 5.0185546875, 5.22265625, 5.4267578125, 5.630859375, 5.8349609375, 6.0390625, 6.2431640625, 6.447265625, 6.6513671875, 6.85546875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 14.0, 13.0, 24.0, 24.0, 31.0, 44.0, 37.0, 48.0, 57.0, 62.0, 68.0, 66.0, 65.0, 53.0, 56.0, 39.0, 46.0, 33.0, 47.0, 31.0, 18.0, 20.0, 23.0, 10.0, 12.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.744140625, -3.64990234375, -3.5556640625, -3.46142578125, -3.3671875, -3.27294921875, -3.1787109375, -3.08447265625, -2.990234375, -2.89599609375, -2.8017578125, -2.70751953125, -2.61328125, -2.51904296875, -2.4248046875, -2.33056640625, -2.236328125, -2.14208984375, -2.0478515625, -1.95361328125, -1.859375, -1.76513671875, -1.6708984375, -1.57666015625, -1.482421875, -1.38818359375, -1.2939453125, -1.19970703125, -1.10546875, -1.01123046875, -0.9169921875, -0.82275390625, -0.728515625, -0.63427734375, -0.5400390625, -0.44580078125, -0.3515625, -0.25732421875, -0.1630859375, -0.06884765625, 0.025390625, 0.11962890625, 0.2138671875, 0.30810546875, 0.40234375, 0.49658203125, 0.5908203125, 0.68505859375, 0.779296875, 0.87353515625, 0.9677734375, 1.06201171875, 1.15625, 1.25048828125, 1.3447265625, 1.43896484375, 1.533203125, 1.62744140625, 1.7216796875, 1.81591796875, 1.91015625, 2.00439453125, 2.0986328125, 2.19287109375, 2.287109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 7.0, 11.0, 8.0, 33.0, 31.0, 40.0, 63.0, 100.0, 124.0, 189.0, 321.0, 416.0, 721.0, 1250.0, 2492.0, 6664.0, 33924.0, 341985.0, 589775.0, 54742.0, 9145.0, 2930.0, 1421.0, 806.0, 470.0, 300.0, 197.0, 117.0, 92.0, 55.0, 35.0, 28.0, 13.0, 15.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4232177734375, -10.065185546875, -9.7071533203125, -9.34912109375, -8.9910888671875, -8.633056640625, -8.2750244140625, -7.9169921875, -7.5589599609375, -7.200927734375, -6.8428955078125, -6.48486328125, -6.1268310546875, -5.768798828125, -5.4107666015625, -5.052734375, -4.6947021484375, -4.336669921875, -3.9786376953125, -3.62060546875, -3.2625732421875, -2.904541015625, -2.5465087890625, -2.1884765625, -1.8304443359375, -1.472412109375, -1.1143798828125, -0.75634765625, -0.3983154296875, -0.040283203125, 0.3177490234375, 0.67578125, 1.0338134765625, 1.391845703125, 1.7498779296875, 2.10791015625, 2.4659423828125, 2.823974609375, 3.1820068359375, 3.5400390625, 3.8980712890625, 4.256103515625, 4.6141357421875, 4.97216796875, 5.3302001953125, 5.688232421875, 6.0462646484375, 6.404296875, 6.7623291015625, 7.120361328125, 7.4783935546875, 7.83642578125, 8.1944580078125, 8.552490234375, 8.9105224609375, 9.2685546875, 9.6265869140625, 9.984619140625, 10.3426513671875, 10.70068359375, 11.0587158203125, 11.416748046875, 11.7747802734375, 12.1328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 4.0, 6.0, 19.0, 12.0, 15.0, 26.0, 16.0, 19.0, 34.0, 43.0, 24.0, 40.0, 47.0, 46.0, 48.0, 54.0, 67.0, 52.0, 58.0, 30.0, 42.0, 43.0, 41.0, 36.0, 29.0, 33.0, 17.0, 13.0, 9.0, 15.0, 8.0, 9.0, 15.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.78125, -12.421875, -12.0625, -11.703125, -11.34375, -10.984375, -10.625, -10.265625, -9.90625, -9.546875, -9.1875, -8.828125, -8.46875, -8.109375, -7.75, -7.390625, -7.03125, -6.671875, -6.3125, -5.953125, -5.59375, -5.234375, -4.875, -4.515625, -4.15625, -3.796875, -3.4375, -3.078125, -2.71875, -2.359375, -2.0, -1.640625, -1.28125, -0.921875, -0.5625, -0.203125, 0.15625, 0.515625, 0.875, 1.234375, 1.59375, 1.953125, 2.3125, 2.671875, 3.03125, 3.390625, 3.75, 4.109375, 4.46875, 4.828125, 5.1875, 5.546875, 5.90625, 6.265625, 6.625, 6.984375, 7.34375, 7.703125, 8.0625, 8.421875, 8.78125, 9.140625, 9.5, 9.859375, 10.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 8.0, 11.0, 9.0, 19.0, 24.0, 42.0, 49.0, 101.0, 130.0, 212.0, 364.0, 686.0, 1275.0, 2814.0, 6715.0, 19998.0, 74010.0, 341192.0, 467184.0, 94411.0, 24648.0, 8120.0, 3199.0, 1449.0, 765.0, 401.0, 248.0, 156.0, 104.0, 55.0, 35.0, 37.0, 23.0, 17.0, 12.0, 8.0, 10.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.759765625, -2.670989990234375, -2.58221435546875, -2.493438720703125, -2.4046630859375, -2.315887451171875, -2.22711181640625, -2.138336181640625, -2.049560546875, -1.960784912109375, -1.87200927734375, -1.783233642578125, -1.6944580078125, -1.605682373046875, -1.51690673828125, -1.428131103515625, -1.33935546875, -1.250579833984375, -1.16180419921875, -1.073028564453125, -0.9842529296875, -0.895477294921875, -0.80670166015625, -0.717926025390625, -0.629150390625, -0.540374755859375, -0.45159912109375, -0.362823486328125, -0.2740478515625, -0.185272216796875, -0.09649658203125, -0.007720947265625, 0.0810546875, 0.169830322265625, 0.25860595703125, 0.347381591796875, 0.4361572265625, 0.524932861328125, 0.61370849609375, 0.702484130859375, 0.791259765625, 0.880035400390625, 0.96881103515625, 1.057586669921875, 1.1463623046875, 1.235137939453125, 1.32391357421875, 1.412689208984375, 1.50146484375, 1.590240478515625, 1.67901611328125, 1.767791748046875, 1.8565673828125, 1.945343017578125, 2.03411865234375, 2.122894287109375, 2.211669921875, 2.300445556640625, 2.38922119140625, 2.477996826171875, 2.5667724609375, 2.655548095703125, 2.74432373046875, 2.833099365234375, 2.921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 13.0, 12.0, 12.0, 13.0, 27.0, 16.0, 26.0, 31.0, 27.0, 48.0, 51.0, 62.0, 91.0, 121.0, 106.0, 57.0, 40.0, 37.0, 21.0, 36.0, 21.0, 18.0, 11.0, 10.0, 11.0, 15.0, 3.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007367134094238281, -0.0007132813334465027, -0.0006898492574691772, -0.0006664171814918518, -0.0006429851055145264, -0.0006195530295372009, -0.0005961209535598755, -0.00057268887758255, -0.0005492568016052246, -0.0005258247256278992, -0.0005023926496505737, -0.0004789605736732483, -0.00045552849769592285, -0.0004320964217185974, -0.00040866434574127197, -0.00038523226976394653, -0.0003618001937866211, -0.00033836811780929565, -0.0003149360418319702, -0.0002915039658546448, -0.00026807188987731934, -0.0002446398138999939, -0.00022120773792266846, -0.00019777566194534302, -0.00017434358596801758, -0.00015091150999069214, -0.0001274794340133667, -0.00010404735803604126, -8.061528205871582e-05, -5.718320608139038e-05, -3.375113010406494e-05, -1.0319054126739502e-05, 1.3113021850585938e-05, 3.654509782791138e-05, 5.9977173805236816e-05, 8.340924978256226e-05, 0.0001068413257598877, 0.00013027340173721313, 0.00015370547771453857, 0.00017713755369186401, 0.00020056962966918945, 0.0002240017056465149, 0.00024743378162384033, 0.00027086585760116577, 0.0002942979335784912, 0.00031773000955581665, 0.0003411620855331421, 0.00036459416151046753, 0.00038802623748779297, 0.0004114583134651184, 0.00043489038944244385, 0.0004583224654197693, 0.0004817545413970947, 0.0005051866173744202, 0.0005286186933517456, 0.000552050769329071, 0.0005754828453063965, 0.0005989149212837219, 0.0006223469972610474, 0.0006457790732383728, 0.0006692111492156982, 0.0006926432251930237, 0.0007160753011703491, 0.0007395073771476746, 0.000762939453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 12.0, 10.0, 17.0, 21.0, 20.0, 48.0, 50.0, 90.0, 168.0, 236.0, 425.0, 791.0, 1752.0, 4828.0, 20836.0, 154290.0, 710322.0, 128934.0, 18082.0, 4165.0, 1656.0, 752.0, 414.0, 224.0, 155.0, 84.0, 49.0, 44.0, 16.0, 15.0, 10.0, 10.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.91796875, -4.79010009765625, -4.6622314453125, -4.53436279296875, -4.406494140625, -4.27862548828125, -4.1507568359375, -4.02288818359375, -3.89501953125, -3.76715087890625, -3.6392822265625, -3.51141357421875, -3.383544921875, -3.25567626953125, -3.1278076171875, -2.99993896484375, -2.8720703125, -2.74420166015625, -2.6163330078125, -2.48846435546875, -2.360595703125, -2.23272705078125, -2.1048583984375, -1.97698974609375, -1.84912109375, -1.72125244140625, -1.5933837890625, -1.46551513671875, -1.337646484375, -1.20977783203125, -1.0819091796875, -0.95404052734375, -0.826171875, -0.69830322265625, -0.5704345703125, -0.44256591796875, -0.314697265625, -0.18682861328125, -0.0589599609375, 0.06890869140625, 0.19677734375, 0.32464599609375, 0.4525146484375, 0.58038330078125, 0.708251953125, 0.83612060546875, 0.9639892578125, 1.09185791015625, 1.2197265625, 1.34759521484375, 1.4754638671875, 1.60333251953125, 1.731201171875, 1.85906982421875, 1.9869384765625, 2.11480712890625, 2.24267578125, 2.37054443359375, 2.4984130859375, 2.62628173828125, 2.754150390625, 2.88201904296875, 3.0098876953125, 3.13775634765625, 3.265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 11.0, 15.0, 12.0, 13.0, 16.0, 16.0, 29.0, 29.0, 48.0, 52.0, 75.0, 88.0, 85.0, 85.0, 86.0, 77.0, 65.0, 45.0, 36.0, 28.0, 23.0, 13.0, 16.0, 13.0, 6.0, 5.0, 9.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.54296875, -4.43560791015625, -4.3282470703125, -4.22088623046875, -4.113525390625, -4.00616455078125, -3.8988037109375, -3.79144287109375, -3.68408203125, -3.57672119140625, -3.4693603515625, -3.36199951171875, -3.254638671875, -3.14727783203125, -3.0399169921875, -2.93255615234375, -2.8251953125, -2.71783447265625, -2.6104736328125, -2.50311279296875, -2.395751953125, -2.28839111328125, -2.1810302734375, -2.07366943359375, -1.96630859375, -1.85894775390625, -1.7515869140625, -1.64422607421875, -1.536865234375, -1.42950439453125, -1.3221435546875, -1.21478271484375, -1.107421875, -1.00006103515625, -0.8927001953125, -0.78533935546875, -0.677978515625, -0.57061767578125, -0.4632568359375, -0.35589599609375, -0.24853515625, -0.14117431640625, -0.0338134765625, 0.07354736328125, 0.180908203125, 0.28826904296875, 0.3956298828125, 0.50299072265625, 0.6103515625, 0.71771240234375, 0.8250732421875, 0.93243408203125, 1.039794921875, 1.14715576171875, 1.2545166015625, 1.36187744140625, 1.46923828125, 1.57659912109375, 1.6839599609375, 1.79132080078125, 1.898681640625, 2.00604248046875, 2.1134033203125, 2.22076416015625, 2.328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 15.0, 19.0, 35.0, 48.0, 74.0, 91.0, 113.0, 123.0, 110.0, 100.0, 81.0, 59.0, 43.0, 24.0, 18.0, 14.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.60453033447266, -62.79473114013672, -60.98493576049805, -59.17513656616211, -57.36534118652344, -55.5555419921875, -53.74574279785156, -51.93594741821289, -50.12615203857422, -48.31635284423828, -46.50655746459961, -44.69675827026367, -42.886962890625, -41.07716369628906, -39.267364501953125, -37.45756912231445, -35.647769927978516, -33.83797073364258, -32.028175354003906, -30.21837615966797, -28.408580780029297, -26.59878158569336, -24.788984298706055, -22.97918701171875, -21.169389724731445, -19.35959243774414, -17.549795150756836, -15.739996910095215, -13.93019962310791, -12.120402336120605, -10.310604095458984, -8.50080680847168, -6.691009521484375, -4.88121223449707, -3.0714144706726074, -1.2616167068481445, 0.5481805801391602, 2.357977867126465, 4.167776107788086, 5.977573394775391, 7.787370681762695, 9.59716796875, 11.406965255737305, 13.216763496398926, 15.02656078338623, 16.83635711669922, 18.646156311035156, 20.45595359802246, 22.265750885009766, 24.07554817199707, 25.885345458984375, 27.695144653320312, 29.504940032958984, 31.314739227294922, 33.124534606933594, 34.93433380126953, 36.74413299560547, 38.553932189941406, 40.36372756958008, 42.173526763916016, 43.98332214355469, 45.793121337890625, 47.60292053222656, 49.412715911865234, 51.222511291503906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 9.0, 10.0, 12.0, 13.0, 16.0, 24.0, 30.0, 27.0, 36.0, 28.0, 55.0, 37.0, 32.0, 45.0, 65.0, 60.0, 57.0, 51.0, 44.0, 46.0, 52.0, 47.0, 29.0, 25.0, 21.0, 14.0, 18.0, 16.0, 16.0, 10.0, 5.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-54.771141052246094, -53.17585754394531, -51.5805778503418, -49.985294342041016, -48.390010833740234, -46.79473114013672, -45.19944763183594, -43.604164123535156, -42.008880615234375, -40.413597106933594, -38.81831741333008, -37.2230339050293, -35.627750396728516, -34.032470703125, -32.43718719482422, -30.841903686523438, -29.246623992919922, -27.651342391967773, -26.056058883666992, -24.460777282714844, -22.865493774414062, -21.270212173461914, -19.674930572509766, -18.079647064208984, -16.484365463256836, -14.889082908630371, -13.293800354003906, -11.698518753051758, -10.103236198425293, -8.507953643798828, -6.91267204284668, -5.317389488220215, -3.72210693359375, -2.1268246173858643, -0.5315423011779785, 1.0637397766113281, 2.659022331237793, 4.254304885864258, 5.849586486816406, 7.444869041442871, 9.040151596069336, 10.6354341506958, 12.230716705322266, 13.825998306274414, 15.421280860900879, 17.016563415527344, 18.611845016479492, 20.20712661743164, 21.802410125732422, 23.39769172668457, 24.99297523498535, 26.5882568359375, 28.18354034423828, 29.77882194519043, 31.374103546142578, 32.96938705444336, 34.564666748046875, 36.159950256347656, 37.75522994995117, 39.35051345825195, 40.945796966552734, 42.54107666015625, 44.13636016845703, 45.73164367675781, 47.326927185058594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 9.0, 9.0, 19.0, 14.0, 18.0, 27.0, 42.0, 69.0, 100.0, 144.0, 253.0, 350.0, 596.0, 1064.0, 1830.0, 3354.0, 6988.0, 16220.0, 46969.0, 220244.0, 2678325.0, 1050765.0, 113437.0, 30639.0, 11521.0, 5262.0, 2581.0, 1350.0, 798.0, 453.0, 303.0, 170.0, 113.0, 59.0, 63.0, 32.0, 17.0, 15.0, 18.0, 8.0, 7.0, 8.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0], "bins": [-5.90234375, -5.74200439453125, -5.5816650390625, -5.42132568359375, -5.260986328125, -5.10064697265625, -4.9403076171875, -4.77996826171875, -4.61962890625, -4.45928955078125, -4.2989501953125, -4.13861083984375, -3.978271484375, -3.81793212890625, -3.6575927734375, -3.49725341796875, -3.3369140625, -3.17657470703125, -3.0162353515625, -2.85589599609375, -2.695556640625, -2.53521728515625, -2.3748779296875, -2.21453857421875, -2.05419921875, -1.89385986328125, -1.7335205078125, -1.57318115234375, -1.412841796875, -1.25250244140625, -1.0921630859375, -0.93182373046875, -0.771484375, -0.61114501953125, -0.4508056640625, -0.29046630859375, -0.130126953125, 0.03021240234375, 0.1905517578125, 0.35089111328125, 0.51123046875, 0.67156982421875, 0.8319091796875, 0.99224853515625, 1.152587890625, 1.31292724609375, 1.4732666015625, 1.63360595703125, 1.7939453125, 1.95428466796875, 2.1146240234375, 2.27496337890625, 2.435302734375, 2.59564208984375, 2.7559814453125, 2.91632080078125, 3.07666015625, 3.23699951171875, 3.3973388671875, 3.55767822265625, 3.718017578125, 3.87835693359375, 4.0386962890625, 4.19903564453125, 4.359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 8.0, 12.0, 9.0, 10.0, 25.0, 25.0, 35.0, 41.0, 41.0, 57.0, 79.0, 75.0, 63.0, 75.0, 75.0, 63.0, 52.0, 55.0, 42.0, 35.0, 35.0, 27.0, 16.0, 14.0, 11.0, 6.0, 2.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.37109375, -4.269775390625, -4.16845703125, -4.067138671875, -3.9658203125, -3.864501953125, -3.76318359375, -3.661865234375, -3.560546875, -3.459228515625, -3.35791015625, -3.256591796875, -3.1552734375, -3.053955078125, -2.95263671875, -2.851318359375, -2.75, -2.648681640625, -2.54736328125, -2.446044921875, -2.3447265625, -2.243408203125, -2.14208984375, -2.040771484375, -1.939453125, -1.838134765625, -1.73681640625, -1.635498046875, -1.5341796875, -1.432861328125, -1.33154296875, -1.230224609375, -1.12890625, -1.027587890625, -0.92626953125, -0.824951171875, -0.7236328125, -0.622314453125, -0.52099609375, -0.419677734375, -0.318359375, -0.217041015625, -0.11572265625, -0.014404296875, 0.0869140625, 0.188232421875, 0.28955078125, 0.390869140625, 0.4921875, 0.593505859375, 0.69482421875, 0.796142578125, 0.8974609375, 0.998779296875, 1.10009765625, 1.201416015625, 1.302734375, 1.404052734375, 1.50537109375, 1.606689453125, 1.7080078125, 1.809326171875, 1.91064453125, 2.011962890625, 2.11328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 3.0, 15.0, 11.0, 24.0, 30.0, 40.0, 77.0, 116.0, 191.0, 376.0, 713.0, 1493.0, 3838.0, 10299.0, 35318.0, 190776.0, 3139995.0, 710413.0, 71911.0, 18073.0, 5994.0, 2301.0, 1054.0, 512.0, 267.0, 140.0, 99.0, 64.0, 42.0, 14.0, 19.0, 21.0, 15.0, 4.0, 5.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.578125, -7.353515625, -7.12890625, -6.904296875, -6.6796875, -6.455078125, -6.23046875, -6.005859375, -5.78125, -5.556640625, -5.33203125, -5.107421875, -4.8828125, -4.658203125, -4.43359375, -4.208984375, -3.984375, -3.759765625, -3.53515625, -3.310546875, -3.0859375, -2.861328125, -2.63671875, -2.412109375, -2.1875, -1.962890625, -1.73828125, -1.513671875, -1.2890625, -1.064453125, -0.83984375, -0.615234375, -0.390625, -0.166015625, 0.05859375, 0.283203125, 0.5078125, 0.732421875, 0.95703125, 1.181640625, 1.40625, 1.630859375, 1.85546875, 2.080078125, 2.3046875, 2.529296875, 2.75390625, 2.978515625, 3.203125, 3.427734375, 3.65234375, 3.876953125, 4.1015625, 4.326171875, 4.55078125, 4.775390625, 5.0, 5.224609375, 5.44921875, 5.673828125, 5.8984375, 6.123046875, 6.34765625, 6.572265625, 6.796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 2.0, 8.0, 15.0, 11.0, 14.0, 29.0, 33.0, 38.0, 63.0, 110.0, 162.0, 280.0, 488.0, 823.0, 825.0, 458.0, 241.0, 135.0, 103.0, 56.0, 36.0, 32.0, 24.0, 14.0, 10.0, 11.0, 10.0, 6.0, 7.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.11676025390625, -5.8975830078125, -5.67840576171875, -5.459228515625, -5.24005126953125, -5.0208740234375, -4.80169677734375, -4.58251953125, -4.36334228515625, -4.1441650390625, -3.92498779296875, -3.705810546875, -3.48663330078125, -3.2674560546875, -3.04827880859375, -2.8291015625, -2.60992431640625, -2.3907470703125, -2.17156982421875, -1.952392578125, -1.73321533203125, -1.5140380859375, -1.29486083984375, -1.07568359375, -0.85650634765625, -0.6373291015625, -0.41815185546875, -0.198974609375, 0.02020263671875, 0.2393798828125, 0.45855712890625, 0.677734375, 0.89691162109375, 1.1160888671875, 1.33526611328125, 1.554443359375, 1.77362060546875, 1.9927978515625, 2.21197509765625, 2.43115234375, 2.65032958984375, 2.8695068359375, 3.08868408203125, 3.307861328125, 3.52703857421875, 3.7462158203125, 3.96539306640625, 4.1845703125, 4.40374755859375, 4.6229248046875, 4.84210205078125, 5.061279296875, 5.28045654296875, 5.4996337890625, 5.71881103515625, 5.93798828125, 6.15716552734375, 6.3763427734375, 6.59552001953125, 6.814697265625, 7.03387451171875, 7.2530517578125, 7.47222900390625, 7.69140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 10.0, 14.0, 22.0, 53.0, 76.0, 133.0, 168.0, 174.0, 126.0, 101.0, 51.0, 23.0, 14.0, 10.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.672786712646484, -50.492698669433594, -48.31261444091797, -46.13252639770508, -43.95243835449219, -41.7723503112793, -39.592262268066406, -37.41217803955078, -35.23208999633789, -33.052001953125, -30.871915817260742, -28.691829681396484, -26.511741638183594, -24.331653594970703, -22.151567459106445, -19.971481323242188, -17.791393280029297, -15.611306190490723, -13.431219100952148, -11.251132011413574, -9.071044921875, -6.890957832336426, -4.710870742797852, -2.5307836532592773, -0.3506965637207031, 1.829390525817871, 4.009477615356445, 6.1895647048950195, 8.369651794433594, 10.549738883972168, 12.729825973510742, 14.909913063049316, 17.089996337890625, 19.270084381103516, 21.450170516967773, 23.63025665283203, 25.810344696044922, 27.990432739257812, 30.17051887512207, 32.35060501098633, 34.53069305419922, 36.71078109741211, 38.890869140625, 41.070953369140625, 43.251041412353516, 45.431129455566406, 47.61121368408203, 49.79130172729492, 51.97138977050781, 54.1514778137207, 56.331565856933594, 58.51165008544922, 60.69173812866211, 62.871826171875, 65.05191040039062, 67.23200225830078, 69.4120864868164, 71.59217071533203, 73.77226257324219, 75.95234680175781, 78.13243103027344, 80.3125228881836, 82.49260711669922, 84.67269897460938, 86.852783203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 11.0, 12.0, 21.0, 19.0, 12.0, 31.0, 17.0, 37.0, 32.0, 34.0, 59.0, 42.0, 39.0, 44.0, 37.0, 44.0, 50.0, 48.0, 40.0, 42.0, 49.0, 30.0, 30.0, 30.0, 33.0, 24.0, 27.0, 23.0, 8.0, 16.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.845794677734375, -27.835613250732422, -26.825429916381836, -25.81524658203125, -24.805065155029297, -23.794883728027344, -22.784700393676758, -21.774517059326172, -20.76433563232422, -19.754154205322266, -18.74397087097168, -17.733787536621094, -16.72360610961914, -15.713423728942871, -14.703241348266602, -13.693058967590332, -12.682876586914062, -11.672694206237793, -10.662511825561523, -9.652329444885254, -8.642147064208984, -7.631964683532715, -6.621782302856445, -5.611599922180176, -4.601417541503906, -3.5912351608276367, -2.581052780151367, -1.5708703994750977, -0.5606880187988281, 0.4494943618774414, 1.459676742553711, 2.4698591232299805, 3.4800453186035156, 4.490227699279785, 5.500410079956055, 6.510592460632324, 7.520774841308594, 8.530957221984863, 9.541139602661133, 10.551321983337402, 11.561504364013672, 12.571686744689941, 13.581869125366211, 14.59205150604248, 15.60223388671875, 16.612415313720703, 17.62259864807129, 18.632781982421875, 19.642963409423828, 20.65314483642578, 21.663328170776367, 22.673511505126953, 23.683692932128906, 24.69387435913086, 25.704057693481445, 26.71424102783203, 27.724422454833984, 28.734603881835938, 29.744787216186523, 30.75497055053711, 31.765151977539062, 32.775333404541016, 33.78551483154297, 34.79570007324219, 35.80588150024414]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 17.0, 23.0, 34.0, 69.0, 78.0, 113.0, 150.0, 244.0, 393.0, 600.0, 995.0, 1541.0, 2594.0, 4661.0, 8018.0, 15337.0, 29188.0, 61649.0, 151619.0, 380180.0, 225738.0, 83726.0, 38378.0, 19186.0, 10114.0, 5618.0, 3188.0, 1903.0, 1157.0, 700.0, 401.0, 280.0, 230.0, 126.0, 86.0, 74.0, 44.0, 33.0, 17.0, 17.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8515625, -4.703125, -4.5546875, -4.40625, -4.2578125, -4.109375, -3.9609375, -3.8125, -3.6640625, -3.515625, -3.3671875, -3.21875, -3.0703125, -2.921875, -2.7734375, -2.625, -2.4765625, -2.328125, -2.1796875, -2.03125, -1.8828125, -1.734375, -1.5859375, -1.4375, -1.2890625, -1.140625, -0.9921875, -0.84375, -0.6953125, -0.546875, -0.3984375, -0.25, -0.1015625, 0.046875, 0.1953125, 0.34375, 0.4921875, 0.640625, 0.7890625, 0.9375, 1.0859375, 1.234375, 1.3828125, 1.53125, 1.6796875, 1.828125, 1.9765625, 2.125, 2.2734375, 2.421875, 2.5703125, 2.71875, 2.8671875, 3.015625, 3.1640625, 3.3125, 3.4609375, 3.609375, 3.7578125, 3.90625, 4.0546875, 4.203125, 4.3515625, 4.5]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 10.0, 10.0, 15.0, 16.0, 15.0, 24.0, 23.0, 29.0, 29.0, 14.0, 43.0, 39.0, 49.0, 42.0, 46.0, 53.0, 54.0, 44.0, 36.0, 40.0, 38.0, 38.0, 33.0, 40.0, 30.0, 28.0, 13.0, 26.0, 18.0, 11.0, 15.0, 14.0, 9.0, 14.0, 6.0, 8.0, 8.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.314453125, -2.249755859375, -2.18505859375, -2.120361328125, -2.0556640625, -1.990966796875, -1.92626953125, -1.861572265625, -1.796875, -1.732177734375, -1.66748046875, -1.602783203125, -1.5380859375, -1.473388671875, -1.40869140625, -1.343994140625, -1.279296875, -1.214599609375, -1.14990234375, -1.085205078125, -1.0205078125, -0.955810546875, -0.89111328125, -0.826416015625, -0.76171875, -0.697021484375, -0.63232421875, -0.567626953125, -0.5029296875, -0.438232421875, -0.37353515625, -0.308837890625, -0.244140625, -0.179443359375, -0.11474609375, -0.050048828125, 0.0146484375, 0.079345703125, 0.14404296875, 0.208740234375, 0.2734375, 0.338134765625, 0.40283203125, 0.467529296875, 0.5322265625, 0.596923828125, 0.66162109375, 0.726318359375, 0.791015625, 0.855712890625, 0.92041015625, 0.985107421875, 1.0498046875, 1.114501953125, 1.17919921875, 1.243896484375, 1.30859375, 1.373291015625, 1.43798828125, 1.502685546875, 1.5673828125, 1.632080078125, 1.69677734375, 1.761474609375, 1.826171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 10.0, 12.0, 26.0, 24.0, 35.0, 59.0, 107.0, 132.0, 231.0, 339.0, 592.0, 1050.0, 2193.0, 6637.0, 32034.0, 426117.0, 531768.0, 35208.0, 6879.0, 2363.0, 1124.0, 567.0, 344.0, 237.0, 144.0, 95.0, 69.0, 52.0, 27.0, 24.0, 11.0, 13.0, 12.0, 11.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.7642822265625, -10.380126953125, -9.9959716796875, -9.61181640625, -9.2276611328125, -8.843505859375, -8.4593505859375, -8.0751953125, -7.6910400390625, -7.306884765625, -6.9227294921875, -6.53857421875, -6.1544189453125, -5.770263671875, -5.3861083984375, -5.001953125, -4.6177978515625, -4.233642578125, -3.8494873046875, -3.46533203125, -3.0811767578125, -2.697021484375, -2.3128662109375, -1.9287109375, -1.5445556640625, -1.160400390625, -0.7762451171875, -0.39208984375, -0.0079345703125, 0.376220703125, 0.7603759765625, 1.14453125, 1.5286865234375, 1.912841796875, 2.2969970703125, 2.68115234375, 3.0653076171875, 3.449462890625, 3.8336181640625, 4.2177734375, 4.6019287109375, 4.986083984375, 5.3702392578125, 5.75439453125, 6.1385498046875, 6.522705078125, 6.9068603515625, 7.291015625, 7.6751708984375, 8.059326171875, 8.4434814453125, 8.82763671875, 9.2117919921875, 9.595947265625, 9.9801025390625, 10.3642578125, 10.7484130859375, 11.132568359375, 11.5167236328125, 11.90087890625, 12.2850341796875, 12.669189453125, 13.0533447265625, 13.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 14.0, 10.0, 4.0, 12.0, 16.0, 18.0, 32.0, 29.0, 35.0, 30.0, 33.0, 30.0, 45.0, 50.0, 53.0, 53.0, 49.0, 37.0, 39.0, 47.0, 41.0, 41.0, 34.0, 27.0, 26.0, 29.0, 20.0, 24.0, 21.0, 12.0, 17.0, 9.0, 9.0, 8.0, 4.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.185546875, -7.88671875, -7.587890625, -7.2890625, -6.990234375, -6.69140625, -6.392578125, -6.09375, -5.794921875, -5.49609375, -5.197265625, -4.8984375, -4.599609375, -4.30078125, -4.001953125, -3.703125, -3.404296875, -3.10546875, -2.806640625, -2.5078125, -2.208984375, -1.91015625, -1.611328125, -1.3125, -1.013671875, -0.71484375, -0.416015625, -0.1171875, 0.181640625, 0.48046875, 0.779296875, 1.078125, 1.376953125, 1.67578125, 1.974609375, 2.2734375, 2.572265625, 2.87109375, 3.169921875, 3.46875, 3.767578125, 4.06640625, 4.365234375, 4.6640625, 4.962890625, 5.26171875, 5.560546875, 5.859375, 6.158203125, 6.45703125, 6.755859375, 7.0546875, 7.353515625, 7.65234375, 7.951171875, 8.25, 8.548828125, 8.84765625, 9.146484375, 9.4453125, 9.744140625, 10.04296875, 10.341796875, 10.640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 13.0, 12.0, 19.0, 45.0, 75.0, 118.0, 224.0, 470.0, 1097.0, 3009.0, 10424.0, 52804.0, 604432.0, 326431.0, 37333.0, 7866.0, 2436.0, 890.0, 391.0, 192.0, 96.0, 48.0, 40.0, 31.0, 8.0, 16.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.22869873046875, -4.0823974609375, -3.93609619140625, -3.789794921875, -3.64349365234375, -3.4971923828125, -3.35089111328125, -3.20458984375, -3.05828857421875, -2.9119873046875, -2.76568603515625, -2.619384765625, -2.47308349609375, -2.3267822265625, -2.18048095703125, -2.0341796875, -1.88787841796875, -1.7415771484375, -1.59527587890625, -1.448974609375, -1.30267333984375, -1.1563720703125, -1.01007080078125, -0.86376953125, -0.71746826171875, -0.5711669921875, -0.42486572265625, -0.278564453125, -0.13226318359375, 0.0140380859375, 0.16033935546875, 0.306640625, 0.45294189453125, 0.5992431640625, 0.74554443359375, 0.891845703125, 1.03814697265625, 1.1844482421875, 1.33074951171875, 1.47705078125, 1.62335205078125, 1.7696533203125, 1.91595458984375, 2.062255859375, 2.20855712890625, 2.3548583984375, 2.50115966796875, 2.6474609375, 2.79376220703125, 2.9400634765625, 3.08636474609375, 3.232666015625, 3.37896728515625, 3.5252685546875, 3.67156982421875, 3.81787109375, 3.96417236328125, 4.1104736328125, 4.25677490234375, 4.403076171875, 4.54937744140625, 4.6956787109375, 4.84197998046875, 4.98828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 10.0, 22.0, 24.0, 20.0, 34.0, 50.0, 78.0, 172.0, 176.0, 127.0, 77.0, 35.0, 36.0, 28.0, 15.0, 14.0, 7.0, 14.0, 12.0, 2.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012636184692382812, -0.0012267082929611206, -0.00118979811668396, -0.0011528879404067993, -0.0011159777641296387, -0.001079067587852478, -0.0010421574115753174, -0.0010052472352981567, -0.0009683370590209961, -0.0009314268827438354, -0.0008945167064666748, -0.0008576065301895142, -0.0008206963539123535, -0.0007837861776351929, -0.0007468760013580322, -0.0007099658250808716, -0.0006730556488037109, -0.0006361454725265503, -0.0005992352962493896, -0.000562325119972229, -0.0005254149436950684, -0.0004885047674179077, -0.00045159459114074707, -0.0004146844148635864, -0.0003777742385864258, -0.00034086406230926514, -0.0003039538860321045, -0.00026704370975494385, -0.0002301335334777832, -0.00019322335720062256, -0.00015631318092346191, -0.00011940300464630127, -8.249282836914062e-05, -4.558265209197998e-05, -8.672475814819336e-06, 2.823770046234131e-05, 6.514787673950195e-05, 0.0001020580530166626, 0.00013896822929382324, 0.0001758784055709839, 0.00021278858184814453, 0.0002496987581253052, 0.0002866089344024658, 0.00032351911067962646, 0.0003604292869567871, 0.00039733946323394775, 0.0004342496395111084, 0.00047115981578826904, 0.0005080699920654297, 0.0005449801683425903, 0.000581890344619751, 0.0006188005208969116, 0.0006557106971740723, 0.0006926208734512329, 0.0007295310497283936, 0.0007664412260055542, 0.0008033514022827148, 0.0008402615785598755, 0.0008771717548370361, 0.0009140819311141968, 0.0009509921073913574, 0.000987902283668518, 0.0010248124599456787, 0.0010617226362228394, 0.0010986328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 16.0, 24.0, 34.0, 55.0, 64.0, 103.0, 169.0, 316.0, 449.0, 827.0, 1736.0, 3942.0, 12170.0, 56930.0, 503435.0, 398520.0, 51186.0, 11181.0, 3657.0, 1627.0, 834.0, 449.0, 271.0, 185.0, 119.0, 75.0, 43.0, 37.0, 29.0, 12.0, 17.0, 8.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.3359375, -4.211944580078125, -4.08795166015625, -3.963958740234375, -3.8399658203125, -3.715972900390625, -3.59197998046875, -3.467987060546875, -3.343994140625, -3.220001220703125, -3.09600830078125, -2.972015380859375, -2.8480224609375, -2.724029541015625, -2.60003662109375, -2.476043701171875, -2.35205078125, -2.228057861328125, -2.10406494140625, -1.980072021484375, -1.8560791015625, -1.732086181640625, -1.60809326171875, -1.484100341796875, -1.360107421875, -1.236114501953125, -1.11212158203125, -0.988128662109375, -0.8641357421875, -0.740142822265625, -0.61614990234375, -0.492156982421875, -0.3681640625, -0.244171142578125, -0.12017822265625, 0.003814697265625, 0.1278076171875, 0.251800537109375, 0.37579345703125, 0.499786376953125, 0.623779296875, 0.747772216796875, 0.87176513671875, 0.995758056640625, 1.1197509765625, 1.243743896484375, 1.36773681640625, 1.491729736328125, 1.61572265625, 1.739715576171875, 1.86370849609375, 1.987701416015625, 2.1116943359375, 2.235687255859375, 2.35968017578125, 2.483673095703125, 2.607666015625, 2.731658935546875, 2.85565185546875, 2.979644775390625, 3.1036376953125, 3.227630615234375, 3.35162353515625, 3.475616455078125, 3.599609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 3.0, 5.0, 7.0, 10.0, 10.0, 16.0, 14.0, 14.0, 22.0, 26.0, 27.0, 28.0, 42.0, 50.0, 46.0, 70.0, 71.0, 87.0, 62.0, 68.0, 52.0, 59.0, 34.0, 41.0, 29.0, 17.0, 19.0, 10.0, 8.0, 13.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.68328857421875, -2.5970458984375, -2.51080322265625, -2.424560546875, -2.33831787109375, -2.2520751953125, -2.16583251953125, -2.07958984375, -1.99334716796875, -1.9071044921875, -1.82086181640625, -1.734619140625, -1.64837646484375, -1.5621337890625, -1.47589111328125, -1.3896484375, -1.30340576171875, -1.2171630859375, -1.13092041015625, -1.044677734375, -0.95843505859375, -0.8721923828125, -0.78594970703125, -0.69970703125, -0.61346435546875, -0.5272216796875, -0.44097900390625, -0.354736328125, -0.26849365234375, -0.1822509765625, -0.09600830078125, -0.009765625, 0.07647705078125, 0.1627197265625, 0.24896240234375, 0.335205078125, 0.42144775390625, 0.5076904296875, 0.59393310546875, 0.68017578125, 0.76641845703125, 0.8526611328125, 0.93890380859375, 1.025146484375, 1.11138916015625, 1.1976318359375, 1.28387451171875, 1.3701171875, 1.45635986328125, 1.5426025390625, 1.62884521484375, 1.715087890625, 1.80133056640625, 1.8875732421875, 1.97381591796875, 2.06005859375, 2.14630126953125, 2.2325439453125, 2.31878662109375, 2.405029296875, 2.49127197265625, 2.5775146484375, 2.66375732421875, 2.75]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 13.0, 22.0, 39.0, 88.0, 122.0, 182.0, 187.0, 127.0, 88.0, 58.0, 22.0, 17.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-88.24029541015625, -85.86024475097656, -83.48018646240234, -81.10013580322266, -78.72007751464844, -76.34002685546875, -73.95996856689453, -71.57991790771484, -69.19985961914062, -66.81980895996094, -64.43975067138672, -62.059696197509766, -59.67964172363281, -57.29958724975586, -54.919532775878906, -52.53948211669922, -50.159427642822266, -47.77937316894531, -45.39931869506836, -43.019264221191406, -40.63920974731445, -38.2591552734375, -35.87910461425781, -33.499046325683594, -31.118993759155273, -28.73893928527832, -26.358884811401367, -23.978832244873047, -21.598777770996094, -19.21872329711914, -16.838668823242188, -14.458614349365234, -12.078559875488281, -9.698505401611328, -7.318451404571533, -4.938397407531738, -2.558342933654785, -0.17828845977783203, 2.2017650604248047, 4.581819534301758, 6.961874008178711, 9.341928482055664, 11.721982955932617, 14.102036476135254, 16.48208999633789, 18.862144470214844, 21.242198944091797, 23.62225341796875, 26.002307891845703, 28.382362365722656, 30.76241683959961, 33.14247131347656, 35.522525787353516, 37.90258026123047, 40.282630920410156, 42.662689208984375, 45.04273986816406, 47.422794342041016, 49.80284881591797, 52.18290328979492, 54.562957763671875, 56.94301223754883, 59.32306671142578, 61.70311737060547, 64.08317565917969]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 7.0, 13.0, 11.0, 18.0, 13.0, 25.0, 30.0, 27.0, 32.0, 41.0, 24.0, 50.0, 48.0, 48.0, 55.0, 57.0, 70.0, 44.0, 39.0, 34.0, 31.0, 27.0, 37.0, 44.0, 28.0, 19.0, 22.0, 16.0, 19.0, 12.0, 5.0, 6.0, 9.0, 11.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.08901023864746, -29.91200828552246, -28.735004425048828, -27.558002471923828, -26.381000518798828, -25.203998565673828, -24.026994705200195, -22.849992752075195, -21.672988891601562, -20.495986938476562, -19.31898307800293, -18.14198112487793, -16.96497917175293, -15.787976264953613, -14.610973358154297, -13.433971405029297, -12.256969451904297, -11.07996654510498, -9.90296459197998, -8.725961685180664, -7.548959255218506, -6.371956825256348, -5.194953918457031, -4.017951965332031, -2.840949058532715, -1.663946509361267, -0.48694396018981934, 0.690058708190918, 1.8670611381530762, 3.0440635681152344, 4.221066474914551, 5.398068428039551, 6.575069427490234, 7.752071857452393, 8.92907428741455, 10.106077194213867, 11.283079147338867, 12.460082054138184, 13.6370849609375, 14.8140869140625, 15.991089820861816, 17.168092727661133, 18.345094680786133, 19.522098541259766, 20.699100494384766, 21.876102447509766, 23.053104400634766, 24.230106353759766, 25.4071102142334, 26.5841121673584, 27.76111602783203, 28.93811798095703, 30.11511993408203, 31.29212188720703, 32.46912384033203, 33.64612579345703, 34.8231315612793, 36.0001335144043, 37.1771354675293, 38.35414123535156, 39.53114318847656, 40.70814514160156, 41.88514709472656, 43.06214904785156, 44.23915100097656]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 17.0, 16.0, 30.0, 42.0, 61.0, 90.0, 173.0, 464.0, 2495.0, 44708.0, 4074510.0, 67563.0, 3063.0, 542.0, 167.0, 101.0, 60.0, 55.0, 32.0, 10.0, 17.0, 17.0, 8.0, 7.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0625, -14.4951171875, -13.927734375, -13.3603515625, -12.79296875, -12.2255859375, -11.658203125, -11.0908203125, -10.5234375, -9.9560546875, -9.388671875, -8.8212890625, -8.25390625, -7.6865234375, -7.119140625, -6.5517578125, -5.984375, -5.4169921875, -4.849609375, -4.2822265625, -3.71484375, -3.1474609375, -2.580078125, -2.0126953125, -1.4453125, -0.8779296875, -0.310546875, 0.2568359375, 0.82421875, 1.3916015625, 1.958984375, 2.5263671875, 3.09375, 3.6611328125, 4.228515625, 4.7958984375, 5.36328125, 5.9306640625, 6.498046875, 7.0654296875, 7.6328125, 8.2001953125, 8.767578125, 9.3349609375, 9.90234375, 10.4697265625, 11.037109375, 11.6044921875, 12.171875, 12.7392578125, 13.306640625, 13.8740234375, 14.44140625, 15.0087890625, 15.576171875, 16.1435546875, 16.7109375, 17.2783203125, 17.845703125, 18.4130859375, 18.98046875, 19.5478515625, 20.115234375, 20.6826171875, 21.25]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 17.0, 15.0, 13.0, 16.0, 21.0, 27.0, 23.0, 34.0, 44.0, 46.0, 51.0, 46.0, 44.0, 51.0, 49.0, 39.0, 50.0, 43.0, 44.0, 45.0, 27.0, 48.0, 29.0, 24.0, 26.0, 18.0, 17.0, 15.0, 11.0, 8.0, 10.0, 1.0, 6.0, 8.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.974609375, -1.90997314453125, -1.8453369140625, -1.78070068359375, -1.716064453125, -1.65142822265625, -1.5867919921875, -1.52215576171875, -1.45751953125, -1.39288330078125, -1.3282470703125, -1.26361083984375, -1.198974609375, -1.13433837890625, -1.0697021484375, -1.00506591796875, -0.9404296875, -0.87579345703125, -0.8111572265625, -0.74652099609375, -0.681884765625, -0.61724853515625, -0.5526123046875, -0.48797607421875, -0.42333984375, -0.35870361328125, -0.2940673828125, -0.22943115234375, -0.164794921875, -0.10015869140625, -0.0355224609375, 0.02911376953125, 0.09375, 0.15838623046875, 0.2230224609375, 0.28765869140625, 0.352294921875, 0.41693115234375, 0.4815673828125, 0.54620361328125, 0.61083984375, 0.67547607421875, 0.7401123046875, 0.80474853515625, 0.869384765625, 0.93402099609375, 0.9986572265625, 1.06329345703125, 1.1279296875, 1.19256591796875, 1.2572021484375, 1.32183837890625, 1.386474609375, 1.45111083984375, 1.5157470703125, 1.58038330078125, 1.64501953125, 1.70965576171875, 1.7742919921875, 1.83892822265625, 1.903564453125, 1.96820068359375, 2.0328369140625, 2.09747314453125, 2.162109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 9.0, 21.0, 29.0, 49.0, 72.0, 91.0, 154.0, 247.0, 439.0, 718.0, 1313.0, 2576.0, 5543.0, 12706.0, 35388.0, 132802.0, 902178.0, 2604078.0, 382208.0, 73571.0, 22520.0, 8968.0, 4040.0, 1944.0, 1063.0, 615.0, 327.0, 241.0, 115.0, 93.0, 42.0, 29.0, 27.0, 15.0, 14.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.707000732421875, -3.56048583984375, -3.413970947265625, -3.2674560546875, -3.120941162109375, -2.97442626953125, -2.827911376953125, -2.681396484375, -2.534881591796875, -2.38836669921875, -2.241851806640625, -2.0953369140625, -1.948822021484375, -1.80230712890625, -1.655792236328125, -1.50927734375, -1.362762451171875, -1.21624755859375, -1.069732666015625, -0.9232177734375, -0.776702880859375, -0.63018798828125, -0.483673095703125, -0.337158203125, -0.190643310546875, -0.04412841796875, 0.102386474609375, 0.2489013671875, 0.395416259765625, 0.54193115234375, 0.688446044921875, 0.8349609375, 0.981475830078125, 1.12799072265625, 1.274505615234375, 1.4210205078125, 1.567535400390625, 1.71405029296875, 1.860565185546875, 2.007080078125, 2.153594970703125, 2.30010986328125, 2.446624755859375, 2.5931396484375, 2.739654541015625, 2.88616943359375, 3.032684326171875, 3.17919921875, 3.325714111328125, 3.47222900390625, 3.618743896484375, 3.7652587890625, 3.911773681640625, 4.05828857421875, 4.204803466796875, 4.351318359375, 4.497833251953125, 4.64434814453125, 4.790863037109375, 4.9373779296875, 5.083892822265625, 5.23040771484375, 5.376922607421875, 5.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 16.0, 24.0, 24.0, 28.0, 72.0, 93.0, 146.0, 273.0, 441.0, 794.0, 841.0, 567.0, 304.0, 152.0, 100.0, 63.0, 39.0, 19.0, 18.0, 12.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.87109375, -7.6468505859375, -7.422607421875, -7.1983642578125, -6.97412109375, -6.7498779296875, -6.525634765625, -6.3013916015625, -6.0771484375, -5.8529052734375, -5.628662109375, -5.4044189453125, -5.18017578125, -4.9559326171875, -4.731689453125, -4.5074462890625, -4.283203125, -4.0589599609375, -3.834716796875, -3.6104736328125, -3.38623046875, -3.1619873046875, -2.937744140625, -2.7135009765625, -2.4892578125, -2.2650146484375, -2.040771484375, -1.8165283203125, -1.59228515625, -1.3680419921875, -1.143798828125, -0.9195556640625, -0.6953125, -0.4710693359375, -0.246826171875, -0.0225830078125, 0.20166015625, 0.4259033203125, 0.650146484375, 0.8743896484375, 1.0986328125, 1.3228759765625, 1.547119140625, 1.7713623046875, 1.99560546875, 2.2198486328125, 2.444091796875, 2.6683349609375, 2.892578125, 3.1168212890625, 3.341064453125, 3.5653076171875, 3.78955078125, 4.0137939453125, 4.238037109375, 4.4622802734375, 4.6865234375, 4.9107666015625, 5.135009765625, 5.3592529296875, 5.58349609375, 5.8077392578125, 6.031982421875, 6.2562255859375, 6.48046875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 11.0, 20.0, 61.0, 87.0, 153.0, 195.0, 207.0, 134.0, 60.0, 30.0, 13.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-91.51319885253906, -89.37858581542969, -87.24397277832031, -85.10935974121094, -82.97474670410156, -80.84013366699219, -78.70552062988281, -76.57090759277344, -74.43629455566406, -72.30168151855469, -70.16706848144531, -68.03245544433594, -65.89784240722656, -63.76322937011719, -61.62861251831055, -59.49399948120117, -57.35938262939453, -55.224769592285156, -53.09015655517578, -50.955543518066406, -48.82093048095703, -46.686317443847656, -44.551700592041016, -42.41708755493164, -40.282474517822266, -38.14786148071289, -36.013248443603516, -33.87863540649414, -31.744020462036133, -29.609407424926758, -27.47479248046875, -25.340179443359375, -23.205562591552734, -21.07094955444336, -18.936336517333984, -16.801721572875977, -14.667108535766602, -12.532495498657227, -10.397881507873535, -8.263267517089844, -6.128654479980469, -3.9940409660339355, -1.8594274520874023, 0.27518606185913086, 2.409799575805664, 4.544412612915039, 6.6790266036987305, 8.813640594482422, 10.948253631591797, 13.082866668701172, 15.217480659484863, 17.352094650268555, 19.48670768737793, 21.621320724487305, 23.755935668945312, 25.890548706054688, 28.025161743164062, 30.159774780273438, 32.29438781738281, 34.42900085449219, 36.56361389160156, 38.69822692871094, 40.83284378051758, 42.96745681762695, 45.10206985473633]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 10.0, 11.0, 23.0, 25.0, 38.0, 27.0, 29.0, 35.0, 41.0, 43.0, 23.0, 31.0, 51.0, 35.0, 43.0, 43.0, 41.0, 35.0, 37.0, 29.0, 28.0, 30.0, 33.0, 29.0, 27.0, 24.0, 17.0, 21.0, 17.0, 14.0, 15.0, 5.0, 11.0, 11.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-23.235137939453125, -22.518321990966797, -21.80150604248047, -21.08469009399414, -20.367874145507812, -19.651058197021484, -18.934242248535156, -18.217426300048828, -17.5006103515625, -16.783794403076172, -16.066978454589844, -15.350162506103516, -14.633346557617188, -13.91653060913086, -13.199714660644531, -12.482898712158203, -11.766083717346191, -11.049267768859863, -10.332451820373535, -9.615635871887207, -8.898819923400879, -8.18200397491455, -7.465188503265381, -6.748372554779053, -6.031556606292725, -5.3147406578063965, -4.597924709320068, -3.8811089992523193, -3.164293050765991, -2.447477102279663, -1.730661392211914, -1.013845443725586, -0.2970294952392578, 0.41978639364242554, 1.1366022825241089, 1.8534181118011475, 2.5702340602874756, 3.2870500087738037, 4.003865718841553, 4.720681667327881, 5.437497615814209, 6.154313564300537, 6.871129512786865, 7.587944984436035, 8.304760932922363, 9.021576881408691, 9.73839282989502, 10.455208778381348, 11.172024726867676, 11.888840675354004, 12.605656623840332, 13.32247257232666, 14.039288520812988, 14.756104469299316, 15.472919464111328, 16.189735412597656, 16.906551361083984, 17.623367309570312, 18.34018325805664, 19.05699920654297, 19.773815155029297, 20.490631103515625, 21.207447052001953, 21.92426300048828, 22.64107894897461]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 7.0, 16.0, 22.0, 29.0, 37.0, 55.0, 89.0, 105.0, 161.0, 252.0, 348.0, 534.0, 844.0, 1235.0, 1959.0, 3458.0, 6013.0, 10491.0, 19899.0, 40448.0, 99584.0, 307719.0, 346652.0, 113853.0, 45320.0, 21970.0, 11451.0, 6395.0, 3624.0, 2135.0, 1279.0, 865.0, 530.0, 371.0, 233.0, 151.0, 118.0, 90.0, 61.0, 43.0, 35.0, 21.0, 16.0, 17.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.63671875, -4.5006103515625, -4.364501953125, -4.2283935546875, -4.09228515625, -3.9561767578125, -3.820068359375, -3.6839599609375, -3.5478515625, -3.4117431640625, -3.275634765625, -3.1395263671875, -3.00341796875, -2.8673095703125, -2.731201171875, -2.5950927734375, -2.458984375, -2.3228759765625, -2.186767578125, -2.0506591796875, -1.91455078125, -1.7784423828125, -1.642333984375, -1.5062255859375, -1.3701171875, -1.2340087890625, -1.097900390625, -0.9617919921875, -0.82568359375, -0.6895751953125, -0.553466796875, -0.4173583984375, -0.28125, -0.1451416015625, -0.009033203125, 0.1270751953125, 0.26318359375, 0.3992919921875, 0.535400390625, 0.6715087890625, 0.8076171875, 0.9437255859375, 1.079833984375, 1.2159423828125, 1.35205078125, 1.4881591796875, 1.624267578125, 1.7603759765625, 1.896484375, 2.0325927734375, 2.168701171875, 2.3048095703125, 2.44091796875, 2.5770263671875, 2.713134765625, 2.8492431640625, 2.9853515625, 3.1214599609375, 3.257568359375, 3.3936767578125, 3.52978515625, 3.6658935546875, 3.802001953125, 3.9381103515625, 4.07421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 10.0, 12.0, 13.0, 11.0, 15.0, 18.0, 22.0, 34.0, 24.0, 43.0, 30.0, 43.0, 35.0, 41.0, 47.0, 34.0, 51.0, 44.0, 33.0, 54.0, 51.0, 51.0, 30.0, 27.0, 34.0, 27.0, 34.0, 20.0, 22.0, 20.0, 10.0, 8.0, 5.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.060546875, -1.995880126953125, -1.93121337890625, -1.866546630859375, -1.8018798828125, -1.737213134765625, -1.67254638671875, -1.607879638671875, -1.543212890625, -1.478546142578125, -1.41387939453125, -1.349212646484375, -1.2845458984375, -1.219879150390625, -1.15521240234375, -1.090545654296875, -1.02587890625, -0.961212158203125, -0.89654541015625, -0.831878662109375, -0.7672119140625, -0.702545166015625, -0.63787841796875, -0.573211669921875, -0.508544921875, -0.443878173828125, -0.37921142578125, -0.314544677734375, -0.2498779296875, -0.185211181640625, -0.12054443359375, -0.055877685546875, 0.0087890625, 0.073455810546875, 0.13812255859375, 0.202789306640625, 0.2674560546875, 0.332122802734375, 0.39678955078125, 0.461456298828125, 0.526123046875, 0.590789794921875, 0.65545654296875, 0.720123291015625, 0.7847900390625, 0.849456787109375, 0.91412353515625, 0.978790283203125, 1.04345703125, 1.108123779296875, 1.17279052734375, 1.237457275390625, 1.3021240234375, 1.366790771484375, 1.43145751953125, 1.496124267578125, 1.560791015625, 1.625457763671875, 1.69012451171875, 1.754791259765625, 1.8194580078125, 1.884124755859375, 1.94879150390625, 2.013458251953125, 2.078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 18.0, 31.0, 26.0, 54.0, 57.0, 97.0, 147.0, 205.0, 303.0, 501.0, 868.0, 1592.0, 3809.0, 9981.0, 34224.0, 196820.0, 687042.0, 81041.0, 19613.0, 6410.0, 2627.0, 1236.0, 665.0, 398.0, 227.0, 152.0, 95.0, 68.0, 62.0, 40.0, 23.0, 24.0, 16.0, 8.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.767822265625, -8.50439453125, -8.240966796875, -7.9775390625, -7.714111328125, -7.45068359375, -7.187255859375, -6.923828125, -6.660400390625, -6.39697265625, -6.133544921875, -5.8701171875, -5.606689453125, -5.34326171875, -5.079833984375, -4.81640625, -4.552978515625, -4.28955078125, -4.026123046875, -3.7626953125, -3.499267578125, -3.23583984375, -2.972412109375, -2.708984375, -2.445556640625, -2.18212890625, -1.918701171875, -1.6552734375, -1.391845703125, -1.12841796875, -0.864990234375, -0.6015625, -0.338134765625, -0.07470703125, 0.188720703125, 0.4521484375, 0.715576171875, 0.97900390625, 1.242431640625, 1.505859375, 1.769287109375, 2.03271484375, 2.296142578125, 2.5595703125, 2.822998046875, 3.08642578125, 3.349853515625, 3.61328125, 3.876708984375, 4.14013671875, 4.403564453125, 4.6669921875, 4.930419921875, 5.19384765625, 5.457275390625, 5.720703125, 5.984130859375, 6.24755859375, 6.510986328125, 6.7744140625, 7.037841796875, 7.30126953125, 7.564697265625, 7.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 5.0, 8.0, 6.0, 11.0, 17.0, 23.0, 22.0, 21.0, 29.0, 32.0, 44.0, 62.0, 60.0, 56.0, 52.0, 47.0, 75.0, 69.0, 58.0, 48.0, 45.0, 31.0, 39.0, 35.0, 24.0, 14.0, 21.0, 11.0, 8.0, 13.0, 8.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.7930908203125, -8.453369140625, -8.1136474609375, -7.77392578125, -7.4342041015625, -7.094482421875, -6.7547607421875, -6.4150390625, -6.0753173828125, -5.735595703125, -5.3958740234375, -5.05615234375, -4.7164306640625, -4.376708984375, -4.0369873046875, -3.697265625, -3.3575439453125, -3.017822265625, -2.6781005859375, -2.33837890625, -1.9986572265625, -1.658935546875, -1.3192138671875, -0.9794921875, -0.6397705078125, -0.300048828125, 0.0396728515625, 0.37939453125, 0.7191162109375, 1.058837890625, 1.3985595703125, 1.73828125, 2.0780029296875, 2.417724609375, 2.7574462890625, 3.09716796875, 3.4368896484375, 3.776611328125, 4.1163330078125, 4.4560546875, 4.7957763671875, 5.135498046875, 5.4752197265625, 5.81494140625, 6.1546630859375, 6.494384765625, 6.8341064453125, 7.173828125, 7.5135498046875, 7.853271484375, 8.1929931640625, 8.53271484375, 8.8724365234375, 9.212158203125, 9.5518798828125, 9.8916015625, 10.2313232421875, 10.571044921875, 10.9107666015625, 11.25048828125, 11.5902099609375, 11.929931640625, 12.2696533203125, 12.609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 7.0, 15.0, 26.0, 42.0, 103.0, 163.0, 416.0, 1171.0, 4255.0, 23096.0, 255871.0, 704706.0, 48333.0, 7467.0, 1789.0, 561.0, 244.0, 119.0, 43.0, 38.0, 19.0, 11.0, 15.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.765625, -6.57861328125, -6.3916015625, -6.20458984375, -6.017578125, -5.83056640625, -5.6435546875, -5.45654296875, -5.26953125, -5.08251953125, -4.8955078125, -4.70849609375, -4.521484375, -4.33447265625, -4.1474609375, -3.96044921875, -3.7734375, -3.58642578125, -3.3994140625, -3.21240234375, -3.025390625, -2.83837890625, -2.6513671875, -2.46435546875, -2.27734375, -2.09033203125, -1.9033203125, -1.71630859375, -1.529296875, -1.34228515625, -1.1552734375, -0.96826171875, -0.78125, -0.59423828125, -0.4072265625, -0.22021484375, -0.033203125, 0.15380859375, 0.3408203125, 0.52783203125, 0.71484375, 0.90185546875, 1.0888671875, 1.27587890625, 1.462890625, 1.64990234375, 1.8369140625, 2.02392578125, 2.2109375, 2.39794921875, 2.5849609375, 2.77197265625, 2.958984375, 3.14599609375, 3.3330078125, 3.52001953125, 3.70703125, 3.89404296875, 4.0810546875, 4.26806640625, 4.455078125, 4.64208984375, 4.8291015625, 5.01611328125, 5.203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 17.0, 20.0, 28.0, 29.0, 43.0, 93.0, 220.0, 231.0, 131.0, 66.0, 28.0, 22.0, 27.0, 12.0, 7.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000850677490234375, -0.0007981956005096436, -0.0007457137107849121, -0.0006932318210601807, -0.0006407499313354492, -0.0005882680416107178, -0.0005357861518859863, -0.0004833042621612549, -0.00043082237243652344, -0.000378340482711792, -0.00032585859298706055, -0.0002733767032623291, -0.00022089481353759766, -0.0001684129238128662, -0.00011593103408813477, -6.344914436340332e-05, -1.0967254638671875e-05, 4.151463508605957e-05, 9.399652481079102e-05, 0.00014647841453552246, 0.0001989603042602539, 0.00025144219398498535, 0.0003039240837097168, 0.00035640597343444824, 0.0004088878631591797, 0.00046136975288391113, 0.0005138516426086426, 0.000566333532333374, 0.0006188154220581055, 0.0006712973117828369, 0.0007237792015075684, 0.0007762610912322998, 0.0008287429809570312, 0.0008812248706817627, 0.0009337067604064941, 0.0009861886501312256, 0.001038670539855957, 0.0010911524295806885, 0.00114363431930542, 0.0011961162090301514, 0.0012485980987548828, 0.0013010799884796143, 0.0013535618782043457, 0.0014060437679290771, 0.0014585256576538086, 0.00151100754737854, 0.0015634894371032715, 0.001615971326828003, 0.0016684532165527344, 0.0017209351062774658, 0.0017734169960021973, 0.0018258988857269287, 0.0018783807754516602, 0.0019308626651763916, 0.001983344554901123, 0.0020358264446258545, 0.002088308334350586, 0.0021407902240753174, 0.002193272113800049, 0.0022457540035247803, 0.0022982358932495117, 0.002350717782974243, 0.0024031996726989746, 0.002455681562423706, 0.0025081634521484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 14.0, 25.0, 36.0, 56.0, 108.0, 160.0, 286.0, 536.0, 1217.0, 2912.0, 9421.0, 41700.0, 288685.0, 605147.0, 75599.0, 15224.0, 4254.0, 1551.0, 730.0, 404.0, 189.0, 108.0, 57.0, 40.0, 23.0, 16.0, 12.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.39459228515625, -3.2696533203125, -3.14471435546875, -3.019775390625, -2.89483642578125, -2.7698974609375, -2.64495849609375, -2.52001953125, -2.39508056640625, -2.2701416015625, -2.14520263671875, -2.020263671875, -1.89532470703125, -1.7703857421875, -1.64544677734375, -1.5205078125, -1.39556884765625, -1.2706298828125, -1.14569091796875, -1.020751953125, -0.89581298828125, -0.7708740234375, -0.64593505859375, -0.52099609375, -0.39605712890625, -0.2711181640625, -0.14617919921875, -0.021240234375, 0.10369873046875, 0.2286376953125, 0.35357666015625, 0.478515625, 0.60345458984375, 0.7283935546875, 0.85333251953125, 0.978271484375, 1.10321044921875, 1.2281494140625, 1.35308837890625, 1.47802734375, 1.60296630859375, 1.7279052734375, 1.85284423828125, 1.977783203125, 2.10272216796875, 2.2276611328125, 2.35260009765625, 2.4775390625, 2.60247802734375, 2.7274169921875, 2.85235595703125, 2.977294921875, 3.10223388671875, 3.2271728515625, 3.35211181640625, 3.47705078125, 3.60198974609375, 3.7269287109375, 3.85186767578125, 3.976806640625, 4.10174560546875, 4.2266845703125, 4.35162353515625, 4.4765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 9.0, 18.0, 22.0, 34.0, 27.0, 41.0, 44.0, 70.0, 58.0, 93.0, 89.0, 87.0, 69.0, 63.0, 62.0, 32.0, 22.0, 27.0, 19.0, 18.0, 13.0, 12.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.27734375, -3.175628662109375, -3.07391357421875, -2.972198486328125, -2.8704833984375, -2.768768310546875, -2.66705322265625, -2.565338134765625, -2.463623046875, -2.361907958984375, -2.26019287109375, -2.158477783203125, -2.0567626953125, -1.955047607421875, -1.85333251953125, -1.751617431640625, -1.64990234375, -1.548187255859375, -1.44647216796875, -1.344757080078125, -1.2430419921875, -1.141326904296875, -1.03961181640625, -0.937896728515625, -0.836181640625, -0.734466552734375, -0.63275146484375, -0.531036376953125, -0.4293212890625, -0.327606201171875, -0.22589111328125, -0.124176025390625, -0.0224609375, 0.079254150390625, 0.18096923828125, 0.282684326171875, 0.3843994140625, 0.486114501953125, 0.58782958984375, 0.689544677734375, 0.791259765625, 0.892974853515625, 0.99468994140625, 1.096405029296875, 1.1981201171875, 1.299835205078125, 1.40155029296875, 1.503265380859375, 1.60498046875, 1.706695556640625, 1.80841064453125, 1.910125732421875, 2.0118408203125, 2.113555908203125, 2.21527099609375, 2.316986083984375, 2.418701171875, 2.520416259765625, 2.62213134765625, 2.723846435546875, 2.8255615234375, 2.927276611328125, 3.02899169921875, 3.130706787109375, 3.232421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 18.0, 46.0, 98.0, 178.0, 291.0, 179.0, 107.0, 41.0, 15.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.37437438964844, -106.30702209472656, -103.23966217041016, -100.17230987548828, -97.10494995117188, -94.03759765625, -90.9702377319336, -87.90288543701172, -84.83552551269531, -81.76817321777344, -78.70081329345703, -75.63346099853516, -72.56610107421875, -69.49874877929688, -66.43138885498047, -63.364036560058594, -60.29668045043945, -57.22932434082031, -54.16196823120117, -51.09461212158203, -48.02725601196289, -44.95989990234375, -41.892547607421875, -38.82518768310547, -35.757835388183594, -32.69047927856445, -29.623123168945312, -26.555767059326172, -23.48841094970703, -20.42105484008789, -17.353700637817383, -14.286344528198242, -11.218986511230469, -8.151630401611328, -5.084274768829346, -2.0169191360473633, 1.0504369735717773, 4.117793083190918, 7.185148239135742, 10.252504348754883, 13.319860458374023, 16.387216567993164, 19.454572677612305, 22.521926879882812, 25.589282989501953, 28.656639099121094, 31.723995208740234, 34.791351318359375, 37.858707427978516, 40.926063537597656, 43.9934196472168, 47.06077575683594, 50.12813186645508, 53.19548797607422, 56.262840270996094, 59.3302001953125, 62.397552490234375, 65.46490478515625, 68.53226470947266, 71.59961700439453, 74.66697692871094, 77.73432922363281, 80.80168914794922, 83.8690414428711, 86.9364013671875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 14.0, 18.0, 11.0, 18.0, 14.0, 16.0, 26.0, 26.0, 26.0, 49.0, 39.0, 49.0, 52.0, 63.0, 77.0, 79.0, 72.0, 60.0, 41.0, 54.0, 20.0, 38.0, 25.0, 29.0, 24.0, 21.0, 11.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.405670166015625, -39.97478485107422, -38.54389953613281, -37.113014221191406, -35.68212890625, -34.251243591308594, -32.82035827636719, -31.38947296142578, -29.958587646484375, -28.52770233154297, -27.096817016601562, -25.665931701660156, -24.23504638671875, -22.804161071777344, -21.373275756835938, -19.94239044189453, -18.511505126953125, -17.08061981201172, -15.649734497070312, -14.218849182128906, -12.7879638671875, -11.357078552246094, -9.926193237304688, -8.495307922363281, -7.064422607421875, -5.633537292480469, -4.2026519775390625, -2.7717666625976562, -1.34088134765625, 0.09000396728515625, 1.5208892822265625, 2.9517745971679688, 4.382656097412109, 5.813541412353516, 7.244426727294922, 8.675312042236328, 10.106197357177734, 11.53708267211914, 12.967967987060547, 14.398853302001953, 15.82973861694336, 17.260623931884766, 18.691509246826172, 20.122394561767578, 21.553279876708984, 22.98416519165039, 24.415050506591797, 25.845935821533203, 27.27682113647461, 28.707706451416016, 30.138591766357422, 31.569477081298828, 33.000362396240234, 34.43124771118164, 35.86213302612305, 37.29301834106445, 38.72390365600586, 40.154788970947266, 41.58567428588867, 43.01655960083008, 44.447444915771484, 45.87833023071289, 47.3092155456543, 48.7401008605957, 50.17098617553711]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 12.0, 15.0, 15.0, 36.0, 27.0, 55.0, 75.0, 113.0, 197.0, 270.0, 469.0, 743.0, 1259.0, 2244.0, 4158.0, 7944.0, 15306.0, 32828.0, 75001.0, 208145.0, 746128.0, 1862283.0, 849579.0, 234531.0, 82598.0, 35150.0, 16628.0, 8341.0, 4359.0, 2300.0, 1376.0, 783.0, 441.0, 289.0, 164.0, 134.0, 80.0, 68.0, 30.0, 26.0, 20.0, 12.0, 19.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.375, -2.29180908203125, -2.2086181640625, -2.12542724609375, -2.042236328125, -1.95904541015625, -1.8758544921875, -1.79266357421875, -1.70947265625, -1.62628173828125, -1.5430908203125, -1.45989990234375, -1.376708984375, -1.29351806640625, -1.2103271484375, -1.12713623046875, -1.0439453125, -0.96075439453125, -0.8775634765625, -0.79437255859375, -0.711181640625, -0.62799072265625, -0.5447998046875, -0.46160888671875, -0.37841796875, -0.29522705078125, -0.2120361328125, -0.12884521484375, -0.045654296875, 0.03753662109375, 0.1207275390625, 0.20391845703125, 0.287109375, 0.37030029296875, 0.4534912109375, 0.53668212890625, 0.619873046875, 0.70306396484375, 0.7862548828125, 0.86944580078125, 0.95263671875, 1.03582763671875, 1.1190185546875, 1.20220947265625, 1.285400390625, 1.36859130859375, 1.4517822265625, 1.53497314453125, 1.6181640625, 1.70135498046875, 1.7845458984375, 1.86773681640625, 1.950927734375, 2.03411865234375, 2.1173095703125, 2.20050048828125, 2.28369140625, 2.36688232421875, 2.4500732421875, 2.53326416015625, 2.616455078125, 2.69964599609375, 2.7828369140625, 2.86602783203125, 2.94921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 21.0, 18.0, 31.0, 35.0, 53.0, 50.0, 73.0, 82.0, 89.0, 109.0, 81.0, 68.0, 60.0, 51.0, 46.0, 36.0, 29.0, 20.0, 13.0, 5.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.30181884765625, -2.1934814453125, -2.08514404296875, -1.976806640625, -1.86846923828125, -1.7601318359375, -1.65179443359375, -1.54345703125, -1.43511962890625, -1.3267822265625, -1.21844482421875, -1.110107421875, -1.00177001953125, -0.8934326171875, -0.78509521484375, -0.6767578125, -0.56842041015625, -0.4600830078125, -0.35174560546875, -0.243408203125, -0.13507080078125, -0.0267333984375, 0.08160400390625, 0.18994140625, 0.29827880859375, 0.4066162109375, 0.51495361328125, 0.623291015625, 0.73162841796875, 0.8399658203125, 0.94830322265625, 1.056640625, 1.16497802734375, 1.2733154296875, 1.38165283203125, 1.489990234375, 1.59832763671875, 1.7066650390625, 1.81500244140625, 1.92333984375, 2.03167724609375, 2.1400146484375, 2.24835205078125, 2.356689453125, 2.46502685546875, 2.5733642578125, 2.68170166015625, 2.7900390625, 2.89837646484375, 3.0067138671875, 3.11505126953125, 3.223388671875, 3.33172607421875, 3.4400634765625, 3.54840087890625, 3.65673828125, 3.76507568359375, 3.8734130859375, 3.98175048828125, 4.090087890625, 4.19842529296875, 4.3067626953125, 4.41510009765625, 4.5234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 5.0, 13.0, 8.0, 7.0, 22.0, 61.0, 62.0, 117.0, 209.0, 359.0, 698.0, 1380.0, 3160.0, 7962.0, 24274.0, 91664.0, 527442.0, 2726170.0, 664821.0, 105906.0, 25943.0, 8190.0, 3088.0, 1270.0, 616.0, 293.0, 221.0, 108.0, 64.0, 47.0, 29.0, 20.0, 18.0, 10.0, 8.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.875, -5.7049560546875, -5.534912109375, -5.3648681640625, -5.19482421875, -5.0247802734375, -4.854736328125, -4.6846923828125, -4.5146484375, -4.3446044921875, -4.174560546875, -4.0045166015625, -3.83447265625, -3.6644287109375, -3.494384765625, -3.3243408203125, -3.154296875, -2.9842529296875, -2.814208984375, -2.6441650390625, -2.47412109375, -2.3040771484375, -2.134033203125, -1.9639892578125, -1.7939453125, -1.6239013671875, -1.453857421875, -1.2838134765625, -1.11376953125, -0.9437255859375, -0.773681640625, -0.6036376953125, -0.43359375, -0.2635498046875, -0.093505859375, 0.0765380859375, 0.24658203125, 0.4166259765625, 0.586669921875, 0.7567138671875, 0.9267578125, 1.0968017578125, 1.266845703125, 1.4368896484375, 1.60693359375, 1.7769775390625, 1.947021484375, 2.1170654296875, 2.287109375, 2.4571533203125, 2.627197265625, 2.7972412109375, 2.96728515625, 3.1373291015625, 3.307373046875, 3.4774169921875, 3.6474609375, 3.8175048828125, 3.987548828125, 4.1575927734375, 4.32763671875, 4.4976806640625, 4.667724609375, 4.8377685546875, 5.0078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 12.0, 3.0, 11.0, 17.0, 17.0, 26.0, 35.0, 40.0, 60.0, 81.0, 110.0, 157.0, 224.0, 325.0, 411.0, 577.0, 507.0, 439.0, 266.0, 224.0, 171.0, 83.0, 80.0, 41.0, 38.0, 29.0, 14.0, 17.0, 12.0, 10.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.93829345703125, -5.7515869140625, -5.56488037109375, -5.378173828125, -5.19146728515625, -5.0047607421875, -4.81805419921875, -4.63134765625, -4.44464111328125, -4.2579345703125, -4.07122802734375, -3.884521484375, -3.69781494140625, -3.5111083984375, -3.32440185546875, -3.1376953125, -2.95098876953125, -2.7642822265625, -2.57757568359375, -2.390869140625, -2.20416259765625, -2.0174560546875, -1.83074951171875, -1.64404296875, -1.45733642578125, -1.2706298828125, -1.08392333984375, -0.897216796875, -0.71051025390625, -0.5238037109375, -0.33709716796875, -0.150390625, 0.03631591796875, 0.2230224609375, 0.40972900390625, 0.596435546875, 0.78314208984375, 0.9698486328125, 1.15655517578125, 1.34326171875, 1.52996826171875, 1.7166748046875, 1.90338134765625, 2.090087890625, 2.27679443359375, 2.4635009765625, 2.65020751953125, 2.8369140625, 3.02362060546875, 3.2103271484375, 3.39703369140625, 3.583740234375, 3.77044677734375, 3.9571533203125, 4.14385986328125, 4.33056640625, 4.51727294921875, 4.7039794921875, 4.89068603515625, 5.077392578125, 5.26409912109375, 5.4508056640625, 5.63751220703125, 5.82421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 16.0, 14.0, 54.0, 107.0, 198.0, 212.0, 180.0, 107.0, 51.0, 23.0, 13.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-88.04563903808594, -85.15619659423828, -82.26675415039062, -79.3773193359375, -76.48787689208984, -73.59843444824219, -70.70899200439453, -67.81954956054688, -64.93010711669922, -62.04066467285156, -59.15122604370117, -56.261783599853516, -53.37234115600586, -50.48290252685547, -47.59346008300781, -44.704017639160156, -41.814579010009766, -38.92513656616211, -36.03569793701172, -33.14625549316406, -30.256813049316406, -27.367372512817383, -24.47793197631836, -21.588489532470703, -18.69904899597168, -15.80960750579834, -12.920166015625, -10.030725479125977, -7.141283988952637, -4.251842498779297, -1.3624019622802734, 1.5270404815673828, 4.416481018066406, 7.305922508239746, 10.195363998413086, 13.08480453491211, 15.97424602508545, 18.86368751525879, 21.753128051757812, 24.64257049560547, 27.532011032104492, 30.421451568603516, 33.31089401245117, 36.20033264160156, 39.08977508544922, 41.979217529296875, 44.86865997314453, 47.75810241699219, 50.64754104614258, 53.536983489990234, 56.426422119140625, 59.31586456298828, 62.20530700683594, 65.0947494506836, 67.98419189453125, 70.87362670898438, 73.76306915283203, 76.65251159667969, 79.54195404052734, 82.431396484375, 85.32083129882812, 88.21027374267578, 91.09971618652344, 93.9891586303711, 96.87860107421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 6.0, 8.0, 17.0, 12.0, 25.0, 22.0, 24.0, 19.0, 27.0, 26.0, 44.0, 27.0, 43.0, 38.0, 49.0, 45.0, 48.0, 43.0, 58.0, 52.0, 37.0, 36.0, 28.0, 37.0, 15.0, 21.0, 30.0, 28.0, 20.0, 13.0, 15.0, 11.0, 13.0, 7.0, 18.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.65509033203125, -31.727840423583984, -30.80059051513672, -29.873340606689453, -28.946088790893555, -28.01883888244629, -27.091588973999023, -26.164339065551758, -25.23708724975586, -24.309837341308594, -23.382587432861328, -22.455337524414062, -21.528085708618164, -20.6008358001709, -19.673585891723633, -18.746335983276367, -17.8190860748291, -16.891836166381836, -15.964585304260254, -15.037335395812988, -14.110084533691406, -13.18283462524414, -12.255584716796875, -11.32833480834961, -10.401083946228027, -9.473834037780762, -8.54658317565918, -7.619333267211914, -6.69208288192749, -5.764832496643066, -4.837582588195801, -3.910332202911377, -2.983081817626953, -2.0558314323425293, -1.1285812854766846, -0.20133113861083984, 0.725919246673584, 1.6531696319580078, 2.5804195404052734, 3.5076699256896973, 4.434920310974121, 5.362170696258545, 6.289421081542969, 7.216670989990234, 8.1439208984375, 9.071171760559082, 9.998421669006348, 10.92567253112793, 11.852922439575195, 12.780172348022461, 13.707423210144043, 14.634673118591309, 15.56192398071289, 16.489173889160156, 17.416423797607422, 18.343673706054688, 19.270923614501953, 20.19817352294922, 21.125423431396484, 22.05267333984375, 22.97992515563965, 23.907175064086914, 24.83442497253418, 25.761674880981445, 26.688926696777344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 15.0, 19.0, 26.0, 44.0, 70.0, 84.0, 115.0, 136.0, 248.0, 341.0, 532.0, 774.0, 1346.0, 1988.0, 3350.0, 5462.0, 8953.0, 15286.0, 26157.0, 45825.0, 82787.0, 166069.0, 289536.0, 187738.0, 91060.0, 49892.0, 28729.0, 16610.0, 9688.0, 5890.0, 3479.0, 2219.0, 1342.0, 871.0, 592.0, 387.0, 261.0, 176.0, 119.0, 91.0, 66.0, 37.0, 27.0, 23.0, 19.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.583984375, -3.470489501953125, -3.35699462890625, -3.243499755859375, -3.1300048828125, -3.016510009765625, -2.90301513671875, -2.789520263671875, -2.676025390625, -2.562530517578125, -2.44903564453125, -2.335540771484375, -2.2220458984375, -2.108551025390625, -1.99505615234375, -1.881561279296875, -1.76806640625, -1.654571533203125, -1.54107666015625, -1.427581787109375, -1.3140869140625, -1.200592041015625, -1.08709716796875, -0.973602294921875, -0.860107421875, -0.746612548828125, -0.63311767578125, -0.519622802734375, -0.4061279296875, -0.292633056640625, -0.17913818359375, -0.065643310546875, 0.0478515625, 0.161346435546875, 0.27484130859375, 0.388336181640625, 0.5018310546875, 0.615325927734375, 0.72882080078125, 0.842315673828125, 0.955810546875, 1.069305419921875, 1.18280029296875, 1.296295166015625, 1.4097900390625, 1.523284912109375, 1.63677978515625, 1.750274658203125, 1.86376953125, 1.977264404296875, 2.09075927734375, 2.204254150390625, 2.3177490234375, 2.431243896484375, 2.54473876953125, 2.658233642578125, 2.771728515625, 2.885223388671875, 2.99871826171875, 3.112213134765625, 3.2257080078125, 3.339202880859375, 3.45269775390625, 3.566192626953125, 3.6796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 7.0, 2.0, 0.0, 10.0, 10.0, 16.0, 7.0, 13.0, 11.0, 11.0, 19.0, 23.0, 26.0, 32.0, 27.0, 40.0, 33.0, 20.0, 40.0, 41.0, 47.0, 49.0, 44.0, 35.0, 41.0, 41.0, 39.0, 34.0, 33.0, 36.0, 40.0, 27.0, 15.0, 29.0, 21.0, 6.0, 9.0, 13.0, 7.0, 7.0, 10.0, 6.0, 4.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.596893310546875, -1.54046630859375, -1.484039306640625, -1.4276123046875, -1.371185302734375, -1.31475830078125, -1.258331298828125, -1.201904296875, -1.145477294921875, -1.08905029296875, -1.032623291015625, -0.9761962890625, -0.919769287109375, -0.86334228515625, -0.806915283203125, -0.75048828125, -0.694061279296875, -0.63763427734375, -0.581207275390625, -0.5247802734375, -0.468353271484375, -0.41192626953125, -0.355499267578125, -0.299072265625, -0.242645263671875, -0.18621826171875, -0.129791259765625, -0.0733642578125, -0.016937255859375, 0.03948974609375, 0.095916748046875, 0.15234375, 0.208770751953125, 0.26519775390625, 0.321624755859375, 0.3780517578125, 0.434478759765625, 0.49090576171875, 0.547332763671875, 0.603759765625, 0.660186767578125, 0.71661376953125, 0.773040771484375, 0.8294677734375, 0.885894775390625, 0.94232177734375, 0.998748779296875, 1.05517578125, 1.111602783203125, 1.16802978515625, 1.224456787109375, 1.2808837890625, 1.337310791015625, 1.39373779296875, 1.450164794921875, 1.506591796875, 1.563018798828125, 1.61944580078125, 1.675872802734375, 1.7322998046875, 1.788726806640625, 1.84515380859375, 1.901580810546875, 1.9580078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 18.0, 10.0, 21.0, 23.0, 35.0, 43.0, 60.0, 109.0, 104.0, 154.0, 241.0, 327.0, 443.0, 737.0, 1199.0, 1931.0, 3968.0, 10495.0, 38369.0, 215093.0, 660645.0, 82799.0, 18854.0, 6046.0, 2631.0, 1519.0, 852.0, 570.0, 366.0, 250.0, 184.0, 119.0, 102.0, 61.0, 48.0, 36.0, 24.0, 17.0, 15.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.6646728515625, -8.368408203125, -8.0721435546875, -7.77587890625, -7.4796142578125, -7.183349609375, -6.8870849609375, -6.5908203125, -6.2945556640625, -5.998291015625, -5.7020263671875, -5.40576171875, -5.1094970703125, -4.813232421875, -4.5169677734375, -4.220703125, -3.9244384765625, -3.628173828125, -3.3319091796875, -3.03564453125, -2.7393798828125, -2.443115234375, -2.1468505859375, -1.8505859375, -1.5543212890625, -1.258056640625, -0.9617919921875, -0.66552734375, -0.3692626953125, -0.072998046875, 0.2232666015625, 0.51953125, 0.8157958984375, 1.112060546875, 1.4083251953125, 1.70458984375, 2.0008544921875, 2.297119140625, 2.5933837890625, 2.8896484375, 3.1859130859375, 3.482177734375, 3.7784423828125, 4.07470703125, 4.3709716796875, 4.667236328125, 4.9635009765625, 5.259765625, 5.5560302734375, 5.852294921875, 6.1485595703125, 6.44482421875, 6.7410888671875, 7.037353515625, 7.3336181640625, 7.6298828125, 7.9261474609375, 8.222412109375, 8.5186767578125, 8.81494140625, 9.1112060546875, 9.407470703125, 9.7037353515625, 10.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 11.0, 12.0, 15.0, 19.0, 13.0, 33.0, 44.0, 34.0, 27.0, 46.0, 30.0, 58.0, 59.0, 49.0, 57.0, 62.0, 51.0, 51.0, 44.0, 37.0, 35.0, 30.0, 27.0, 23.0, 20.0, 18.0, 16.0, 10.0, 12.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.710205078125, -8.40478515625, -8.099365234375, -7.7939453125, -7.488525390625, -7.18310546875, -6.877685546875, -6.572265625, -6.266845703125, -5.96142578125, -5.656005859375, -5.3505859375, -5.045166015625, -4.73974609375, -4.434326171875, -4.12890625, -3.823486328125, -3.51806640625, -3.212646484375, -2.9072265625, -2.601806640625, -2.29638671875, -1.990966796875, -1.685546875, -1.380126953125, -1.07470703125, -0.769287109375, -0.4638671875, -0.158447265625, 0.14697265625, 0.452392578125, 0.7578125, 1.063232421875, 1.36865234375, 1.674072265625, 1.9794921875, 2.284912109375, 2.59033203125, 2.895751953125, 3.201171875, 3.506591796875, 3.81201171875, 4.117431640625, 4.4228515625, 4.728271484375, 5.03369140625, 5.339111328125, 5.64453125, 5.949951171875, 6.25537109375, 6.560791015625, 6.8662109375, 7.171630859375, 7.47705078125, 7.782470703125, 8.087890625, 8.393310546875, 8.69873046875, 9.004150390625, 9.3095703125, 9.614990234375, 9.92041015625, 10.225830078125, 10.53125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 8.0, 10.0, 17.0, 25.0, 38.0, 58.0, 85.0, 155.0, 242.0, 370.0, 778.0, 1523.0, 3387.0, 8966.0, 27615.0, 96247.0, 577506.0, 243538.0, 59312.0, 17811.0, 5887.0, 2366.0, 1151.0, 592.0, 333.0, 193.0, 113.0, 78.0, 52.0, 25.0, 19.0, 12.0, 15.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.955078125, -3.844635009765625, -3.73419189453125, -3.623748779296875, -3.5133056640625, -3.402862548828125, -3.29241943359375, -3.181976318359375, -3.071533203125, -2.961090087890625, -2.85064697265625, -2.740203857421875, -2.6297607421875, -2.519317626953125, -2.40887451171875, -2.298431396484375, -2.18798828125, -2.077545166015625, -1.96710205078125, -1.856658935546875, -1.7462158203125, -1.635772705078125, -1.52532958984375, -1.414886474609375, -1.304443359375, -1.194000244140625, -1.08355712890625, -0.973114013671875, -0.8626708984375, -0.752227783203125, -0.64178466796875, -0.531341552734375, -0.4208984375, -0.310455322265625, -0.20001220703125, -0.089569091796875, 0.0208740234375, 0.131317138671875, 0.24176025390625, 0.352203369140625, 0.462646484375, 0.573089599609375, 0.68353271484375, 0.793975830078125, 0.9044189453125, 1.014862060546875, 1.12530517578125, 1.235748291015625, 1.34619140625, 1.456634521484375, 1.56707763671875, 1.677520751953125, 1.7879638671875, 1.898406982421875, 2.00885009765625, 2.119293212890625, 2.229736328125, 2.340179443359375, 2.45062255859375, 2.561065673828125, 2.6715087890625, 2.781951904296875, 2.89239501953125, 3.002838134765625, 3.11328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 4.0, 11.0, 4.0, 4.0, 9.0, 9.0, 12.0, 14.0, 16.0, 17.0, 21.0, 30.0, 37.0, 43.0, 57.0, 84.0, 101.0, 117.0, 81.0, 51.0, 51.0, 23.0, 36.0, 23.0, 24.0, 13.0, 14.0, 11.0, 13.0, 11.0, 8.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010080337524414062, -0.0009756982326507568, -0.0009433627128601074, -0.000911027193069458, -0.0008786916732788086, -0.0008463561534881592, -0.0008140206336975098, -0.0007816851139068604, -0.0007493495941162109, -0.0007170140743255615, -0.0006846785545349121, -0.0006523430347442627, -0.0006200075149536133, -0.0005876719951629639, -0.0005553364753723145, -0.000523000955581665, -0.0004906654357910156, -0.0004583299160003662, -0.0004259943962097168, -0.0003936588764190674, -0.00036132335662841797, -0.00032898783683776855, -0.00029665231704711914, -0.0002643167972564697, -0.0002319812774658203, -0.0001996457576751709, -0.00016731023788452148, -0.00013497471809387207, -0.00010263919830322266, -7.030367851257324e-05, -3.796815872192383e-05, -5.632638931274414e-06, 2.6702880859375e-05, 5.9038400650024414e-05, 9.137392044067383e-05, 0.00012370944023132324, 0.00015604496002197266, 0.00018838047981262207, 0.00022071599960327148, 0.0002530515193939209, 0.0002853870391845703, 0.0003177225589752197, 0.00035005807876586914, 0.00038239359855651855, 0.00041472911834716797, 0.0004470646381378174, 0.0004794001579284668, 0.0005117356777191162, 0.0005440711975097656, 0.000576406717300415, 0.0006087422370910645, 0.0006410777568817139, 0.0006734132766723633, 0.0007057487964630127, 0.0007380843162536621, 0.0007704198360443115, 0.0008027553558349609, 0.0008350908756256104, 0.0008674263954162598, 0.0008997619152069092, 0.0009320974349975586, 0.000964432954788208, 0.0009967684745788574, 0.0010291039943695068, 0.0010614395141601562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 5.0, 18.0, 14.0, 20.0, 34.0, 41.0, 76.0, 107.0, 174.0, 263.0, 451.0, 796.0, 1450.0, 3172.0, 8386.0, 31141.0, 155257.0, 674087.0, 131655.0, 27472.0, 7559.0, 3006.0, 1416.0, 714.0, 443.0, 276.0, 180.0, 117.0, 84.0, 45.0, 29.0, 20.0, 11.0, 7.0, 10.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.07318115234375, -3.9549560546875, -3.83673095703125, -3.718505859375, -3.60028076171875, -3.4820556640625, -3.36383056640625, -3.24560546875, -3.12738037109375, -3.0091552734375, -2.89093017578125, -2.772705078125, -2.65447998046875, -2.5362548828125, -2.41802978515625, -2.2998046875, -2.18157958984375, -2.0633544921875, -1.94512939453125, -1.826904296875, -1.70867919921875, -1.5904541015625, -1.47222900390625, -1.35400390625, -1.23577880859375, -1.1175537109375, -0.99932861328125, -0.881103515625, -0.76287841796875, -0.6446533203125, -0.52642822265625, -0.408203125, -0.28997802734375, -0.1717529296875, -0.05352783203125, 0.064697265625, 0.18292236328125, 0.3011474609375, 0.41937255859375, 0.53759765625, 0.65582275390625, 0.7740478515625, 0.89227294921875, 1.010498046875, 1.12872314453125, 1.2469482421875, 1.36517333984375, 1.4833984375, 1.60162353515625, 1.7198486328125, 1.83807373046875, 1.956298828125, 2.07452392578125, 2.1927490234375, 2.31097412109375, 2.42919921875, 2.54742431640625, 2.6656494140625, 2.78387451171875, 2.902099609375, 3.02032470703125, 3.1385498046875, 3.25677490234375, 3.375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 13.0, 16.0, 12.0, 19.0, 25.0, 34.0, 35.0, 54.0, 57.0, 59.0, 70.0, 104.0, 82.0, 58.0, 70.0, 50.0, 38.0, 37.0, 32.0, 23.0, 18.0, 14.0, 9.0, 12.0, 7.0, 8.0, 9.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.886962890625, -2.77001953125, -2.653076171875, -2.5361328125, -2.419189453125, -2.30224609375, -2.185302734375, -2.068359375, -1.951416015625, -1.83447265625, -1.717529296875, -1.6005859375, -1.483642578125, -1.36669921875, -1.249755859375, -1.1328125, -1.015869140625, -0.89892578125, -0.781982421875, -0.6650390625, -0.548095703125, -0.43115234375, -0.314208984375, -0.197265625, -0.080322265625, 0.03662109375, 0.153564453125, 0.2705078125, 0.387451171875, 0.50439453125, 0.621337890625, 0.73828125, 0.855224609375, 0.97216796875, 1.089111328125, 1.2060546875, 1.322998046875, 1.43994140625, 1.556884765625, 1.673828125, 1.790771484375, 1.90771484375, 2.024658203125, 2.1416015625, 2.258544921875, 2.37548828125, 2.492431640625, 2.609375, 2.726318359375, 2.84326171875, 2.960205078125, 3.0771484375, 3.194091796875, 3.31103515625, 3.427978515625, 3.544921875, 3.661865234375, 3.77880859375, 3.895751953125, 4.0126953125, 4.129638671875, 4.24658203125, 4.363525390625, 4.48046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 27.0, 37.0, 62.0, 89.0, 149.0, 248.0, 179.0, 85.0, 50.0, 21.0, 16.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.04973602294922, -105.3194808959961, -102.58921813964844, -99.85896301269531, -97.12870788574219, -94.39845275878906, -91.66819763183594, -88.93793487548828, -86.20767974853516, -83.47742462158203, -80.74716186523438, -78.01690673828125, -75.28665161132812, -72.556396484375, -69.82614135742188, -67.09587860107422, -64.3656234741211, -61.63536834716797, -58.90510940551758, -56.17485046386719, -53.44459533691406, -50.71434020996094, -47.98408126831055, -45.253822326660156, -42.52356719970703, -39.793312072753906, -37.063053131103516, -34.332794189453125, -31.6025390625, -28.872282028198242, -26.142024993896484, -23.411767959594727, -20.681503295898438, -17.95124626159668, -15.220989227294922, -12.490732192993164, -9.760475158691406, -7.030218124389648, -4.299961090087891, -1.5697040557861328, 1.160552978515625, 3.890810012817383, 6.621067047119141, 9.351324081420898, 12.081581115722656, 14.811838150024414, 17.542095184326172, 20.27235221862793, 23.002609252929688, 25.732866287231445, 28.463123321533203, 31.19338035583496, 33.92363739013672, 36.653892517089844, 39.384151458740234, 42.114410400390625, 44.84466552734375, 47.574920654296875, 50.305179595947266, 53.035438537597656, 55.76569366455078, 58.495948791503906, 61.2262077331543, 63.95646667480469, 66.68672180175781]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 11.0, 4.0, 10.0, 8.0, 15.0, 16.0, 14.0, 22.0, 24.0, 23.0, 32.0, 31.0, 38.0, 32.0, 41.0, 52.0, 83.0, 83.0, 70.0, 49.0, 42.0, 34.0, 35.0, 37.0, 32.0, 19.0, 24.0, 19.0, 25.0, 18.0, 12.0, 12.0, 11.0, 7.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.337371826171875, -44.09278106689453, -42.84818649291992, -41.60359573364258, -40.35900115966797, -39.114410400390625, -37.869815826416016, -36.62522506713867, -35.38063049316406, -34.13603973388672, -32.89144515991211, -31.646852493286133, -30.402259826660156, -29.157669067382812, -27.913076400756836, -26.66848373413086, -25.423892974853516, -24.17930030822754, -22.934707641601562, -21.690114974975586, -20.44552230834961, -19.200931549072266, -17.95633888244629, -16.711746215820312, -15.467153549194336, -14.22256088256836, -12.977968215942383, -11.733376502990723, -10.488783836364746, -9.24419116973877, -7.999598979949951, -6.755006790161133, -5.510414123535156, -4.26582145690918, -3.0212292671203613, -1.7766368389129639, -0.5320444107055664, 0.7125482559204102, 1.9571404457092285, 3.201732635498047, 4.446325302124023, 5.69091796875, 6.935510158538818, 8.180102348327637, 9.424695014953613, 10.66928768157959, 11.91387939453125, 13.158472061157227, 14.403064727783203, 15.64765739440918, 16.892250061035156, 18.136842727661133, 19.38143539428711, 20.626026153564453, 21.87061882019043, 23.115211486816406, 24.359804153442383, 25.60439682006836, 26.848989486694336, 28.093582153320312, 29.338172912597656, 30.582767486572266, 31.82735824584961, 33.07195281982422, 34.31654357910156]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 8.0, 18.0, 24.0, 30.0, 46.0, 78.0, 121.0, 168.0, 308.0, 613.0, 1076.0, 2081.0, 4190.0, 8619.0, 19775.0, 50629.0, 151727.0, 616475.0, 2034945.0, 965451.0, 222083.0, 68878.0, 25837.0, 11003.0, 4969.0, 2398.0, 1225.0, 671.0, 335.0, 193.0, 129.0, 61.0, 39.0, 22.0, 17.0, 13.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.8114013671875, -2.716552734375, -2.6217041015625, -2.52685546875, -2.4320068359375, -2.337158203125, -2.2423095703125, -2.1474609375, -2.0526123046875, -1.957763671875, -1.8629150390625, -1.76806640625, -1.6732177734375, -1.578369140625, -1.4835205078125, -1.388671875, -1.2938232421875, -1.198974609375, -1.1041259765625, -1.00927734375, -0.9144287109375, -0.819580078125, -0.7247314453125, -0.6298828125, -0.5350341796875, -0.440185546875, -0.3453369140625, -0.25048828125, -0.1556396484375, -0.060791015625, 0.0340576171875, 0.12890625, 0.2237548828125, 0.318603515625, 0.4134521484375, 0.50830078125, 0.6031494140625, 0.697998046875, 0.7928466796875, 0.8876953125, 0.9825439453125, 1.077392578125, 1.1722412109375, 1.26708984375, 1.3619384765625, 1.456787109375, 1.5516357421875, 1.646484375, 1.7413330078125, 1.836181640625, 1.9310302734375, 2.02587890625, 2.1207275390625, 2.215576171875, 2.3104248046875, 2.4052734375, 2.5001220703125, 2.594970703125, 2.6898193359375, 2.78466796875, 2.8795166015625, 2.974365234375, 3.0692138671875, 3.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 4.0, 7.0, 15.0, 12.0, 13.0, 37.0, 30.0, 45.0, 46.0, 52.0, 58.0, 51.0, 64.0, 67.0, 69.0, 72.0, 65.0, 47.0, 53.0, 41.0, 37.0, 21.0, 16.0, 18.0, 12.0, 20.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.99078369140625, -2.8995361328125, -2.80828857421875, -2.717041015625, -2.62579345703125, -2.5345458984375, -2.44329833984375, -2.35205078125, -2.26080322265625, -2.1695556640625, -2.07830810546875, -1.987060546875, -1.89581298828125, -1.8045654296875, -1.71331787109375, -1.6220703125, -1.53082275390625, -1.4395751953125, -1.34832763671875, -1.257080078125, -1.16583251953125, -1.0745849609375, -0.98333740234375, -0.89208984375, -0.80084228515625, -0.7095947265625, -0.61834716796875, -0.527099609375, -0.43585205078125, -0.3446044921875, -0.25335693359375, -0.162109375, -0.07086181640625, 0.0203857421875, 0.11163330078125, 0.202880859375, 0.29412841796875, 0.3853759765625, 0.47662353515625, 0.56787109375, 0.65911865234375, 0.7503662109375, 0.84161376953125, 0.932861328125, 1.02410888671875, 1.1153564453125, 1.20660400390625, 1.2978515625, 1.38909912109375, 1.4803466796875, 1.57159423828125, 1.662841796875, 1.75408935546875, 1.8453369140625, 1.93658447265625, 2.02783203125, 2.11907958984375, 2.2103271484375, 2.30157470703125, 2.392822265625, 2.48406982421875, 2.5753173828125, 2.66656494140625, 2.7578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 26.0, 48.0, 57.0, 157.0, 304.0, 734.0, 2117.0, 8906.0, 55252.0, 702516.0, 3131792.0, 252305.0, 30516.0, 6116.0, 1884.0, 693.0, 347.0, 209.0, 109.0, 77.0, 39.0, 25.0, 17.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.50567626953125, -7.2496337890625, -6.99359130859375, -6.737548828125, -6.48150634765625, -6.2254638671875, -5.96942138671875, -5.71337890625, -5.45733642578125, -5.2012939453125, -4.94525146484375, -4.689208984375, -4.43316650390625, -4.1771240234375, -3.92108154296875, -3.6650390625, -3.40899658203125, -3.1529541015625, -2.89691162109375, -2.640869140625, -2.38482666015625, -2.1287841796875, -1.87274169921875, -1.61669921875, -1.36065673828125, -1.1046142578125, -0.84857177734375, -0.592529296875, -0.33648681640625, -0.0804443359375, 0.17559814453125, 0.431640625, 0.68768310546875, 0.9437255859375, 1.19976806640625, 1.455810546875, 1.71185302734375, 1.9678955078125, 2.22393798828125, 2.47998046875, 2.73602294921875, 2.9920654296875, 3.24810791015625, 3.504150390625, 3.76019287109375, 4.0162353515625, 4.27227783203125, 4.5283203125, 4.78436279296875, 5.0404052734375, 5.29644775390625, 5.552490234375, 5.80853271484375, 6.0645751953125, 6.32061767578125, 6.57666015625, 6.83270263671875, 7.0887451171875, 7.34478759765625, 7.600830078125, 7.85687255859375, 8.1129150390625, 8.36895751953125, 8.625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 16.0, 17.0, 44.0, 40.0, 67.0, 122.0, 165.0, 229.0, 413.0, 578.0, 667.0, 559.0, 373.0, 235.0, 186.0, 92.0, 77.0, 51.0, 35.0, 25.0, 24.0, 8.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.7803955078125, -4.545166015625, -4.3099365234375, -4.07470703125, -3.8394775390625, -3.604248046875, -3.3690185546875, -3.1337890625, -2.8985595703125, -2.663330078125, -2.4281005859375, -2.19287109375, -1.9576416015625, -1.722412109375, -1.4871826171875, -1.251953125, -1.0167236328125, -0.781494140625, -0.5462646484375, -0.31103515625, -0.0758056640625, 0.159423828125, 0.3946533203125, 0.6298828125, 0.8651123046875, 1.100341796875, 1.3355712890625, 1.57080078125, 1.8060302734375, 2.041259765625, 2.2764892578125, 2.51171875, 2.7469482421875, 2.982177734375, 3.2174072265625, 3.45263671875, 3.6878662109375, 3.923095703125, 4.1583251953125, 4.3935546875, 4.6287841796875, 4.864013671875, 5.0992431640625, 5.33447265625, 5.5697021484375, 5.804931640625, 6.0401611328125, 6.275390625, 6.5106201171875, 6.745849609375, 6.9810791015625, 7.21630859375, 7.4515380859375, 7.686767578125, 7.9219970703125, 8.1572265625, 8.3924560546875, 8.627685546875, 8.8629150390625, 9.09814453125, 9.3333740234375, 9.568603515625, 9.8038330078125, 10.0390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 16.0, 27.0, 53.0, 74.0, 125.0, 132.0, 174.0, 134.0, 97.0, 62.0, 34.0, 10.0, 15.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.03895568847656, -31.859479904174805, -29.680004119873047, -27.500526428222656, -25.32105255126953, -23.14157485961914, -20.962099075317383, -18.782623291015625, -16.603147506713867, -14.42367172241211, -12.244195938110352, -10.064719200134277, -7.8852434158325195, -5.705767631530762, -3.5262908935546875, -1.3468151092529297, 0.8326606750488281, 3.012136697769165, 5.191612720489502, 7.371088981628418, 9.550564765930176, 11.730040550231934, 13.909517288208008, 16.088993072509766, 18.268468856811523, 20.44794464111328, 22.62742042541504, 24.806896209716797, 26.986373901367188, 29.165847778320312, 31.345325469970703, 33.524803161621094, 35.70427703857422, 37.88375473022461, 40.063228607177734, 42.242706298828125, 44.42218017578125, 46.60165786743164, 48.78113555908203, 50.960609436035156, 53.14008331298828, 55.31956100463867, 57.4990348815918, 59.67851257324219, 61.85798645019531, 64.03746032714844, 66.2169418334961, 68.39641571044922, 70.57589721679688, 72.75537109375, 74.93485260009766, 77.11432647705078, 79.2938003540039, 81.47327423095703, 83.65275573730469, 85.83222961425781, 88.01170349121094, 90.19117736816406, 92.37065887451172, 94.55013275146484, 96.72960662841797, 98.9090805053711, 101.08856201171875, 103.26803588867188, 105.447509765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 7.0, 8.0, 12.0, 27.0, 15.0, 26.0, 31.0, 30.0, 34.0, 51.0, 54.0, 33.0, 50.0, 41.0, 45.0, 47.0, 49.0, 45.0, 46.0, 33.0, 43.0, 32.0, 36.0, 38.0, 29.0, 21.0, 15.0, 9.0, 18.0, 16.0, 13.0, 7.0, 8.0, 5.0, 10.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-42.47863006591797, -41.298622131347656, -40.118614196777344, -38.93860626220703, -37.75859832763672, -36.578590393066406, -35.398582458496094, -34.21857452392578, -33.03856658935547, -31.858558654785156, -30.678550720214844, -29.49854278564453, -28.31853485107422, -27.138526916503906, -25.95851707458496, -24.77850914001465, -23.598499298095703, -22.41849136352539, -21.238483428955078, -20.058475494384766, -18.878467559814453, -17.69845962524414, -16.518449783325195, -15.338441848754883, -14.15843391418457, -12.978425979614258, -11.798418045043945, -10.618409156799316, -9.438401222229004, -8.258393287658691, -7.078384876251221, -5.89837646484375, -4.718372344970703, -3.5383641719818115, -2.35835599899292, -1.1783478260040283, 0.0016603469848632812, 1.1816682815551758, 2.3616766929626465, 3.541685104370117, 4.72169303894043, 5.901700973510742, 7.081709384918213, 8.261717796325684, 9.441725730895996, 10.621733665466309, 11.801742553710938, 12.98175048828125, 14.161758422851562, 15.341766357421875, 16.521774291992188, 17.7017822265625, 18.881790161132812, 20.061798095703125, 21.24180793762207, 22.421815872192383, 23.601823806762695, 24.781831741333008, 25.96183967590332, 27.141847610473633, 28.321857452392578, 29.50186538696289, 30.681873321533203, 31.861881256103516, 33.04188919067383]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 11.0, 11.0, 15.0, 29.0, 35.0, 39.0, 79.0, 121.0, 184.0, 283.0, 406.0, 601.0, 1029.0, 1672.0, 2683.0, 4747.0, 8503.0, 16928.0, 35158.0, 82822.0, 239504.0, 383029.0, 156662.0, 58266.0, 25890.0, 13044.0, 6960.0, 3800.0, 2287.0, 1343.0, 849.0, 552.0, 337.0, 223.0, 162.0, 89.0, 62.0, 39.0, 36.0, 17.0, 12.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.72265625, -4.57647705078125, -4.4302978515625, -4.28411865234375, -4.137939453125, -3.99176025390625, -3.8455810546875, -3.69940185546875, -3.55322265625, -3.40704345703125, -3.2608642578125, -3.11468505859375, -2.968505859375, -2.82232666015625, -2.6761474609375, -2.52996826171875, -2.3837890625, -2.23760986328125, -2.0914306640625, -1.94525146484375, -1.799072265625, -1.65289306640625, -1.5067138671875, -1.36053466796875, -1.21435546875, -1.06817626953125, -0.9219970703125, -0.77581787109375, -0.629638671875, -0.48345947265625, -0.3372802734375, -0.19110107421875, -0.044921875, 0.10125732421875, 0.2474365234375, 0.39361572265625, 0.539794921875, 0.68597412109375, 0.8321533203125, 0.97833251953125, 1.12451171875, 1.27069091796875, 1.4168701171875, 1.56304931640625, 1.709228515625, 1.85540771484375, 2.0015869140625, 2.14776611328125, 2.2939453125, 2.44012451171875, 2.5863037109375, 2.73248291015625, 2.878662109375, 3.02484130859375, 3.1710205078125, 3.31719970703125, 3.46337890625, 3.60955810546875, 3.7557373046875, 3.90191650390625, 4.048095703125, 4.19427490234375, 4.3404541015625, 4.48663330078125, 4.6328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 11.0, 8.0, 13.0, 19.0, 12.0, 24.0, 25.0, 27.0, 26.0, 49.0, 38.0, 53.0, 43.0, 36.0, 51.0, 53.0, 46.0, 46.0, 56.0, 61.0, 44.0, 34.0, 40.0, 35.0, 17.0, 25.0, 17.0, 20.0, 9.0, 10.0, 9.0, 10.0, 5.0, 4.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 2.0], "bins": [-2.904296875, -2.82928466796875, -2.7542724609375, -2.67926025390625, -2.604248046875, -2.52923583984375, -2.4542236328125, -2.37921142578125, -2.30419921875, -2.22918701171875, -2.1541748046875, -2.07916259765625, -2.004150390625, -1.92913818359375, -1.8541259765625, -1.77911376953125, -1.7041015625, -1.62908935546875, -1.5540771484375, -1.47906494140625, -1.404052734375, -1.32904052734375, -1.2540283203125, -1.17901611328125, -1.10400390625, -1.02899169921875, -0.9539794921875, -0.87896728515625, -0.803955078125, -0.72894287109375, -0.6539306640625, -0.57891845703125, -0.50390625, -0.42889404296875, -0.3538818359375, -0.27886962890625, -0.203857421875, -0.12884521484375, -0.0538330078125, 0.02117919921875, 0.09619140625, 0.17120361328125, 0.2462158203125, 0.32122802734375, 0.396240234375, 0.47125244140625, 0.5462646484375, 0.62127685546875, 0.6962890625, 0.77130126953125, 0.8463134765625, 0.92132568359375, 0.996337890625, 1.07135009765625, 1.1463623046875, 1.22137451171875, 1.29638671875, 1.37139892578125, 1.4464111328125, 1.52142333984375, 1.596435546875, 1.67144775390625, 1.7464599609375, 1.82147216796875, 1.896484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 10.0, 10.0, 7.0, 16.0, 27.0, 41.0, 47.0, 67.0, 81.0, 109.0, 140.0, 236.0, 358.0, 495.0, 878.0, 1588.0, 3382.0, 8582.0, 26607.0, 124691.0, 705523.0, 131297.0, 27611.0, 8891.0, 3583.0, 1661.0, 915.0, 537.0, 341.0, 234.0, 156.0, 119.0, 85.0, 51.0, 46.0, 30.0, 23.0, 16.0, 16.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.796875, -7.5234375, -7.25, -6.9765625, -6.703125, -6.4296875, -6.15625, -5.8828125, -5.609375, -5.3359375, -5.0625, -4.7890625, -4.515625, -4.2421875, -3.96875, -3.6953125, -3.421875, -3.1484375, -2.875, -2.6015625, -2.328125, -2.0546875, -1.78125, -1.5078125, -1.234375, -0.9609375, -0.6875, -0.4140625, -0.140625, 0.1328125, 0.40625, 0.6796875, 0.953125, 1.2265625, 1.5, 1.7734375, 2.046875, 2.3203125, 2.59375, 2.8671875, 3.140625, 3.4140625, 3.6875, 3.9609375, 4.234375, 4.5078125, 4.78125, 5.0546875, 5.328125, 5.6015625, 5.875, 6.1484375, 6.421875, 6.6953125, 6.96875, 7.2421875, 7.515625, 7.7890625, 8.0625, 8.3359375, 8.609375, 8.8828125, 9.15625, 9.4296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 11.0, 11.0, 19.0, 29.0, 20.0, 34.0, 35.0, 32.0, 40.0, 53.0, 50.0, 58.0, 41.0, 59.0, 64.0, 49.0, 57.0, 44.0, 39.0, 39.0, 31.0, 36.0, 18.0, 28.0, 23.0, 18.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.328857421875, -8.99365234375, -8.658447265625, -8.3232421875, -7.988037109375, -7.65283203125, -7.317626953125, -6.982421875, -6.647216796875, -6.31201171875, -5.976806640625, -5.6416015625, -5.306396484375, -4.97119140625, -4.635986328125, -4.30078125, -3.965576171875, -3.63037109375, -3.295166015625, -2.9599609375, -2.624755859375, -2.28955078125, -1.954345703125, -1.619140625, -1.283935546875, -0.94873046875, -0.613525390625, -0.2783203125, 0.056884765625, 0.39208984375, 0.727294921875, 1.0625, 1.397705078125, 1.73291015625, 2.068115234375, 2.4033203125, 2.738525390625, 3.07373046875, 3.408935546875, 3.744140625, 4.079345703125, 4.41455078125, 4.749755859375, 5.0849609375, 5.420166015625, 5.75537109375, 6.090576171875, 6.42578125, 6.760986328125, 7.09619140625, 7.431396484375, 7.7666015625, 8.101806640625, 8.43701171875, 8.772216796875, 9.107421875, 9.442626953125, 9.77783203125, 10.113037109375, 10.4482421875, 10.783447265625, 11.11865234375, 11.453857421875, 11.7890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 6.0, 5.0, 15.0, 8.0, 20.0, 30.0, 34.0, 61.0, 82.0, 116.0, 207.0, 337.0, 606.0, 1210.0, 2510.0, 6351.0, 18461.0, 57999.0, 246656.0, 573589.0, 95750.0, 28075.0, 9488.0, 3665.0, 1427.0, 771.0, 381.0, 229.0, 118.0, 107.0, 70.0, 54.0, 26.0, 22.0, 17.0, 9.0, 16.0, 4.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.46875, -3.37017822265625, -3.2716064453125, -3.17303466796875, -3.074462890625, -2.97589111328125, -2.8773193359375, -2.77874755859375, -2.68017578125, -2.58160400390625, -2.4830322265625, -2.38446044921875, -2.285888671875, -2.18731689453125, -2.0887451171875, -1.99017333984375, -1.8916015625, -1.79302978515625, -1.6944580078125, -1.59588623046875, -1.497314453125, -1.39874267578125, -1.3001708984375, -1.20159912109375, -1.10302734375, -1.00445556640625, -0.9058837890625, -0.80731201171875, -0.708740234375, -0.61016845703125, -0.5115966796875, -0.41302490234375, -0.314453125, -0.21588134765625, -0.1173095703125, -0.01873779296875, 0.079833984375, 0.17840576171875, 0.2769775390625, 0.37554931640625, 0.47412109375, 0.57269287109375, 0.6712646484375, 0.76983642578125, 0.868408203125, 0.96697998046875, 1.0655517578125, 1.16412353515625, 1.2626953125, 1.36126708984375, 1.4598388671875, 1.55841064453125, 1.656982421875, 1.75555419921875, 1.8541259765625, 1.95269775390625, 2.05126953125, 2.14984130859375, 2.2484130859375, 2.34698486328125, 2.445556640625, 2.54412841796875, 2.6427001953125, 2.74127197265625, 2.83984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 11.0, 0.0, 7.0, 8.0, 10.0, 8.0, 15.0, 27.0, 27.0, 30.0, 45.0, 72.0, 86.0, 153.0, 137.0, 122.0, 63.0, 45.0, 33.0, 31.0, 12.0, 18.0, 9.0, 8.0, 10.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013294219970703125, -0.0012905895709991455, -0.0012517571449279785, -0.0012129247188568115, -0.0011740922927856445, -0.0011352598667144775, -0.0010964274406433105, -0.0010575950145721436, -0.0010187625885009766, -0.0009799301624298096, -0.0009410977363586426, -0.0009022653102874756, -0.0008634328842163086, -0.0008246004581451416, -0.0007857680320739746, -0.0007469356060028076, -0.0007081031799316406, -0.0006692707538604736, -0.0006304383277893066, -0.0005916059017181396, -0.0005527734756469727, -0.0005139410495758057, -0.00047510862350463867, -0.0004362761974334717, -0.0003974437713623047, -0.0003586113452911377, -0.0003197789192199707, -0.0002809464931488037, -0.00024211406707763672, -0.00020328164100646973, -0.00016444921493530273, -0.00012561678886413574, -8.678436279296875e-05, -4.795193672180176e-05, -9.119510650634766e-06, 2.9712915420532227e-05, 6.854534149169922e-05, 0.00010737776756286621, 0.0001462101936340332, 0.0001850426197052002, 0.0002238750457763672, 0.0002627074718475342, 0.00030153989791870117, 0.00034037232398986816, 0.00037920475006103516, 0.00041803717613220215, 0.00045686960220336914, 0.0004957020282745361, 0.0005345344543457031, 0.0005733668804168701, 0.0006121993064880371, 0.0006510317325592041, 0.0006898641586303711, 0.0007286965847015381, 0.0007675290107727051, 0.0008063614368438721, 0.0008451938629150391, 0.0008840262889862061, 0.000922858715057373, 0.00096169114112854, 0.001000523567199707, 0.001039355993270874, 0.001078188419342041, 0.001117020845413208, 0.001155853271484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 13.0, 19.0, 24.0, 36.0, 56.0, 90.0, 120.0, 177.0, 319.0, 468.0, 794.0, 1332.0, 2657.0, 5861.0, 16292.0, 55920.0, 243693.0, 577764.0, 99163.0, 26766.0, 8963.0, 3729.0, 1784.0, 964.0, 556.0, 345.0, 234.0, 127.0, 95.0, 66.0, 43.0, 34.0, 14.0, 16.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.005859375, -2.91534423828125, -2.8248291015625, -2.73431396484375, -2.643798828125, -2.55328369140625, -2.4627685546875, -2.37225341796875, -2.28173828125, -2.19122314453125, -2.1007080078125, -2.01019287109375, -1.919677734375, -1.82916259765625, -1.7386474609375, -1.64813232421875, -1.5576171875, -1.46710205078125, -1.3765869140625, -1.28607177734375, -1.195556640625, -1.10504150390625, -1.0145263671875, -0.92401123046875, -0.83349609375, -0.74298095703125, -0.6524658203125, -0.56195068359375, -0.471435546875, -0.38092041015625, -0.2904052734375, -0.19989013671875, -0.109375, -0.01885986328125, 0.0716552734375, 0.16217041015625, 0.252685546875, 0.34320068359375, 0.4337158203125, 0.52423095703125, 0.61474609375, 0.70526123046875, 0.7957763671875, 0.88629150390625, 0.976806640625, 1.06732177734375, 1.1578369140625, 1.24835205078125, 1.3388671875, 1.42938232421875, 1.5198974609375, 1.61041259765625, 1.700927734375, 1.79144287109375, 1.8819580078125, 1.97247314453125, 2.06298828125, 2.15350341796875, 2.2440185546875, 2.33453369140625, 2.425048828125, 2.51556396484375, 2.6060791015625, 2.69659423828125, 2.787109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 13.0, 7.0, 6.0, 18.0, 16.0, 25.0, 36.0, 31.0, 63.0, 68.0, 101.0, 89.0, 96.0, 98.0, 86.0, 46.0, 42.0, 39.0, 26.0, 20.0, 14.0, 10.0, 11.0, 6.0, 4.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.91845703125, -2.8173828125, -2.71630859375, -2.615234375, -2.51416015625, -2.4130859375, -2.31201171875, -2.2109375, -2.10986328125, -2.0087890625, -1.90771484375, -1.806640625, -1.70556640625, -1.6044921875, -1.50341796875, -1.40234375, -1.30126953125, -1.2001953125, -1.09912109375, -0.998046875, -0.89697265625, -0.7958984375, -0.69482421875, -0.59375, -0.49267578125, -0.3916015625, -0.29052734375, -0.189453125, -0.08837890625, 0.0126953125, 0.11376953125, 0.21484375, 0.31591796875, 0.4169921875, 0.51806640625, 0.619140625, 0.72021484375, 0.8212890625, 0.92236328125, 1.0234375, 1.12451171875, 1.2255859375, 1.32666015625, 1.427734375, 1.52880859375, 1.6298828125, 1.73095703125, 1.83203125, 1.93310546875, 2.0341796875, 2.13525390625, 2.236328125, 2.33740234375, 2.4384765625, 2.53955078125, 2.640625, 2.74169921875, 2.8427734375, 2.94384765625, 3.044921875, 3.14599609375, 3.2470703125, 3.34814453125, 3.44921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 16.0, 34.0, 76.0, 175.0, 332.0, 186.0, 80.0, 43.0, 12.0, 11.0, 8.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.56970977783203, -83.31324005126953, -80.05677032470703, -76.80030059814453, -73.54383087158203, -70.28736114501953, -67.03089904785156, -63.7744255065918, -60.5179557800293, -57.2614860534668, -54.0050163269043, -50.74855041503906, -47.49208068847656, -44.23561096191406, -40.97914123535156, -37.72267150878906, -34.46620178222656, -31.209732055664062, -27.953262329101562, -24.696794509887695, -21.440324783325195, -18.183855056762695, -14.927387237548828, -11.670917510986328, -8.414447784423828, -5.157978534698486, -1.9015092849731445, 1.354959487915039, 4.611429214477539, 7.867898941040039, 11.124366760253906, 14.380836486816406, 17.637298583984375, 20.893768310546875, 24.150238037109375, 27.406705856323242, 30.663175582885742, 33.919647216796875, 37.17611312866211, 40.43258285522461, 43.68905258178711, 46.94552230834961, 50.20199203491211, 53.458457946777344, 56.714927673339844, 59.971397399902344, 63.227867126464844, 66.48433685302734, 69.74080657958984, 72.99727630615234, 76.25374603271484, 79.51021575927734, 82.76668548583984, 86.02315521240234, 89.27961730957031, 92.53608703613281, 95.79255676269531, 99.04902648925781, 102.30549621582031, 105.56196594238281, 108.81843566894531, 112.07490539550781, 115.33137512207031, 118.58784484863281, 121.84431457519531]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 10.0, 7.0, 14.0, 10.0, 16.0, 25.0, 22.0, 20.0, 33.0, 21.0, 34.0, 35.0, 34.0, 54.0, 69.0, 79.0, 57.0, 54.0, 46.0, 47.0, 28.0, 38.0, 41.0, 22.0, 31.0, 25.0, 15.0, 16.0, 18.0, 12.0, 10.0, 4.0, 13.0, 11.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.468772888183594, -39.158447265625, -37.848121643066406, -36.53779220581055, -35.22746658325195, -33.91714096069336, -32.606815338134766, -31.296489715576172, -29.986162185668945, -28.67583656311035, -27.365509033203125, -26.05518341064453, -24.744857788085938, -23.43453025817871, -22.124204635620117, -20.81387710571289, -19.503551483154297, -18.193225860595703, -16.882898330688477, -15.572572708129883, -14.262246131896973, -12.951919555664062, -11.641593933105469, -10.331267356872559, -9.020940780639648, -7.710614204406738, -6.400288105010986, -5.089962005615234, -3.779635429382324, -2.469308853149414, -1.158982753753662, 0.15134334564208984, 1.4616737365722656, 2.7720000743865967, 4.082326412200928, 5.39265251159668, 6.70297908782959, 8.0133056640625, 9.323631286621094, 10.633957862854004, 11.944284439086914, 13.254611015319824, 14.564937591552734, 15.875263214111328, 17.185588836669922, 18.49591636657715, 19.806241989135742, 21.11656951904297, 22.426895141601562, 23.737220764160156, 25.047548294067383, 26.357873916625977, 27.668201446533203, 28.978527069091797, 30.28885269165039, 31.599178314208984, 32.909507751464844, 34.21983337402344, 35.53015899658203, 36.84048843383789, 38.150814056396484, 39.46113967895508, 40.77146530151367, 42.081790924072266, 43.39211654663086]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 8.0, 14.0, 21.0, 22.0, 33.0, 44.0, 59.0, 95.0, 105.0, 194.0, 327.0, 478.0, 860.0, 1565.0, 2888.0, 5645.0, 11858.0, 27483.0, 73475.0, 270085.0, 1364618.0, 1869566.0, 403136.0, 98454.0, 34210.0, 14534.0, 6696.0, 3354.0, 1799.0, 973.0, 597.0, 363.0, 226.0, 159.0, 79.0, 73.0, 42.0, 37.0, 30.0, 19.0, 11.0, 9.0, 6.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.52545166015625, -2.4356689453125, -2.34588623046875, -2.256103515625, -2.16632080078125, -2.0765380859375, -1.98675537109375, -1.89697265625, -1.80718994140625, -1.7174072265625, -1.62762451171875, -1.537841796875, -1.44805908203125, -1.3582763671875, -1.26849365234375, -1.1787109375, -1.08892822265625, -0.9991455078125, -0.90936279296875, -0.819580078125, -0.72979736328125, -0.6400146484375, -0.55023193359375, -0.46044921875, -0.37066650390625, -0.2808837890625, -0.19110107421875, -0.101318359375, -0.01153564453125, 0.0782470703125, 0.16802978515625, 0.2578125, 0.34759521484375, 0.4373779296875, 0.52716064453125, 0.616943359375, 0.70672607421875, 0.7965087890625, 0.88629150390625, 0.97607421875, 1.06585693359375, 1.1556396484375, 1.24542236328125, 1.335205078125, 1.42498779296875, 1.5147705078125, 1.60455322265625, 1.6943359375, 1.78411865234375, 1.8739013671875, 1.96368408203125, 2.053466796875, 2.14324951171875, 2.2330322265625, 2.32281494140625, 2.41259765625, 2.50238037109375, 2.5921630859375, 2.68194580078125, 2.771728515625, 2.86151123046875, 2.9512939453125, 3.04107666015625, 3.130859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 8.0, 10.0, 23.0, 25.0, 20.0, 24.0, 44.0, 23.0, 36.0, 38.0, 52.0, 40.0, 69.0, 73.0, 66.0, 43.0, 60.0, 72.0, 43.0, 43.0, 32.0, 33.0, 15.0, 26.0, 14.0, 12.0, 11.0, 14.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.042877197265625, -1.96075439453125, -1.878631591796875, -1.7965087890625, -1.714385986328125, -1.63226318359375, -1.550140380859375, -1.468017578125, -1.385894775390625, -1.30377197265625, -1.221649169921875, -1.1395263671875, -1.057403564453125, -0.97528076171875, -0.893157958984375, -0.81103515625, -0.728912353515625, -0.64678955078125, -0.564666748046875, -0.4825439453125, -0.400421142578125, -0.31829833984375, -0.236175537109375, -0.154052734375, -0.071929931640625, 0.01019287109375, 0.092315673828125, 0.1744384765625, 0.256561279296875, 0.33868408203125, 0.420806884765625, 0.5029296875, 0.585052490234375, 0.66717529296875, 0.749298095703125, 0.8314208984375, 0.913543701171875, 0.99566650390625, 1.077789306640625, 1.159912109375, 1.242034912109375, 1.32415771484375, 1.406280517578125, 1.4884033203125, 1.570526123046875, 1.65264892578125, 1.734771728515625, 1.81689453125, 1.899017333984375, 1.98114013671875, 2.063262939453125, 2.1453857421875, 2.227508544921875, 2.30963134765625, 2.391754150390625, 2.473876953125, 2.555999755859375, 2.63812255859375, 2.720245361328125, 2.8023681640625, 2.884490966796875, 2.96661376953125, 3.048736572265625, 3.130859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 12.0, 9.0, 13.0, 17.0, 26.0, 33.0, 47.0, 77.0, 129.0, 188.0, 364.0, 739.0, 1854.0, 5155.0, 18306.0, 84704.0, 831358.0, 2933262.0, 261103.0, 41012.0, 10159.0, 3243.0, 1155.0, 565.0, 277.0, 162.0, 95.0, 60.0, 41.0, 33.0, 20.0, 16.0, 13.0, 16.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.31719970703125, -5.1148681640625, -4.91253662109375, -4.710205078125, -4.50787353515625, -4.3055419921875, -4.10321044921875, -3.90087890625, -3.69854736328125, -3.4962158203125, -3.29388427734375, -3.091552734375, -2.88922119140625, -2.6868896484375, -2.48455810546875, -2.2822265625, -2.07989501953125, -1.8775634765625, -1.67523193359375, -1.472900390625, -1.27056884765625, -1.0682373046875, -0.86590576171875, -0.66357421875, -0.46124267578125, -0.2589111328125, -0.05657958984375, 0.145751953125, 0.34808349609375, 0.5504150390625, 0.75274658203125, 0.955078125, 1.15740966796875, 1.3597412109375, 1.56207275390625, 1.764404296875, 1.96673583984375, 2.1690673828125, 2.37139892578125, 2.57373046875, 2.77606201171875, 2.9783935546875, 3.18072509765625, 3.383056640625, 3.58538818359375, 3.7877197265625, 3.99005126953125, 4.1923828125, 4.39471435546875, 4.5970458984375, 4.79937744140625, 5.001708984375, 5.20404052734375, 5.4063720703125, 5.60870361328125, 5.81103515625, 6.01336669921875, 6.2156982421875, 6.41802978515625, 6.620361328125, 6.82269287109375, 7.0250244140625, 7.22735595703125, 7.4296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 3.0, 11.0, 15.0, 11.0, 20.0, 21.0, 25.0, 24.0, 37.0, 55.0, 74.0, 89.0, 133.0, 193.0, 298.0, 347.0, 489.0, 504.0, 460.0, 343.0, 229.0, 182.0, 116.0, 90.0, 59.0, 53.0, 40.0, 32.0, 23.0, 18.0, 18.0, 9.0, 8.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.8359375, -4.686279296875, -4.53662109375, -4.386962890625, -4.2373046875, -4.087646484375, -3.93798828125, -3.788330078125, -3.638671875, -3.489013671875, -3.33935546875, -3.189697265625, -3.0400390625, -2.890380859375, -2.74072265625, -2.591064453125, -2.44140625, -2.291748046875, -2.14208984375, -1.992431640625, -1.8427734375, -1.693115234375, -1.54345703125, -1.393798828125, -1.244140625, -1.094482421875, -0.94482421875, -0.795166015625, -0.6455078125, -0.495849609375, -0.34619140625, -0.196533203125, -0.046875, 0.102783203125, 0.25244140625, 0.402099609375, 0.5517578125, 0.701416015625, 0.85107421875, 1.000732421875, 1.150390625, 1.300048828125, 1.44970703125, 1.599365234375, 1.7490234375, 1.898681640625, 2.04833984375, 2.197998046875, 2.34765625, 2.497314453125, 2.64697265625, 2.796630859375, 2.9462890625, 3.095947265625, 3.24560546875, 3.395263671875, 3.544921875, 3.694580078125, 3.84423828125, 3.993896484375, 4.1435546875, 4.293212890625, 4.44287109375, 4.592529296875, 4.7421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 11.0, 27.0, 52.0, 94.0, 166.0, 185.0, 170.0, 109.0, 89.0, 36.0, 17.0, 9.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.386962890625, -72.24458312988281, -70.10221099853516, -67.95983123779297, -65.81745910644531, -63.675079345703125, -61.5327033996582, -59.39032745361328, -57.247947692871094, -55.10557174682617, -52.96319580078125, -50.82081604003906, -48.67844009399414, -46.53606414794922, -44.3936882019043, -42.251312255859375, -40.10893630981445, -37.96656036376953, -35.82418441772461, -33.68180847167969, -31.5394287109375, -29.397052764892578, -27.254676818847656, -25.112300872802734, -22.96992301940918, -20.827547073364258, -18.685169219970703, -16.54279327392578, -14.400416374206543, -12.258039474487305, -10.115663528442383, -7.9732866287231445, -5.830905914306641, -3.6885292530059814, -1.5461525917053223, 0.5962238311767578, 2.738600730895996, 4.880977630615234, 7.023353576660156, 9.165730476379395, 11.308107376098633, 13.450484275817871, 15.59286117553711, 17.73523712158203, 19.877613067626953, 22.019990921020508, 24.16236686706543, 26.304744720458984, 28.447120666503906, 30.589496612548828, 32.73187255859375, 34.87425231933594, 37.01662826538086, 39.15900421142578, 41.3013801574707, 43.443756103515625, 45.58613586425781, 47.728511810302734, 49.870887756347656, 52.013267517089844, 54.155643463134766, 56.29801940917969, 58.44039535522461, 60.58277130126953, 62.72514724731445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 1.0, 6.0, 9.0, 9.0, 17.0, 20.0, 15.0, 23.0, 31.0, 37.0, 35.0, 33.0, 46.0, 46.0, 58.0, 45.0, 60.0, 55.0, 35.0, 48.0, 48.0, 45.0, 29.0, 38.0, 26.0, 41.0, 27.0, 26.0, 22.0, 11.0, 12.0, 13.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.262693405151367, -30.378803253173828, -29.494915008544922, -28.611024856567383, -27.727134704589844, -26.843246459960938, -25.9593563079834, -25.07546615600586, -24.191577911376953, -23.307687759399414, -22.423799514770508, -21.53990936279297, -20.65601921081543, -19.77212905883789, -18.888240814208984, -18.004350662231445, -17.120460510253906, -16.236570358276367, -15.352681159973145, -14.468791961669922, -13.584901809692383, -12.70101261138916, -11.817123413085938, -10.933233261108398, -10.049344062805176, -9.165454864501953, -8.281564712524414, -7.397675514221191, -6.5137858390808105, -5.62989616394043, -4.746006965637207, -3.862117290496826, -2.978229522705078, -2.0943398475646973, -1.2104504108428955, -0.32656097412109375, 0.5573287010192871, 1.441218376159668, 2.3251075744628906, 3.2089972496032715, 4.092886924743652, 4.976776599884033, 5.860666275024414, 6.744555473327637, 7.628445148468018, 8.512334823608398, 9.396224021911621, 10.280113220214844, 11.164003372192383, 12.047892570495605, 12.931782722473145, 13.815671920776367, 14.699562072753906, 15.583451271057129, 16.46734046936035, 17.35123062133789, 18.235118865966797, 19.119009017944336, 20.002897262573242, 20.88678741455078, 21.77067756652832, 22.65456771850586, 23.538455963134766, 24.422346115112305, 25.306236267089844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 14.0, 15.0, 31.0, 57.0, 91.0, 187.0, 331.0, 661.0, 1428.0, 3143.0, 8369.0, 28468.0, 135205.0, 501997.0, 288391.0, 57033.0, 14189.0, 4964.0, 2008.0, 940.0, 496.0, 231.0, 121.0, 71.0, 39.0, 28.0, 14.0, 14.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.015625, -5.8472900390625, -5.678955078125, -5.5106201171875, -5.34228515625, -5.1739501953125, -5.005615234375, -4.8372802734375, -4.6689453125, -4.5006103515625, -4.332275390625, -4.1639404296875, -3.99560546875, -3.8272705078125, -3.658935546875, -3.4906005859375, -3.322265625, -3.1539306640625, -2.985595703125, -2.8172607421875, -2.64892578125, -2.4805908203125, -2.312255859375, -2.1439208984375, -1.9755859375, -1.8072509765625, -1.638916015625, -1.4705810546875, -1.30224609375, -1.1339111328125, -0.965576171875, -0.7972412109375, -0.62890625, -0.4605712890625, -0.292236328125, -0.1239013671875, 0.04443359375, 0.2127685546875, 0.381103515625, 0.5494384765625, 0.7177734375, 0.8861083984375, 1.054443359375, 1.2227783203125, 1.39111328125, 1.5594482421875, 1.727783203125, 1.8961181640625, 2.064453125, 2.2327880859375, 2.401123046875, 2.5694580078125, 2.73779296875, 2.9061279296875, 3.074462890625, 3.2427978515625, 3.4111328125, 3.5794677734375, 3.747802734375, 3.9161376953125, 4.08447265625, 4.2528076171875, 4.421142578125, 4.5894775390625, 4.7578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 14.0, 11.0, 15.0, 18.0, 16.0, 30.0, 30.0, 28.0, 43.0, 32.0, 40.0, 50.0, 48.0, 50.0, 46.0, 49.0, 61.0, 47.0, 52.0, 45.0, 46.0, 34.0, 24.0, 38.0, 21.0, 17.0, 15.0, 18.0, 13.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.033172607421875, -1.95501708984375, -1.876861572265625, -1.7987060546875, -1.720550537109375, -1.64239501953125, -1.564239501953125, -1.486083984375, -1.407928466796875, -1.32977294921875, -1.251617431640625, -1.1734619140625, -1.095306396484375, -1.01715087890625, -0.938995361328125, -0.86083984375, -0.782684326171875, -0.70452880859375, -0.626373291015625, -0.5482177734375, -0.470062255859375, -0.39190673828125, -0.313751220703125, -0.235595703125, -0.157440185546875, -0.07928466796875, -0.001129150390625, 0.0770263671875, 0.155181884765625, 0.23333740234375, 0.311492919921875, 0.3896484375, 0.467803955078125, 0.54595947265625, 0.624114990234375, 0.7022705078125, 0.780426025390625, 0.85858154296875, 0.936737060546875, 1.014892578125, 1.093048095703125, 1.17120361328125, 1.249359130859375, 1.3275146484375, 1.405670166015625, 1.48382568359375, 1.561981201171875, 1.64013671875, 1.718292236328125, 1.79644775390625, 1.874603271484375, 1.9527587890625, 2.030914306640625, 2.10906982421875, 2.187225341796875, 2.265380859375, 2.343536376953125, 2.42169189453125, 2.499847412109375, 2.5780029296875, 2.656158447265625, 2.73431396484375, 2.812469482421875, 2.890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 6.0, 4.0, 7.0, 9.0, 11.0, 21.0, 25.0, 41.0, 65.0, 103.0, 174.0, 336.0, 725.0, 1603.0, 3992.0, 13877.0, 82835.0, 677201.0, 226891.0, 29452.0, 6712.0, 2414.0, 945.0, 481.0, 269.0, 131.0, 79.0, 39.0, 32.0, 22.0, 13.0, 12.0, 5.0, 5.0, 2.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.151123046875, -4.94287109375, -4.734619140625, -4.5263671875, -4.318115234375, -4.10986328125, -3.901611328125, -3.693359375, -3.485107421875, -3.27685546875, -3.068603515625, -2.8603515625, -2.652099609375, -2.44384765625, -2.235595703125, -2.02734375, -1.819091796875, -1.61083984375, -1.402587890625, -1.1943359375, -0.986083984375, -0.77783203125, -0.569580078125, -0.361328125, -0.153076171875, 0.05517578125, 0.263427734375, 0.4716796875, 0.679931640625, 0.88818359375, 1.096435546875, 1.3046875, 1.512939453125, 1.72119140625, 1.929443359375, 2.1376953125, 2.345947265625, 2.55419921875, 2.762451171875, 2.970703125, 3.178955078125, 3.38720703125, 3.595458984375, 3.8037109375, 4.011962890625, 4.22021484375, 4.428466796875, 4.63671875, 4.844970703125, 5.05322265625, 5.261474609375, 5.4697265625, 5.677978515625, 5.88623046875, 6.094482421875, 6.302734375, 6.510986328125, 6.71923828125, 6.927490234375, 7.1357421875, 7.343994140625, 7.55224609375, 7.760498046875, 7.96875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 6.0, 7.0, 4.0, 9.0, 17.0, 23.0, 22.0, 21.0, 33.0, 38.0, 45.0, 37.0, 48.0, 52.0, 41.0, 61.0, 58.0, 58.0, 51.0, 51.0, 51.0, 47.0, 43.0, 24.0, 30.0, 20.0, 18.0, 9.0, 18.0, 4.0, 12.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.2684326171875, -7.989990234375, -7.7115478515625, -7.43310546875, -7.1546630859375, -6.876220703125, -6.5977783203125, -6.3193359375, -6.0408935546875, -5.762451171875, -5.4840087890625, -5.20556640625, -4.9271240234375, -4.648681640625, -4.3702392578125, -4.091796875, -3.8133544921875, -3.534912109375, -3.2564697265625, -2.97802734375, -2.6995849609375, -2.421142578125, -2.1427001953125, -1.8642578125, -1.5858154296875, -1.307373046875, -1.0289306640625, -0.75048828125, -0.4720458984375, -0.193603515625, 0.0848388671875, 0.36328125, 0.6417236328125, 0.920166015625, 1.1986083984375, 1.47705078125, 1.7554931640625, 2.033935546875, 2.3123779296875, 2.5908203125, 2.8692626953125, 3.147705078125, 3.4261474609375, 3.70458984375, 3.9830322265625, 4.261474609375, 4.5399169921875, 4.818359375, 5.0968017578125, 5.375244140625, 5.6536865234375, 5.93212890625, 6.2105712890625, 6.489013671875, 6.7674560546875, 7.0458984375, 7.3243408203125, 7.602783203125, 7.8812255859375, 8.15966796875, 8.4381103515625, 8.716552734375, 8.9949951171875, 9.2734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 19.0, 30.0, 38.0, 67.0, 80.0, 197.0, 387.0, 723.0, 1460.0, 3341.0, 8208.0, 23355.0, 81306.0, 317609.0, 483039.0, 88180.0, 25075.0, 8683.0, 3526.0, 1612.0, 734.0, 373.0, 179.0, 106.0, 75.0, 40.0, 34.0, 16.0, 14.0, 7.0, 9.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.855987548828125, -1.79205322265625, -1.728118896484375, -1.6641845703125, -1.600250244140625, -1.53631591796875, -1.472381591796875, -1.408447265625, -1.344512939453125, -1.28057861328125, -1.216644287109375, -1.1527099609375, -1.088775634765625, -1.02484130859375, -0.960906982421875, -0.89697265625, -0.833038330078125, -0.76910400390625, -0.705169677734375, -0.6412353515625, -0.577301025390625, -0.51336669921875, -0.449432373046875, -0.385498046875, -0.321563720703125, -0.25762939453125, -0.193695068359375, -0.1297607421875, -0.065826416015625, -0.00189208984375, 0.062042236328125, 0.1259765625, 0.189910888671875, 0.25384521484375, 0.317779541015625, 0.3817138671875, 0.445648193359375, 0.50958251953125, 0.573516845703125, 0.637451171875, 0.701385498046875, 0.76531982421875, 0.829254150390625, 0.8931884765625, 0.957122802734375, 1.02105712890625, 1.084991455078125, 1.14892578125, 1.212860107421875, 1.27679443359375, 1.340728759765625, 1.4046630859375, 1.468597412109375, 1.53253173828125, 1.596466064453125, 1.660400390625, 1.724334716796875, 1.78826904296875, 1.852203369140625, 1.9161376953125, 1.980072021484375, 2.04400634765625, 2.107940673828125, 2.171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 4.0, 12.0, 16.0, 17.0, 29.0, 49.0, 87.0, 116.0, 155.0, 126.0, 131.0, 84.0, 55.0, 35.0, 23.0, 16.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008730888366699219, -0.0008431300520896912, -0.0008131712675094604, -0.0007832124829292297, -0.000753253698348999, -0.0007232949137687683, -0.0006933361291885376, -0.0006633773446083069, -0.0006334185600280762, -0.0006034597754478455, -0.0005735009908676147, -0.000543542206287384, -0.0005135834217071533, -0.0004836246371269226, -0.0004536658525466919, -0.0004237070679664612, -0.00039374828338623047, -0.00036378949880599976, -0.00033383071422576904, -0.00030387192964553833, -0.0002739131450653076, -0.0002439543604850769, -0.0002139955759048462, -0.00018403679132461548, -0.00015407800674438477, -0.00012411922216415405, -9.416043758392334e-05, -6.420165300369263e-05, -3.4242868423461914e-05, -4.284083843231201e-06, 2.5674700736999512e-05, 5.5633485317230225e-05, 8.559226989746094e-05, 0.00011555105447769165, 0.00014550983905792236, 0.00017546862363815308, 0.0002054274082183838, 0.0002353861927986145, 0.0002653449773788452, 0.00029530376195907593, 0.00032526254653930664, 0.00035522133111953735, 0.00038518011569976807, 0.0004151389002799988, 0.0004450976848602295, 0.0004750564694404602, 0.0005050152540206909, 0.0005349740386009216, 0.0005649328231811523, 0.0005948916077613831, 0.0006248503923416138, 0.0006548091769218445, 0.0006847679615020752, 0.0007147267460823059, 0.0007446855306625366, 0.0007746443152427673, 0.000804603099822998, 0.0008345618844032288, 0.0008645206689834595, 0.0008944794535636902, 0.0009244382381439209, 0.0009543970227241516, 0.0009843558073043823, 0.001014314591884613, 0.0010442733764648438]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 9.0, 5.0, 14.0, 11.0, 36.0, 35.0, 58.0, 99.0, 180.0, 322.0, 603.0, 1247.0, 2648.0, 6230.0, 16642.0, 53704.0, 197351.0, 560248.0, 145656.0, 40734.0, 13305.0, 5043.0, 2159.0, 995.0, 504.0, 300.0, 145.0, 85.0, 61.0, 34.0, 25.0, 20.0, 8.0, 6.0, 7.0, 3.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-2.48046875, -2.4158477783203125, -2.351226806640625, -2.2866058349609375, -2.22198486328125, -2.1573638916015625, -2.092742919921875, -2.0281219482421875, -1.9635009765625, -1.8988800048828125, -1.834259033203125, -1.7696380615234375, -1.70501708984375, -1.6403961181640625, -1.575775146484375, -1.5111541748046875, -1.446533203125, -1.3819122314453125, -1.317291259765625, -1.2526702880859375, -1.18804931640625, -1.1234283447265625, -1.058807373046875, -0.9941864013671875, -0.9295654296875, -0.8649444580078125, -0.800323486328125, -0.7357025146484375, -0.67108154296875, -0.6064605712890625, -0.541839599609375, -0.4772186279296875, -0.41259765625, -0.3479766845703125, -0.283355712890625, -0.2187347412109375, -0.15411376953125, -0.0894927978515625, -0.024871826171875, 0.0397491455078125, 0.1043701171875, 0.1689910888671875, 0.233612060546875, 0.2982330322265625, 0.36285400390625, 0.4274749755859375, 0.492095947265625, 0.5567169189453125, 0.621337890625, 0.6859588623046875, 0.750579833984375, 0.8152008056640625, 0.87982177734375, 0.9444427490234375, 1.009063720703125, 1.0736846923828125, 1.1383056640625, 1.2029266357421875, 1.267547607421875, 1.3321685791015625, 1.39678955078125, 1.4614105224609375, 1.526031494140625, 1.5906524658203125, 1.6552734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 6.0, 13.0, 19.0, 24.0, 23.0, 20.0, 33.0, 35.0, 37.0, 50.0, 60.0, 56.0, 80.0, 61.0, 66.0, 60.0, 50.0, 68.0, 37.0, 32.0, 32.0, 22.0, 16.0, 11.0, 12.0, 6.0, 7.0, 5.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.794921875, -1.7410125732421875, -1.687103271484375, -1.6331939697265625, -1.57928466796875, -1.5253753662109375, -1.471466064453125, -1.4175567626953125, -1.3636474609375, -1.3097381591796875, -1.255828857421875, -1.2019195556640625, -1.14801025390625, -1.0941009521484375, -1.040191650390625, -0.9862823486328125, -0.932373046875, -0.8784637451171875, -0.824554443359375, -0.7706451416015625, -0.71673583984375, -0.6628265380859375, -0.608917236328125, -0.5550079345703125, -0.5010986328125, -0.4471893310546875, -0.393280029296875, -0.3393707275390625, -0.28546142578125, -0.2315521240234375, -0.177642822265625, -0.1237335205078125, -0.06982421875, -0.0159149169921875, 0.037994384765625, 0.0919036865234375, 0.14581298828125, 0.1997222900390625, 0.253631591796875, 0.3075408935546875, 0.3614501953125, 0.4153594970703125, 0.469268798828125, 0.5231781005859375, 0.57708740234375, 0.6309967041015625, 0.684906005859375, 0.7388153076171875, 0.792724609375, 0.8466339111328125, 0.900543212890625, 0.9544525146484375, 1.00836181640625, 1.0622711181640625, 1.116180419921875, 1.1700897216796875, 1.2239990234375, 1.2779083251953125, 1.331817626953125, 1.3857269287109375, 1.43963623046875, 1.4935455322265625, 1.547454833984375, 1.6013641357421875, 1.6552734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 16.0, 34.0, 61.0, 133.0, 226.0, 187.0, 142.0, 76.0, 33.0, 32.0, 15.0, 5.0, 3.0, 1.0, 1.0, 8.0, 0.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.842132568359375, -42.143985748291016, -40.44583511352539, -38.74768829345703, -37.049537658691406, -35.35139083862305, -33.65324401855469, -31.955095291137695, -30.256946563720703, -28.55879783630371, -26.86064910888672, -25.16250228881836, -23.464353561401367, -21.766204833984375, -20.068058013916016, -18.369909286499023, -16.67176055908203, -14.973611831665039, -13.275464057922363, -11.577316284179688, -9.879167556762695, -8.181018829345703, -6.482871055603027, -4.784723281860352, -3.0865745544433594, -1.3884263038635254, 0.3097219467163086, 2.0078701972961426, 3.7060184478759766, 5.404167175292969, 7.1023149490356445, 8.80046272277832, 10.498611450195312, 12.196760177612305, 13.89490795135498, 15.593055725097656, 17.29120445251465, 18.98935317993164, 20.6875, 22.385648727416992, 24.083797454833984, 25.781946182250977, 27.48009490966797, 29.178241729736328, 30.87639045715332, 32.57453918457031, 34.27268600463867, 35.97083282470703, 37.668983459472656, 39.367130279541016, 41.06528091430664, 42.763427734375, 44.461578369140625, 46.159725189208984, 47.857872009277344, 49.55602264404297, 51.25416946411133, 52.95231628417969, 54.65046691894531, 56.34861373901367, 58.04676055908203, 59.744911193847656, 61.443058013916016, 63.141204833984375, 64.83935546875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 2.0, 11.0, 5.0, 9.0, 8.0, 12.0, 14.0, 19.0, 21.0, 22.0, 20.0, 24.0, 32.0, 34.0, 29.0, 44.0, 59.0, 67.0, 81.0, 80.0, 64.0, 47.0, 48.0, 35.0, 30.0, 29.0, 33.0, 14.0, 19.0, 12.0, 14.0, 12.0, 8.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.29172897338867, -35.244815826416016, -34.19790267944336, -33.1509895324707, -32.10407638549805, -31.05716323852539, -30.0102481842041, -28.963335037231445, -27.91642189025879, -26.869508743286133, -25.822595596313477, -24.77568244934082, -23.72876739501953, -22.681854248046875, -21.63494110107422, -20.588027954101562, -19.541114807128906, -18.49420166015625, -17.447288513183594, -16.400375366210938, -15.353461265563965, -14.306548118591309, -13.259634017944336, -12.21272087097168, -11.165807723999023, -10.118894577026367, -9.071981430053711, -8.025067329406738, -6.978154182434082, -5.931241035461426, -4.884327411651611, -3.837413787841797, -2.7905006408691406, -1.7435872554779053, -0.6966738700866699, 0.35023951530456543, 1.3971529006958008, 2.444066047668457, 3.4909796714782715, 4.537893295288086, 5.584806442260742, 6.631719589233398, 7.678633213043213, 8.725546836853027, 9.772459983825684, 10.81937313079834, 11.866287231445312, 12.913200378417969, 13.960113525390625, 15.007026672363281, 16.053939819335938, 17.100852966308594, 18.14776611328125, 19.194679260253906, 20.241594314575195, 21.28850746154785, 22.335420608520508, 23.382333755493164, 24.42924690246582, 25.476160049438477, 26.523075103759766, 27.569988250732422, 28.616901397705078, 29.663814544677734, 30.71072769165039]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 16.0, 36.0, 79.0, 122.0, 233.0, 418.0, 835.0, 1788.0, 4246.0, 11790.0, 38542.0, 172556.0, 1401551.0, 2210711.0, 273742.0, 52624.0, 15257.0, 5465.0, 2149.0, 1037.0, 502.0, 253.0, 131.0, 71.0, 42.0, 28.0, 15.0, 7.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.344573974609375, -4.22430419921875, -4.104034423828125, -3.9837646484375, -3.863494873046875, -3.74322509765625, -3.622955322265625, -3.502685546875, -3.382415771484375, -3.26214599609375, -3.141876220703125, -3.0216064453125, -2.901336669921875, -2.78106689453125, -2.660797119140625, -2.54052734375, -2.420257568359375, -2.29998779296875, -2.179718017578125, -2.0594482421875, -1.939178466796875, -1.81890869140625, -1.698638916015625, -1.578369140625, -1.458099365234375, -1.33782958984375, -1.217559814453125, -1.0972900390625, -0.977020263671875, -0.85675048828125, -0.736480712890625, -0.6162109375, -0.495941162109375, -0.37567138671875, -0.255401611328125, -0.1351318359375, -0.014862060546875, 0.10540771484375, 0.225677490234375, 0.345947265625, 0.466217041015625, 0.58648681640625, 0.706756591796875, 0.8270263671875, 0.947296142578125, 1.06756591796875, 1.187835693359375, 1.30810546875, 1.428375244140625, 1.54864501953125, 1.668914794921875, 1.7891845703125, 1.909454345703125, 2.02972412109375, 2.149993896484375, 2.270263671875, 2.390533447265625, 2.51080322265625, 2.631072998046875, 2.7513427734375, 2.871612548828125, 2.99188232421875, 3.112152099609375, 3.232421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 1.0, 9.0, 6.0, 2.0, 15.0, 16.0, 13.0, 17.0, 33.0, 31.0, 21.0, 40.0, 36.0, 37.0, 32.0, 39.0, 45.0, 47.0, 51.0, 42.0, 44.0, 40.0, 49.0, 43.0, 38.0, 30.0, 30.0, 34.0, 28.0, 26.0, 19.0, 11.0, 20.0, 7.0, 10.0, 12.0, 3.0, 4.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.15625, -2.0888671875, -2.021484375, -1.9541015625, -1.88671875, -1.8193359375, -1.751953125, -1.6845703125, -1.6171875, -1.5498046875, -1.482421875, -1.4150390625, -1.34765625, -1.2802734375, -1.212890625, -1.1455078125, -1.078125, -1.0107421875, -0.943359375, -0.8759765625, -0.80859375, -0.7412109375, -0.673828125, -0.6064453125, -0.5390625, -0.4716796875, -0.404296875, -0.3369140625, -0.26953125, -0.2021484375, -0.134765625, -0.0673828125, 0.0, 0.0673828125, 0.134765625, 0.2021484375, 0.26953125, 0.3369140625, 0.404296875, 0.4716796875, 0.5390625, 0.6064453125, 0.673828125, 0.7412109375, 0.80859375, 0.8759765625, 0.943359375, 1.0107421875, 1.078125, 1.1455078125, 1.212890625, 1.2802734375, 1.34765625, 1.4150390625, 1.482421875, 1.5498046875, 1.6171875, 1.6845703125, 1.751953125, 1.8193359375, 1.88671875, 1.9541015625, 2.021484375, 2.0888671875, 2.15625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 5.0, 3.0, 10.0, 16.0, 16.0, 29.0, 33.0, 56.0, 80.0, 138.0, 299.0, 721.0, 1718.0, 5771.0, 23904.0, 161146.0, 2732349.0, 1162828.0, 83934.0, 14981.0, 4005.0, 1212.0, 481.0, 186.0, 132.0, 70.0, 26.0, 30.0, 22.0, 19.0, 11.0, 14.0, 3.0, 5.0, 2.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5703125, -6.364013671875, -6.15771484375, -5.951416015625, -5.7451171875, -5.538818359375, -5.33251953125, -5.126220703125, -4.919921875, -4.713623046875, -4.50732421875, -4.301025390625, -4.0947265625, -3.888427734375, -3.68212890625, -3.475830078125, -3.26953125, -3.063232421875, -2.85693359375, -2.650634765625, -2.4443359375, -2.238037109375, -2.03173828125, -1.825439453125, -1.619140625, -1.412841796875, -1.20654296875, -1.000244140625, -0.7939453125, -0.587646484375, -0.38134765625, -0.175048828125, 0.03125, 0.237548828125, 0.44384765625, 0.650146484375, 0.8564453125, 1.062744140625, 1.26904296875, 1.475341796875, 1.681640625, 1.887939453125, 2.09423828125, 2.300537109375, 2.5068359375, 2.713134765625, 2.91943359375, 3.125732421875, 3.33203125, 3.538330078125, 3.74462890625, 3.950927734375, 4.1572265625, 4.363525390625, 4.56982421875, 4.776123046875, 4.982421875, 5.188720703125, 5.39501953125, 5.601318359375, 5.8076171875, 6.013916015625, 6.22021484375, 6.426513671875, 6.6328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 6.0, 22.0, 24.0, 27.0, 40.0, 56.0, 68.0, 81.0, 141.0, 168.0, 267.0, 429.0, 595.0, 582.0, 437.0, 307.0, 233.0, 147.0, 120.0, 63.0, 55.0, 36.0, 32.0, 25.0, 7.0, 13.0, 16.0, 10.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.3515625, -5.20367431640625, -5.0557861328125, -4.90789794921875, -4.760009765625, -4.61212158203125, -4.4642333984375, -4.31634521484375, -4.16845703125, -4.02056884765625, -3.8726806640625, -3.72479248046875, -3.576904296875, -3.42901611328125, -3.2811279296875, -3.13323974609375, -2.9853515625, -2.83746337890625, -2.6895751953125, -2.54168701171875, -2.393798828125, -2.24591064453125, -2.0980224609375, -1.95013427734375, -1.80224609375, -1.65435791015625, -1.5064697265625, -1.35858154296875, -1.210693359375, -1.06280517578125, -0.9149169921875, -0.76702880859375, -0.619140625, -0.47125244140625, -0.3233642578125, -0.17547607421875, -0.027587890625, 0.12030029296875, 0.2681884765625, 0.41607666015625, 0.56396484375, 0.71185302734375, 0.8597412109375, 1.00762939453125, 1.155517578125, 1.30340576171875, 1.4512939453125, 1.59918212890625, 1.7470703125, 1.89495849609375, 2.0428466796875, 2.19073486328125, 2.338623046875, 2.48651123046875, 2.6343994140625, 2.78228759765625, 2.93017578125, 3.07806396484375, 3.2259521484375, 3.37384033203125, 3.521728515625, 3.66961669921875, 3.8175048828125, 3.96539306640625, 4.11328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 10.0, 15.0, 28.0, 77.0, 147.0, 233.0, 214.0, 156.0, 65.0, 29.0, 18.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-118.6193618774414, -116.09321594238281, -113.56706237792969, -111.04090881347656, -108.51476287841797, -105.98861694335938, -103.46246337890625, -100.93630981445312, -98.41016387939453, -95.88401794433594, -93.35786437988281, -90.83171081542969, -88.3055648803711, -85.7794189453125, -83.25326538085938, -80.72711181640625, -78.20096588134766, -75.67481994628906, -73.14866638183594, -70.62251281738281, -68.09636688232422, -65.57022094726562, -63.0440673828125, -60.51791763305664, -57.99176788330078, -55.46561813354492, -52.93946838378906, -50.4133186340332, -47.887168884277344, -45.361019134521484, -42.834869384765625, -40.308719635009766, -37.78256607055664, -35.25641632080078, -32.73026657104492, -30.204116821289062, -27.677967071533203, -25.151817321777344, -22.625667572021484, -20.099517822265625, -17.573368072509766, -15.047218322753906, -12.521068572998047, -9.994918823242188, -7.468769073486328, -4.942619323730469, -2.4164695739746094, 0.10968017578125, 2.6358299255371094, 5.161979675292969, 7.688129425048828, 10.214279174804688, 12.740428924560547, 15.266578674316406, 17.792728424072266, 20.318878173828125, 22.845027923583984, 25.371177673339844, 27.897327423095703, 30.423477172851562, 32.94962692260742, 35.47577667236328, 38.00192642211914, 40.528076171875, 43.05422592163086]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 2.0, 6.0, 14.0, 8.0, 8.0, 11.0, 11.0, 15.0, 22.0, 20.0, 15.0, 24.0, 34.0, 26.0, 32.0, 38.0, 36.0, 31.0, 55.0, 50.0, 57.0, 56.0, 52.0, 48.0, 41.0, 43.0, 28.0, 30.0, 19.0, 23.0, 18.0, 21.0, 15.0, 16.0, 15.0, 14.0, 8.0, 6.0, 2.0, 7.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-24.950990676879883, -24.231101989746094, -23.511215209960938, -22.79132652282715, -22.07143783569336, -21.351551055908203, -20.631662368774414, -19.911773681640625, -19.19188690185547, -18.47199821472168, -17.752111434936523, -17.032222747802734, -16.312335968017578, -15.592447280883789, -14.87255859375, -14.152670860290527, -13.432783126831055, -12.712895393371582, -11.99300765991211, -11.27311897277832, -10.553231239318848, -9.833343505859375, -9.113454818725586, -8.393567085266113, -7.673679351806641, -6.953791618347168, -6.233903408050537, -5.514015197753906, -4.794127464294434, -4.074239730834961, -3.35435152053833, -2.634463310241699, -1.9145736694335938, -1.194685697555542, -0.47479772567749023, 0.24509024620056152, 0.9649782180786133, 1.684866189956665, 2.404754161834717, 3.1246423721313477, 3.8445301055908203, 4.564417839050293, 5.284306049346924, 6.004194259643555, 6.724081993103027, 7.4439697265625, 8.163858413696289, 8.883746147155762, 9.603633880615234, 10.323521614074707, 11.04340934753418, 11.763298034667969, 12.483185768127441, 13.203073501586914, 13.922962188720703, 14.642849922180176, 15.362737655639648, 16.082626342773438, 16.802513122558594, 17.522401809692383, 18.242290496826172, 18.962177276611328, 19.682065963745117, 20.401954650878906, 21.121841430664062]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 11.0, 18.0, 28.0, 41.0, 75.0, 131.0, 181.0, 339.0, 632.0, 1233.0, 2283.0, 5424.0, 13611.0, 40381.0, 142091.0, 435471.0, 288407.0, 77921.0, 24149.0, 8669.0, 3661.0, 1697.0, 893.0, 496.0, 291.0, 157.0, 81.0, 67.0, 32.0, 30.0, 19.0, 11.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.45025634765625, -4.3184814453125, -4.18670654296875, -4.054931640625, -3.92315673828125, -3.7913818359375, -3.65960693359375, -3.52783203125, -3.39605712890625, -3.2642822265625, -3.13250732421875, -3.000732421875, -2.86895751953125, -2.7371826171875, -2.60540771484375, -2.4736328125, -2.34185791015625, -2.2100830078125, -2.07830810546875, -1.946533203125, -1.81475830078125, -1.6829833984375, -1.55120849609375, -1.41943359375, -1.28765869140625, -1.1558837890625, -1.02410888671875, -0.892333984375, -0.76055908203125, -0.6287841796875, -0.49700927734375, -0.365234375, -0.23345947265625, -0.1016845703125, 0.03009033203125, 0.161865234375, 0.29364013671875, 0.4254150390625, 0.55718994140625, 0.68896484375, 0.82073974609375, 0.9525146484375, 1.08428955078125, 1.216064453125, 1.34783935546875, 1.4796142578125, 1.61138916015625, 1.7431640625, 1.87493896484375, 2.0067138671875, 2.13848876953125, 2.270263671875, 2.40203857421875, 2.5338134765625, 2.66558837890625, 2.79736328125, 2.92913818359375, 3.0609130859375, 3.19268798828125, 3.324462890625, 3.45623779296875, 3.5880126953125, 3.71978759765625, 3.8515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 11.0, 12.0, 9.0, 13.0, 15.0, 18.0, 10.0, 17.0, 19.0, 24.0, 29.0, 33.0, 32.0, 30.0, 40.0, 33.0, 33.0, 35.0, 45.0, 33.0, 39.0, 54.0, 34.0, 45.0, 33.0, 33.0, 38.0, 26.0, 15.0, 35.0, 27.0, 19.0, 15.0, 12.0, 10.0, 8.0, 9.0, 6.0, 9.0, 0.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.19140625, -2.1271514892578125, -2.062896728515625, -1.9986419677734375, -1.93438720703125, -1.8701324462890625, -1.805877685546875, -1.7416229248046875, -1.6773681640625, -1.6131134033203125, -1.548858642578125, -1.4846038818359375, -1.42034912109375, -1.3560943603515625, -1.291839599609375, -1.2275848388671875, -1.163330078125, -1.0990753173828125, -1.034820556640625, -0.9705657958984375, -0.90631103515625, -0.8420562744140625, -0.777801513671875, -0.7135467529296875, -0.6492919921875, -0.5850372314453125, -0.520782470703125, -0.4565277099609375, -0.39227294921875, -0.3280181884765625, -0.263763427734375, -0.1995086669921875, -0.13525390625, -0.0709991455078125, -0.006744384765625, 0.0575103759765625, 0.12176513671875, 0.1860198974609375, 0.250274658203125, 0.3145294189453125, 0.3787841796875, 0.4430389404296875, 0.507293701171875, 0.5715484619140625, 0.63580322265625, 0.7000579833984375, 0.764312744140625, 0.8285675048828125, 0.892822265625, 0.9570770263671875, 1.021331787109375, 1.0855865478515625, 1.14984130859375, 1.2140960693359375, 1.278350830078125, 1.3426055908203125, 1.4068603515625, 1.4711151123046875, 1.535369873046875, 1.5996246337890625, 1.66387939453125, 1.7281341552734375, 1.792388916015625, 1.8566436767578125, 1.9208984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 10.0, 8.0, 10.0, 11.0, 15.0, 16.0, 24.0, 34.0, 62.0, 94.0, 159.0, 185.0, 274.0, 500.0, 955.0, 2219.0, 6404.0, 24608.0, 146958.0, 714797.0, 119852.0, 21487.0, 5718.0, 2083.0, 843.0, 457.0, 244.0, 157.0, 113.0, 80.0, 55.0, 36.0, 21.0, 15.0, 11.0, 17.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.08807373046875, -4.9027099609375, -4.71734619140625, -4.531982421875, -4.34661865234375, -4.1612548828125, -3.97589111328125, -3.79052734375, -3.60516357421875, -3.4197998046875, -3.23443603515625, -3.049072265625, -2.86370849609375, -2.6783447265625, -2.49298095703125, -2.3076171875, -2.12225341796875, -1.9368896484375, -1.75152587890625, -1.566162109375, -1.38079833984375, -1.1954345703125, -1.01007080078125, -0.82470703125, -0.63934326171875, -0.4539794921875, -0.26861572265625, -0.083251953125, 0.10211181640625, 0.2874755859375, 0.47283935546875, 0.658203125, 0.84356689453125, 1.0289306640625, 1.21429443359375, 1.399658203125, 1.58502197265625, 1.7703857421875, 1.95574951171875, 2.14111328125, 2.32647705078125, 2.5118408203125, 2.69720458984375, 2.882568359375, 3.06793212890625, 3.2532958984375, 3.43865966796875, 3.6240234375, 3.80938720703125, 3.9947509765625, 4.18011474609375, 4.365478515625, 4.55084228515625, 4.7362060546875, 4.92156982421875, 5.10693359375, 5.29229736328125, 5.4776611328125, 5.66302490234375, 5.848388671875, 6.03375244140625, 6.2191162109375, 6.40447998046875, 6.58984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 11.0, 7.0, 3.0, 11.0, 12.0, 13.0, 11.0, 15.0, 29.0, 25.0, 39.0, 49.0, 54.0, 61.0, 67.0, 66.0, 71.0, 70.0, 60.0, 42.0, 37.0, 47.0, 33.0, 35.0, 20.0, 22.0, 24.0, 14.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.484375, -12.1336669921875, -11.782958984375, -11.4322509765625, -11.08154296875, -10.7308349609375, -10.380126953125, -10.0294189453125, -9.6787109375, -9.3280029296875, -8.977294921875, -8.6265869140625, -8.27587890625, -7.9251708984375, -7.574462890625, -7.2237548828125, -6.873046875, -6.5223388671875, -6.171630859375, -5.8209228515625, -5.47021484375, -5.1195068359375, -4.768798828125, -4.4180908203125, -4.0673828125, -3.7166748046875, -3.365966796875, -3.0152587890625, -2.66455078125, -2.3138427734375, -1.963134765625, -1.6124267578125, -1.26171875, -0.9110107421875, -0.560302734375, -0.2095947265625, 0.14111328125, 0.4918212890625, 0.842529296875, 1.1932373046875, 1.5439453125, 1.8946533203125, 2.245361328125, 2.5960693359375, 2.94677734375, 3.2974853515625, 3.648193359375, 3.9989013671875, 4.349609375, 4.7003173828125, 5.051025390625, 5.4017333984375, 5.75244140625, 6.1031494140625, 6.453857421875, 6.8045654296875, 7.1552734375, 7.5059814453125, 7.856689453125, 8.2073974609375, 8.55810546875, 8.9088134765625, 9.259521484375, 9.6102294921875, 9.9609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 11.0, 22.0, 22.0, 34.0, 51.0, 66.0, 107.0, 166.0, 290.0, 448.0, 835.0, 1458.0, 2816.0, 5856.0, 13142.0, 35510.0, 118790.0, 628696.0, 163732.0, 45449.0, 16707.0, 7122.0, 3270.0, 1654.0, 884.0, 510.0, 322.0, 185.0, 128.0, 74.0, 53.0, 33.0, 24.0, 20.0, 11.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.06640625, -2.0099639892578125, -1.953521728515625, -1.8970794677734375, -1.84063720703125, -1.7841949462890625, -1.727752685546875, -1.6713104248046875, -1.6148681640625, -1.5584259033203125, -1.501983642578125, -1.4455413818359375, -1.38909912109375, -1.3326568603515625, -1.276214599609375, -1.2197723388671875, -1.163330078125, -1.1068878173828125, -1.050445556640625, -0.9940032958984375, -0.93756103515625, -0.8811187744140625, -0.824676513671875, -0.7682342529296875, -0.7117919921875, -0.6553497314453125, -0.598907470703125, -0.5424652099609375, -0.48602294921875, -0.4295806884765625, -0.373138427734375, -0.3166961669921875, -0.26025390625, -0.2038116455078125, -0.147369384765625, -0.0909271240234375, -0.03448486328125, 0.0219573974609375, 0.078399658203125, 0.1348419189453125, 0.1912841796875, 0.2477264404296875, 0.304168701171875, 0.3606109619140625, 0.41705322265625, 0.4734954833984375, 0.529937744140625, 0.5863800048828125, 0.642822265625, 0.6992645263671875, 0.755706787109375, 0.8121490478515625, 0.86859130859375, 0.9250335693359375, 0.981475830078125, 1.0379180908203125, 1.0943603515625, 1.1508026123046875, 1.207244873046875, 1.2636871337890625, 1.32012939453125, 1.3765716552734375, 1.433013916015625, 1.4894561767578125, 1.5458984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 15.0, 13.0, 19.0, 23.0, 19.0, 29.0, 48.0, 48.0, 71.0, 110.0, 101.0, 114.0, 95.0, 64.0, 49.0, 43.0, 21.0, 30.0, 18.0, 10.0, 8.0, 9.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0007658004760742188, -0.0007460415363311768, -0.0007262825965881348, -0.0007065236568450928, -0.0006867647171020508, -0.0006670057773590088, -0.0006472468376159668, -0.0006274878978729248, -0.0006077289581298828, -0.0005879700183868408, -0.0005682110786437988, -0.0005484521389007568, -0.0005286931991577148, -0.0005089342594146729, -0.0004891753196716309, -0.00046941637992858887, -0.0004496574401855469, -0.0004298985004425049, -0.0004101395606994629, -0.0003903806209564209, -0.0003706216812133789, -0.0003508627414703369, -0.0003311038017272949, -0.00031134486198425293, -0.00029158592224121094, -0.00027182698249816895, -0.00025206804275512695, -0.00023230910301208496, -0.00021255016326904297, -0.00019279122352600098, -0.00017303228378295898, -0.000153273344039917, -0.000133514404296875, -0.00011375546455383301, -9.399652481079102e-05, -7.423758506774902e-05, -5.447864532470703e-05, -3.471970558166504e-05, -1.4960765838623047e-05, 4.798173904418945e-06, 2.4557113647460938e-05, 4.431605339050293e-05, 6.407499313354492e-05, 8.383393287658691e-05, 0.0001035928726196289, 0.0001233518123626709, 0.0001431107521057129, 0.00016286969184875488, 0.00018262863159179688, 0.00020238757133483887, 0.00022214651107788086, 0.00024190545082092285, 0.00026166439056396484, 0.00028142333030700684, 0.00030118227005004883, 0.0003209412097930908, 0.0003407001495361328, 0.0003604590892791748, 0.0003802180290222168, 0.0003999769687652588, 0.0004197359085083008, 0.0004394948482513428, 0.00045925378799438477, 0.00047901272773742676, 0.0004987716674804688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 14.0, 25.0, 47.0, 75.0, 104.0, 231.0, 373.0, 709.0, 1695.0, 4361.0, 13216.0, 51809.0, 348527.0, 550171.0, 55013.0, 14125.0, 4633.0, 1765.0, 740.0, 385.0, 226.0, 111.0, 59.0, 40.0, 26.0, 22.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.77734375, -2.695709228515625, -2.61407470703125, -2.532440185546875, -2.4508056640625, -2.369171142578125, -2.28753662109375, -2.205902099609375, -2.124267578125, -2.042633056640625, -1.96099853515625, -1.879364013671875, -1.7977294921875, -1.716094970703125, -1.63446044921875, -1.552825927734375, -1.47119140625, -1.389556884765625, -1.30792236328125, -1.226287841796875, -1.1446533203125, -1.063018798828125, -0.98138427734375, -0.899749755859375, -0.818115234375, -0.736480712890625, -0.65484619140625, -0.573211669921875, -0.4915771484375, -0.409942626953125, -0.32830810546875, -0.246673583984375, -0.1650390625, -0.083404541015625, -0.00177001953125, 0.079864501953125, 0.1614990234375, 0.243133544921875, 0.32476806640625, 0.406402587890625, 0.488037109375, 0.569671630859375, 0.65130615234375, 0.732940673828125, 0.8145751953125, 0.896209716796875, 0.97784423828125, 1.059478759765625, 1.14111328125, 1.222747802734375, 1.30438232421875, 1.386016845703125, 1.4676513671875, 1.549285888671875, 1.63092041015625, 1.712554931640625, 1.794189453125, 1.875823974609375, 1.95745849609375, 2.039093017578125, 2.1207275390625, 2.202362060546875, 2.28399658203125, 2.365631103515625, 2.447265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 11.0, 24.0, 27.0, 25.0, 34.0, 60.0, 73.0, 119.0, 102.0, 121.0, 109.0, 63.0, 48.0, 40.0, 26.0, 18.0, 15.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.586090087890625, -2.50225830078125, -2.418426513671875, -2.3345947265625, -2.250762939453125, -2.16693115234375, -2.083099365234375, -1.999267578125, -1.915435791015625, -1.83160400390625, -1.747772216796875, -1.6639404296875, -1.580108642578125, -1.49627685546875, -1.412445068359375, -1.32861328125, -1.244781494140625, -1.16094970703125, -1.077117919921875, -0.9932861328125, -0.909454345703125, -0.82562255859375, -0.741790771484375, -0.657958984375, -0.574127197265625, -0.49029541015625, -0.406463623046875, -0.3226318359375, -0.238800048828125, -0.15496826171875, -0.071136474609375, 0.0126953125, 0.096527099609375, 0.18035888671875, 0.264190673828125, 0.3480224609375, 0.431854248046875, 0.51568603515625, 0.599517822265625, 0.683349609375, 0.767181396484375, 0.85101318359375, 0.934844970703125, 1.0186767578125, 1.102508544921875, 1.18634033203125, 1.270172119140625, 1.35400390625, 1.437835693359375, 1.52166748046875, 1.605499267578125, 1.6893310546875, 1.773162841796875, 1.85699462890625, 1.940826416015625, 2.024658203125, 2.108489990234375, 2.19232177734375, 2.276153564453125, 2.3599853515625, 2.443817138671875, 2.52764892578125, 2.611480712890625, 2.6953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 14.0, 29.0, 56.0, 107.0, 235.0, 282.0, 123.0, 80.0, 23.0, 16.0, 7.0, 11.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.64256286621094, -57.44483184814453, -55.24709701538086, -53.04936599731445, -50.85163497924805, -48.653900146484375, -46.45616912841797, -44.25843811035156, -42.060707092285156, -39.86297607421875, -37.66524124145508, -35.46751022338867, -33.269779205322266, -31.072046279907227, -28.874313354492188, -26.67658233642578, -24.47884750366211, -22.28111457824707, -20.083383560180664, -17.885650634765625, -15.687918663024902, -13.49018669128418, -11.29245376586914, -9.094721794128418, -6.896989822387695, -4.699257850646973, -2.501525402069092, -0.30379295349121094, 1.8939390182495117, 4.091670989990234, 6.289403915405273, 8.487135887145996, 10.684867858886719, 12.882599830627441, 15.080331802368164, 17.278064727783203, 19.47579574584961, 21.67352867126465, 23.871261596679688, 26.068992614746094, 28.266725540161133, 30.464458465576172, 32.66218948364258, 34.85992431640625, 37.057655334472656, 39.25538635253906, 41.45311737060547, 43.65085220336914, 45.84858322143555, 48.04631423950195, 50.244049072265625, 52.44178009033203, 54.63951110839844, 56.837242126464844, 59.034976959228516, 61.23270797729492, 63.430442810058594, 65.628173828125, 67.8259048461914, 70.02363586425781, 72.22137451171875, 74.41910552978516, 76.61683654785156, 78.81456756591797, 81.01229858398438]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 7.0, 12.0, 6.0, 7.0, 11.0, 11.0, 14.0, 22.0, 34.0, 17.0, 19.0, 23.0, 40.0, 38.0, 42.0, 48.0, 69.0, 89.0, 84.0, 78.0, 45.0, 31.0, 42.0, 27.0, 29.0, 26.0, 18.0, 13.0, 15.0, 21.0, 12.0, 11.0, 8.0, 6.0, 7.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.689926147460938, -29.546859741210938, -28.403793334960938, -27.260726928710938, -26.117660522460938, -24.974594116210938, -23.831527709960938, -22.688461303710938, -21.545394897460938, -20.402328491210938, -19.259262084960938, -18.116195678710938, -16.973129272460938, -15.830062866210938, -14.686995506286621, -13.543929100036621, -12.400861740112305, -11.257795333862305, -10.114728927612305, -8.971662521362305, -7.8285956382751465, -6.6855292320251465, -5.542462348937988, -4.399395942687988, -3.2563295364379883, -2.1132631301879883, -0.9701964855194092, 0.17287015914916992, 1.31593656539917, 2.45900297164917, 3.602069854736328, 4.745136260986328, 5.888202667236328, 7.031269073486328, 8.174335479736328, 9.317401885986328, 10.460468292236328, 11.603534698486328, 12.746602058410645, 13.889668464660645, 15.032734870910645, 16.17580223083496, 17.31886863708496, 18.46193504333496, 19.60500144958496, 20.74806785583496, 21.89113426208496, 23.03420066833496, 24.17726707458496, 25.32033348083496, 26.46339988708496, 27.60646629333496, 28.74953269958496, 29.89259910583496, 31.035667419433594, 32.178733825683594, 33.321800231933594, 34.464866638183594, 35.607933044433594, 36.750999450683594, 37.894065856933594, 39.037132263183594, 40.180198669433594, 41.323265075683594, 42.466331481933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 12.0, 15.0, 35.0, 53.0, 71.0, 119.0, 217.0, 345.0, 646.0, 1125.0, 2118.0, 4211.0, 8771.0, 20424.0, 54142.0, 180406.0, 809558.0, 2186837.0, 681986.0, 158836.0, 48650.0, 18778.0, 8297.0, 4048.0, 2050.0, 1055.0, 604.0, 337.0, 213.0, 112.0, 74.0, 42.0, 28.0, 16.0, 9.0, 9.0, 9.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.216339111328125, -3.12017822265625, -3.024017333984375, -2.9278564453125, -2.831695556640625, -2.73553466796875, -2.639373779296875, -2.543212890625, -2.447052001953125, -2.35089111328125, -2.254730224609375, -2.1585693359375, -2.062408447265625, -1.96624755859375, -1.870086669921875, -1.77392578125, -1.677764892578125, -1.58160400390625, -1.485443115234375, -1.3892822265625, -1.293121337890625, -1.19696044921875, -1.100799560546875, -1.004638671875, -0.908477783203125, -0.81231689453125, -0.716156005859375, -0.6199951171875, -0.523834228515625, -0.42767333984375, -0.331512451171875, -0.2353515625, -0.139190673828125, -0.04302978515625, 0.053131103515625, 0.1492919921875, 0.245452880859375, 0.34161376953125, 0.437774658203125, 0.533935546875, 0.630096435546875, 0.72625732421875, 0.822418212890625, 0.9185791015625, 1.014739990234375, 1.11090087890625, 1.207061767578125, 1.30322265625, 1.399383544921875, 1.49554443359375, 1.591705322265625, 1.6878662109375, 1.784027099609375, 1.88018798828125, 1.976348876953125, 2.072509765625, 2.168670654296875, 2.26483154296875, 2.360992431640625, 2.4571533203125, 2.553314208984375, 2.64947509765625, 2.745635986328125, 2.841796875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 14.0, 20.0, 16.0, 12.0, 20.0, 27.0, 31.0, 44.0, 36.0, 42.0, 44.0, 49.0, 50.0, 48.0, 59.0, 43.0, 52.0, 39.0, 41.0, 42.0, 28.0, 32.0, 23.0, 34.0, 23.0, 19.0, 16.0, 11.0, 14.0, 9.0, 11.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.578125, -2.5, -2.421875, -2.34375, -2.265625, -2.1875, -2.109375, -2.03125, -1.953125, -1.875, -1.796875, -1.71875, -1.640625, -1.5625, -1.484375, -1.40625, -1.328125, -1.25, -1.171875, -1.09375, -1.015625, -0.9375, -0.859375, -0.78125, -0.703125, -0.625, -0.546875, -0.46875, -0.390625, -0.3125, -0.234375, -0.15625, -0.078125, 0.0, 0.078125, 0.15625, 0.234375, 0.3125, 0.390625, 0.46875, 0.546875, 0.625, 0.703125, 0.78125, 0.859375, 0.9375, 1.015625, 1.09375, 1.171875, 1.25, 1.328125, 1.40625, 1.484375, 1.5625, 1.640625, 1.71875, 1.796875, 1.875, 1.953125, 2.03125, 2.109375, 2.1875, 2.265625, 2.34375, 2.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 16.0, 18.0, 17.0, 15.0, 38.0, 68.0, 104.0, 179.0, 521.0, 1488.0, 5562.0, 33388.0, 620613.0, 3393410.0, 121047.0, 13278.0, 2921.0, 898.0, 302.0, 155.0, 78.0, 59.0, 24.0, 20.0, 12.0, 15.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.61248779296875, -7.3226318359375, -7.03277587890625, -6.742919921875, -6.45306396484375, -6.1632080078125, -5.87335205078125, -5.58349609375, -5.29364013671875, -5.0037841796875, -4.71392822265625, -4.424072265625, -4.13421630859375, -3.8443603515625, -3.55450439453125, -3.2646484375, -2.97479248046875, -2.6849365234375, -2.39508056640625, -2.105224609375, -1.81536865234375, -1.5255126953125, -1.23565673828125, -0.94580078125, -0.65594482421875, -0.3660888671875, -0.07623291015625, 0.213623046875, 0.50347900390625, 0.7933349609375, 1.08319091796875, 1.373046875, 1.66290283203125, 1.9527587890625, 2.24261474609375, 2.532470703125, 2.82232666015625, 3.1121826171875, 3.40203857421875, 3.69189453125, 3.98175048828125, 4.2716064453125, 4.56146240234375, 4.851318359375, 5.14117431640625, 5.4310302734375, 5.72088623046875, 6.0107421875, 6.30059814453125, 6.5904541015625, 6.88031005859375, 7.170166015625, 7.46002197265625, 7.7498779296875, 8.03973388671875, 8.32958984375, 8.61944580078125, 8.9093017578125, 9.19915771484375, 9.489013671875, 9.77886962890625, 10.0687255859375, 10.35858154296875, 10.6484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 3.0, 7.0, 4.0, 12.0, 16.0, 14.0, 24.0, 30.0, 47.0, 84.0, 111.0, 150.0, 215.0, 340.0, 566.0, 671.0, 622.0, 395.0, 236.0, 154.0, 119.0, 67.0, 52.0, 31.0, 25.0, 16.0, 16.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.875, -5.6768798828125, -5.478759765625, -5.2806396484375, -5.08251953125, -4.8843994140625, -4.686279296875, -4.4881591796875, -4.2900390625, -4.0919189453125, -3.893798828125, -3.6956787109375, -3.49755859375, -3.2994384765625, -3.101318359375, -2.9031982421875, -2.705078125, -2.5069580078125, -2.308837890625, -2.1107177734375, -1.91259765625, -1.7144775390625, -1.516357421875, -1.3182373046875, -1.1201171875, -0.9219970703125, -0.723876953125, -0.5257568359375, -0.32763671875, -0.1295166015625, 0.068603515625, 0.2667236328125, 0.46484375, 0.6629638671875, 0.861083984375, 1.0592041015625, 1.25732421875, 1.4554443359375, 1.653564453125, 1.8516845703125, 2.0498046875, 2.2479248046875, 2.446044921875, 2.6441650390625, 2.84228515625, 3.0404052734375, 3.238525390625, 3.4366455078125, 3.634765625, 3.8328857421875, 4.031005859375, 4.2291259765625, 4.42724609375, 4.6253662109375, 4.823486328125, 5.0216064453125, 5.2197265625, 5.4178466796875, 5.615966796875, 5.8140869140625, 6.01220703125, 6.2103271484375, 6.408447265625, 6.6065673828125, 6.8046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 12.0, 51.0, 141.0, 352.0, 281.0, 109.0, 35.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-214.80784606933594, -210.74838256835938, -206.6889190673828, -202.62945556640625, -198.5699920654297, -194.51052856445312, -190.45106506347656, -186.3916015625, -182.3321533203125, -178.27268981933594, -174.21322631835938, -170.1537628173828, -166.09429931640625, -162.0348358154297, -157.97537231445312, -153.91592407226562, -149.8564453125, -145.79698181152344, -141.73751831054688, -137.6780548095703, -133.61859130859375, -129.5591278076172, -125.49967193603516, -121.4402084350586, -117.38074493408203, -113.32128143310547, -109.2618179321289, -105.20235443115234, -101.14289855957031, -97.08343505859375, -93.02397155761719, -88.96450805664062, -84.905029296875, -80.84556579589844, -76.78610229492188, -72.72663879394531, -68.66717529296875, -64.60771179199219, -60.548255920410156, -56.488792419433594, -52.42932891845703, -48.36986541748047, -44.310401916503906, -40.25094223022461, -36.19147872924805, -32.132015228271484, -28.072553634643555, -24.013092041015625, -19.953628540039062, -15.894165992736816, -11.83470344543457, -7.775240898132324, -3.715778350830078, 0.3436851501464844, 4.403146743774414, 8.462608337402344, 12.522071838378906, 16.58153533935547, 20.6409969329834, 24.700458526611328, 28.75992202758789, 32.81938552856445, 36.87884521484375, 40.93830871582031, 44.997772216796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 19.0, 13.0, 30.0, 23.0, 26.0, 30.0, 29.0, 36.0, 41.0, 49.0, 55.0, 45.0, 53.0, 50.0, 63.0, 41.0, 45.0, 41.0, 39.0, 39.0, 30.0, 33.0, 27.0, 18.0, 18.0, 20.0, 17.0, 16.0, 12.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.557758331298828, -28.66191864013672, -27.76607894897461, -26.8702392578125, -25.974401473999023, -25.078561782836914, -24.182722091674805, -23.286882400512695, -22.39104461669922, -21.49520492553711, -20.599365234375, -19.70352554321289, -18.807687759399414, -17.911848068237305, -17.016008377075195, -16.120168685913086, -15.224328994750977, -14.328489303588867, -13.432650566101074, -12.536810874938965, -11.640972137451172, -10.745132446289062, -9.849292755126953, -8.953453063964844, -8.05761432647705, -7.1617751121521, -6.265935897827148, -5.370096206665039, -4.474256992340088, -3.5784177780151367, -2.6825780868530273, -1.7867388725280762, -0.8908977508544922, 0.004941582679748535, 0.9007809162139893, 1.7966203689575195, 2.6924595832824707, 3.588298797607422, 4.484138488769531, 5.379977703094482, 6.275816917419434, 7.171656131744385, 8.067495346069336, 8.963335037231445, 9.859174728393555, 10.755013465881348, 11.650853157043457, 12.54669189453125, 13.44253158569336, 14.338371276855469, 15.234210014343262, 16.130050659179688, 17.025888442993164, 17.921728134155273, 18.817567825317383, 19.713407516479492, 20.60924530029297, 21.505084991455078, 22.400924682617188, 23.296764373779297, 24.192602157592773, 25.088441848754883, 25.984281539916992, 26.8801212310791, 27.77596092224121]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 13.0, 23.0, 28.0, 31.0, 59.0, 90.0, 139.0, 202.0, 299.0, 549.0, 1029.0, 2002.0, 4312.0, 10166.0, 26421.0, 80029.0, 284324.0, 430535.0, 138528.0, 42209.0, 15347.0, 6234.0, 2765.0, 1338.0, 750.0, 416.0, 240.0, 147.0, 105.0, 60.0, 41.0, 39.0, 22.0, 15.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.0911865234375, -3.955810546875, -3.8204345703125, -3.68505859375, -3.5496826171875, -3.414306640625, -3.2789306640625, -3.1435546875, -3.0081787109375, -2.872802734375, -2.7374267578125, -2.60205078125, -2.4666748046875, -2.331298828125, -2.1959228515625, -2.060546875, -1.9251708984375, -1.789794921875, -1.6544189453125, -1.51904296875, -1.3836669921875, -1.248291015625, -1.1129150390625, -0.9775390625, -0.8421630859375, -0.706787109375, -0.5714111328125, -0.43603515625, -0.3006591796875, -0.165283203125, -0.0299072265625, 0.10546875, 0.2408447265625, 0.376220703125, 0.5115966796875, 0.64697265625, 0.7823486328125, 0.917724609375, 1.0531005859375, 1.1884765625, 1.3238525390625, 1.459228515625, 1.5946044921875, 1.72998046875, 1.8653564453125, 2.000732421875, 2.1361083984375, 2.271484375, 2.4068603515625, 2.542236328125, 2.6776123046875, 2.81298828125, 2.9483642578125, 3.083740234375, 3.2191162109375, 3.3544921875, 3.4898681640625, 3.625244140625, 3.7606201171875, 3.89599609375, 4.0313720703125, 4.166748046875, 4.3021240234375, 4.4375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 7.0, 10.0, 4.0, 8.0, 19.0, 22.0, 16.0, 18.0, 25.0, 23.0, 35.0, 31.0, 41.0, 42.0, 42.0, 51.0, 37.0, 34.0, 37.0, 41.0, 59.0, 45.0, 44.0, 34.0, 26.0, 37.0, 38.0, 23.0, 21.0, 21.0, 13.0, 15.0, 10.0, 14.0, 5.0, 10.0, 7.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.89453125, -2.81591796875, -2.7373046875, -2.65869140625, -2.580078125, -2.50146484375, -2.4228515625, -2.34423828125, -2.265625, -2.18701171875, -2.1083984375, -2.02978515625, -1.951171875, -1.87255859375, -1.7939453125, -1.71533203125, -1.63671875, -1.55810546875, -1.4794921875, -1.40087890625, -1.322265625, -1.24365234375, -1.1650390625, -1.08642578125, -1.0078125, -0.92919921875, -0.8505859375, -0.77197265625, -0.693359375, -0.61474609375, -0.5361328125, -0.45751953125, -0.37890625, -0.30029296875, -0.2216796875, -0.14306640625, -0.064453125, 0.01416015625, 0.0927734375, 0.17138671875, 0.25, 0.32861328125, 0.4072265625, 0.48583984375, 0.564453125, 0.64306640625, 0.7216796875, 0.80029296875, 0.87890625, 0.95751953125, 1.0361328125, 1.11474609375, 1.193359375, 1.27197265625, 1.3505859375, 1.42919921875, 1.5078125, 1.58642578125, 1.6650390625, 1.74365234375, 1.822265625, 1.90087890625, 1.9794921875, 2.05810546875, 2.13671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 17.0, 15.0, 25.0, 32.0, 43.0, 53.0, 79.0, 108.0, 144.0, 287.0, 431.0, 816.0, 1663.0, 3653.0, 10252.0, 39513.0, 246470.0, 659117.0, 62408.0, 14197.0, 4684.0, 2023.0, 1001.0, 532.0, 327.0, 193.0, 126.0, 96.0, 57.0, 37.0, 32.0, 24.0, 13.0, 16.0, 18.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.34600830078125, -5.1490478515625, -4.95208740234375, -4.755126953125, -4.55816650390625, -4.3612060546875, -4.16424560546875, -3.96728515625, -3.77032470703125, -3.5733642578125, -3.37640380859375, -3.179443359375, -2.98248291015625, -2.7855224609375, -2.58856201171875, -2.3916015625, -2.19464111328125, -1.9976806640625, -1.80072021484375, -1.603759765625, -1.40679931640625, -1.2098388671875, -1.01287841796875, -0.81591796875, -0.61895751953125, -0.4219970703125, -0.22503662109375, -0.028076171875, 0.16888427734375, 0.3658447265625, 0.56280517578125, 0.759765625, 0.95672607421875, 1.1536865234375, 1.35064697265625, 1.547607421875, 1.74456787109375, 1.9415283203125, 2.13848876953125, 2.33544921875, 2.53240966796875, 2.7293701171875, 2.92633056640625, 3.123291015625, 3.32025146484375, 3.5172119140625, 3.71417236328125, 3.9111328125, 4.10809326171875, 4.3050537109375, 4.50201416015625, 4.698974609375, 4.89593505859375, 5.0928955078125, 5.28985595703125, 5.48681640625, 5.68377685546875, 5.8807373046875, 6.07769775390625, 6.274658203125, 6.47161865234375, 6.6685791015625, 6.86553955078125, 7.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 7.0, 5.0, 15.0, 16.0, 17.0, 20.0, 18.0, 33.0, 31.0, 33.0, 41.0, 55.0, 55.0, 59.0, 69.0, 53.0, 77.0, 53.0, 49.0, 48.0, 44.0, 29.0, 32.0, 21.0, 24.0, 14.0, 10.0, 8.0, 14.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.19482421875, -8.8427734375, -8.49072265625, -8.138671875, -7.78662109375, -7.4345703125, -7.08251953125, -6.73046875, -6.37841796875, -6.0263671875, -5.67431640625, -5.322265625, -4.97021484375, -4.6181640625, -4.26611328125, -3.9140625, -3.56201171875, -3.2099609375, -2.85791015625, -2.505859375, -2.15380859375, -1.8017578125, -1.44970703125, -1.09765625, -0.74560546875, -0.3935546875, -0.04150390625, 0.310546875, 0.66259765625, 1.0146484375, 1.36669921875, 1.71875, 2.07080078125, 2.4228515625, 2.77490234375, 3.126953125, 3.47900390625, 3.8310546875, 4.18310546875, 4.53515625, 4.88720703125, 5.2392578125, 5.59130859375, 5.943359375, 6.29541015625, 6.6474609375, 6.99951171875, 7.3515625, 7.70361328125, 8.0556640625, 8.40771484375, 8.759765625, 9.11181640625, 9.4638671875, 9.81591796875, 10.16796875, 10.52001953125, 10.8720703125, 11.22412109375, 11.576171875, 11.92822265625, 12.2802734375, 12.63232421875, 12.984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 14.0, 12.0, 36.0, 46.0, 66.0, 89.0, 168.0, 346.0, 566.0, 1207.0, 2600.0, 6432.0, 18254.0, 61884.0, 370304.0, 493532.0, 62310.0, 18709.0, 6587.0, 2683.0, 1277.0, 599.0, 349.0, 193.0, 100.0, 46.0, 36.0, 27.0, 22.0, 11.0, 13.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.589599609375, -1.53662109375, -1.483642578125, -1.4306640625, -1.377685546875, -1.32470703125, -1.271728515625, -1.21875, -1.165771484375, -1.11279296875, -1.059814453125, -1.0068359375, -0.953857421875, -0.90087890625, -0.847900390625, -0.794921875, -0.741943359375, -0.68896484375, -0.635986328125, -0.5830078125, -0.530029296875, -0.47705078125, -0.424072265625, -0.37109375, -0.318115234375, -0.26513671875, -0.212158203125, -0.1591796875, -0.106201171875, -0.05322265625, -0.000244140625, 0.052734375, 0.105712890625, 0.15869140625, 0.211669921875, 0.2646484375, 0.317626953125, 0.37060546875, 0.423583984375, 0.4765625, 0.529541015625, 0.58251953125, 0.635498046875, 0.6884765625, 0.741455078125, 0.79443359375, 0.847412109375, 0.900390625, 0.953369140625, 1.00634765625, 1.059326171875, 1.1123046875, 1.165283203125, 1.21826171875, 1.271240234375, 1.32421875, 1.377197265625, 1.43017578125, 1.483154296875, 1.5361328125, 1.589111328125, 1.64208984375, 1.695068359375, 1.748046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 6.0, 0.0, 7.0, 5.0, 8.0, 12.0, 11.0, 15.0, 21.0, 29.0, 49.0, 64.0, 92.0, 130.0, 152.0, 108.0, 69.0, 62.0, 40.0, 27.0, 23.0, 16.0, 10.0, 11.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006480216979980469, -0.0006274133920669556, -0.0006068050861358643, -0.000586196780204773, -0.0005655884742736816, -0.0005449801683425903, -0.000524371862411499, -0.0005037635564804077, -0.0004831552505493164, -0.0004625469446182251, -0.0004419386386871338, -0.0004213303327560425, -0.00040072202682495117, -0.00038011372089385986, -0.00035950541496276855, -0.00033889710903167725, -0.00031828880310058594, -0.00029768049716949463, -0.0002770721912384033, -0.000256463885307312, -0.0002358555793762207, -0.0002152472734451294, -0.00019463896751403809, -0.00017403066158294678, -0.00015342235565185547, -0.00013281404972076416, -0.00011220574378967285, -9.159743785858154e-05, -7.098913192749023e-05, -5.0380825996398926e-05, -2.9772520065307617e-05, -9.164214134216309e-06, 1.1444091796875e-05, 3.205239772796631e-05, 5.266070365905762e-05, 7.326900959014893e-05, 9.387731552124023e-05, 0.00011448562145233154, 0.00013509392738342285, 0.00015570223331451416, 0.00017631053924560547, 0.00019691884517669678, 0.00021752715110778809, 0.0002381354570388794, 0.0002587437629699707, 0.000279352068901062, 0.0002999603748321533, 0.00032056868076324463, 0.00034117698669433594, 0.00036178529262542725, 0.00038239359855651855, 0.00040300190448760986, 0.00042361021041870117, 0.0004442185163497925, 0.0004648268222808838, 0.0004854351282119751, 0.0005060434341430664, 0.0005266517400741577, 0.000547260046005249, 0.0005678683519363403, 0.0005884766578674316, 0.000609084963798523, 0.0006296932697296143, 0.0006503015756607056, 0.0006709098815917969]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 9.0, 20.0, 27.0, 22.0, 36.0, 78.0, 107.0, 179.0, 264.0, 547.0, 1066.0, 2074.0, 4906.0, 12711.0, 37768.0, 126861.0, 644505.0, 149617.0, 43105.0, 14356.0, 5466.0, 2368.0, 1095.0, 531.0, 318.0, 192.0, 112.0, 70.0, 43.0, 33.0, 21.0, 19.0, 4.0, 10.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.6943359375, -1.6453094482421875, -1.596282958984375, -1.5472564697265625, -1.49822998046875, -1.4492034912109375, -1.400177001953125, -1.3511505126953125, -1.3021240234375, -1.2530975341796875, -1.204071044921875, -1.1550445556640625, -1.10601806640625, -1.0569915771484375, -1.007965087890625, -0.9589385986328125, -0.909912109375, -0.8608856201171875, -0.811859130859375, -0.7628326416015625, -0.71380615234375, -0.6647796630859375, -0.615753173828125, -0.5667266845703125, -0.5177001953125, -0.4686737060546875, -0.419647216796875, -0.3706207275390625, -0.32159423828125, -0.2725677490234375, -0.223541259765625, -0.1745147705078125, -0.12548828125, -0.0764617919921875, -0.027435302734375, 0.0215911865234375, 0.07061767578125, 0.1196441650390625, 0.168670654296875, 0.2176971435546875, 0.2667236328125, 0.3157501220703125, 0.364776611328125, 0.4138031005859375, 0.46282958984375, 0.5118560791015625, 0.560882568359375, 0.6099090576171875, 0.658935546875, 0.7079620361328125, 0.756988525390625, 0.8060150146484375, 0.85504150390625, 0.9040679931640625, 0.953094482421875, 1.0021209716796875, 1.0511474609375, 1.1001739501953125, 1.149200439453125, 1.1982269287109375, 1.24725341796875, 1.2962799072265625, 1.345306396484375, 1.3943328857421875, 1.443359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 15.0, 9.0, 17.0, 13.0, 21.0, 21.0, 34.0, 34.0, 39.0, 36.0, 53.0, 83.0, 81.0, 58.0, 83.0, 47.0, 46.0, 48.0, 39.0, 35.0, 29.0, 21.0, 23.0, 13.0, 16.0, 9.0, 13.0, 11.0, 6.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.826171875, -1.775390625, -1.724609375, -1.673828125, -1.623046875, -1.572265625, -1.521484375, -1.470703125, -1.419921875, -1.369140625, -1.318359375, -1.267578125, -1.216796875, -1.166015625, -1.115234375, -1.064453125, -1.013671875, -0.962890625, -0.912109375, -0.861328125, -0.810546875, -0.759765625, -0.708984375, -0.658203125, -0.607421875, -0.556640625, -0.505859375, -0.455078125, -0.404296875, -0.353515625, -0.302734375, -0.251953125, -0.201171875, -0.150390625, -0.099609375, -0.048828125, 0.001953125, 0.052734375, 0.103515625, 0.154296875, 0.205078125, 0.255859375, 0.306640625, 0.357421875, 0.408203125, 0.458984375, 0.509765625, 0.560546875, 0.611328125, 0.662109375, 0.712890625, 0.763671875, 0.814453125, 0.865234375, 0.916015625, 0.966796875, 1.017578125, 1.068359375, 1.119140625, 1.169921875, 1.220703125, 1.271484375, 1.322265625, 1.373046875, 1.423828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 10.0, 24.0, 27.0, 44.0, 70.0, 106.0, 210.0, 201.0, 92.0, 63.0, 45.0, 23.0, 18.0, 9.0, 5.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.154144287109375, -24.8507137298584, -23.547283172607422, -22.243852615356445, -20.94042205810547, -19.636993408203125, -18.33356285095215, -17.030132293701172, -15.726701736450195, -14.423271179199219, -13.119840621948242, -11.816411018371582, -10.512980461120605, -9.209549903869629, -7.9061198234558105, -6.602689743041992, -5.299259185791016, -3.995828866958618, -2.6923985481262207, -1.3889682292938232, -0.08553791046142578, 1.2178926467895508, 2.521322727203369, 3.8247528076171875, 5.128183364868164, 6.431613922119141, 7.735044002532959, 9.038474082946777, 10.341904640197754, 11.64533519744873, 12.94876480102539, 14.252195358276367, 15.555625915527344, 16.85905647277832, 18.162487030029297, 19.465917587280273, 20.76934814453125, 22.072776794433594, 23.37620735168457, 24.679637908935547, 25.983068466186523, 27.2864990234375, 28.589929580688477, 29.893360137939453, 31.196788787841797, 32.500221252441406, 33.80364990234375, 35.107078552246094, 36.4105110168457, 37.71393966674805, 39.017372131347656, 40.32080078125, 41.62423324584961, 42.92766189575195, 44.23109436035156, 45.534523010253906, 46.83795166015625, 48.141380310058594, 49.4448127746582, 50.74824142456055, 52.051673889160156, 53.3551025390625, 54.65853500366211, 55.96196365356445, 57.26539611816406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 8.0, 15.0, 16.0, 19.0, 23.0, 16.0, 17.0, 17.0, 25.0, 33.0, 29.0, 35.0, 59.0, 95.0, 143.0, 87.0, 60.0, 49.0, 25.0, 28.0, 24.0, 25.0, 22.0, 15.0, 11.0, 8.0, 5.0, 10.0, 4.0, 13.0, 6.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0], "bins": [-46.954917907714844, -45.70467758178711, -44.454437255859375, -43.20419692993164, -41.953956604003906, -40.70371627807617, -39.45347595214844, -38.2032356262207, -36.95299530029297, -35.702754974365234, -34.4525146484375, -33.202274322509766, -31.95203399658203, -30.701793670654297, -29.451553344726562, -28.201313018798828, -26.951072692871094, -25.70083236694336, -24.450592041015625, -23.20035171508789, -21.950111389160156, -20.699871063232422, -19.449630737304688, -18.199390411376953, -16.94915008544922, -15.698909759521484, -14.44866943359375, -13.198429107666016, -11.948188781738281, -10.697948455810547, -9.447708129882812, -8.197467803955078, -6.947227478027344, -5.696987152099609, -4.446746826171875, -3.1965065002441406, -1.9462661743164062, -0.6960258483886719, 0.5542144775390625, 1.8044548034667969, 3.0546951293945312, 4.304935455322266, 5.55517578125, 6.805416107177734, 8.055656433105469, 9.305896759033203, 10.556137084960938, 11.806377410888672, 13.056617736816406, 14.30685806274414, 15.557098388671875, 16.80733871459961, 18.057579040527344, 19.307819366455078, 20.558059692382812, 21.808300018310547, 23.05854034423828, 24.308780670166016, 25.55902099609375, 26.809261322021484, 28.05950164794922, 29.309741973876953, 30.559982299804688, 31.810222625732422, 33.060462951660156]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 18.0, 20.0, 21.0, 36.0, 60.0, 99.0, 144.0, 252.0, 459.0, 748.0, 1301.0, 2397.0, 4535.0, 9537.0, 21482.0, 53730.0, 160585.0, 550772.0, 1627078.0, 1212423.0, 366627.0, 110837.0, 39281.0, 15966.0, 7531.0, 3665.0, 1932.0, 1119.0, 639.0, 374.0, 229.0, 131.0, 88.0, 47.0, 46.0, 16.0, 18.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.705078125, -3.580902099609375, -3.45672607421875, -3.332550048828125, -3.2083740234375, -3.084197998046875, -2.96002197265625, -2.835845947265625, -2.711669921875, -2.587493896484375, -2.46331787109375, -2.339141845703125, -2.2149658203125, -2.090789794921875, -1.96661376953125, -1.842437744140625, -1.71826171875, -1.594085693359375, -1.46990966796875, -1.345733642578125, -1.2215576171875, -1.097381591796875, -0.97320556640625, -0.849029541015625, -0.724853515625, -0.600677490234375, -0.47650146484375, -0.352325439453125, -0.2281494140625, -0.103973388671875, 0.02020263671875, 0.144378662109375, 0.2685546875, 0.392730712890625, 0.51690673828125, 0.641082763671875, 0.7652587890625, 0.889434814453125, 1.01361083984375, 1.137786865234375, 1.261962890625, 1.386138916015625, 1.51031494140625, 1.634490966796875, 1.7586669921875, 1.882843017578125, 2.00701904296875, 2.131195068359375, 2.25537109375, 2.379547119140625, 2.50372314453125, 2.627899169921875, 2.7520751953125, 2.876251220703125, 3.00042724609375, 3.124603271484375, 3.248779296875, 3.372955322265625, 3.49713134765625, 3.621307373046875, 3.7454833984375, 3.869659423828125, 3.99383544921875, 4.118011474609375, 4.2421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 6.0, 6.0, 7.0, 8.0, 18.0, 8.0, 18.0, 16.0, 22.0, 22.0, 24.0, 29.0, 31.0, 40.0, 35.0, 29.0, 39.0, 38.0, 50.0, 45.0, 40.0, 48.0, 43.0, 32.0, 37.0, 32.0, 43.0, 36.0, 33.0, 30.0, 24.0, 10.0, 20.0, 16.0, 13.0, 8.0, 10.0, 8.0, 5.0, 3.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.5546875, -2.48236083984375, -2.4100341796875, -2.33770751953125, -2.265380859375, -2.19305419921875, -2.1207275390625, -2.04840087890625, -1.97607421875, -1.90374755859375, -1.8314208984375, -1.75909423828125, -1.686767578125, -1.61444091796875, -1.5421142578125, -1.46978759765625, -1.3974609375, -1.32513427734375, -1.2528076171875, -1.18048095703125, -1.108154296875, -1.03582763671875, -0.9635009765625, -0.89117431640625, -0.81884765625, -0.74652099609375, -0.6741943359375, -0.60186767578125, -0.529541015625, -0.45721435546875, -0.3848876953125, -0.31256103515625, -0.240234375, -0.16790771484375, -0.0955810546875, -0.02325439453125, 0.049072265625, 0.12139892578125, 0.1937255859375, 0.26605224609375, 0.33837890625, 0.41070556640625, 0.4830322265625, 0.55535888671875, 0.627685546875, 0.70001220703125, 0.7723388671875, 0.84466552734375, 0.9169921875, 0.98931884765625, 1.0616455078125, 1.13397216796875, 1.206298828125, 1.27862548828125, 1.3509521484375, 1.42327880859375, 1.49560546875, 1.56793212890625, 1.6402587890625, 1.71258544921875, 1.784912109375, 1.85723876953125, 1.9295654296875, 2.00189208984375, 2.07421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 4.0, 8.0, 14.0, 26.0, 31.0, 45.0, 95.0, 156.0, 287.0, 571.0, 1484.0, 7358.0, 194405.0, 3933135.0, 50492.0, 4177.0, 1018.0, 387.0, 237.0, 124.0, 75.0, 49.0, 31.0, 19.0, 14.0, 9.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-28.609375, -27.91748046875, -27.2255859375, -26.53369140625, -25.841796875, -25.14990234375, -24.4580078125, -23.76611328125, -23.07421875, -22.38232421875, -21.6904296875, -20.99853515625, -20.306640625, -19.61474609375, -18.9228515625, -18.23095703125, -17.5390625, -16.84716796875, -16.1552734375, -15.46337890625, -14.771484375, -14.07958984375, -13.3876953125, -12.69580078125, -12.00390625, -11.31201171875, -10.6201171875, -9.92822265625, -9.236328125, -8.54443359375, -7.8525390625, -7.16064453125, -6.46875, -5.77685546875, -5.0849609375, -4.39306640625, -3.701171875, -3.00927734375, -2.3173828125, -1.62548828125, -0.93359375, -0.24169921875, 0.4501953125, 1.14208984375, 1.833984375, 2.52587890625, 3.2177734375, 3.90966796875, 4.6015625, 5.29345703125, 5.9853515625, 6.67724609375, 7.369140625, 8.06103515625, 8.7529296875, 9.44482421875, 10.13671875, 10.82861328125, 11.5205078125, 12.21240234375, 12.904296875, 13.59619140625, 14.2880859375, 14.97998046875, 15.671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 5.0, 9.0, 10.0, 10.0, 24.0, 27.0, 43.0, 37.0, 63.0, 77.0, 106.0, 153.0, 201.0, 286.0, 323.0, 480.0, 476.0, 411.0, 349.0, 240.0, 181.0, 139.0, 100.0, 94.0, 58.0, 40.0, 26.0, 26.0, 14.0, 15.0, 9.0, 4.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -6.99298095703125, -6.7476806640625, -6.50238037109375, -6.257080078125, -6.01177978515625, -5.7664794921875, -5.52117919921875, -5.27587890625, -5.03057861328125, -4.7852783203125, -4.53997802734375, -4.294677734375, -4.04937744140625, -3.8040771484375, -3.55877685546875, -3.3134765625, -3.06817626953125, -2.8228759765625, -2.57757568359375, -2.332275390625, -2.08697509765625, -1.8416748046875, -1.59637451171875, -1.35107421875, -1.10577392578125, -0.8604736328125, -0.61517333984375, -0.369873046875, -0.12457275390625, 0.1207275390625, 0.36602783203125, 0.611328125, 0.85662841796875, 1.1019287109375, 1.34722900390625, 1.592529296875, 1.83782958984375, 2.0831298828125, 2.32843017578125, 2.57373046875, 2.81903076171875, 3.0643310546875, 3.30963134765625, 3.554931640625, 3.80023193359375, 4.0455322265625, 4.29083251953125, 4.5361328125, 4.78143310546875, 5.0267333984375, 5.27203369140625, 5.517333984375, 5.76263427734375, 6.0079345703125, 6.25323486328125, 6.49853515625, 6.74383544921875, 6.9891357421875, 7.23443603515625, 7.479736328125, 7.72503662109375, 7.9703369140625, 8.21563720703125, 8.4609375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 11.0, 20.0, 17.0, 28.0, 43.0, 73.0, 111.0, 150.0, 174.0, 125.0, 92.0, 44.0, 38.0, 19.0, 11.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.85687255859375, -117.5990219116211, -114.34117126464844, -111.08331298828125, -107.8254623413086, -104.56761169433594, -101.30976104736328, -98.05191040039062, -94.79405212402344, -91.53620147705078, -88.27835083007812, -85.02049255371094, -81.76264190673828, -78.50479125976562, -75.24694061279297, -71.98908996582031, -68.73123931884766, -65.473388671875, -62.21553421020508, -58.95768356323242, -55.6998291015625, -52.441978454589844, -49.18412780761719, -45.92627716064453, -42.66842269897461, -39.41057205200195, -36.15271759033203, -32.894866943359375, -29.637014389038086, -26.379161834716797, -23.12131118774414, -19.86345863342285, -16.605613708496094, -13.347761154174805, -10.089909553527832, -6.832057952880859, -3.5742053985595703, -0.31635284423828125, 2.941497802734375, 6.199350357055664, 9.457202911376953, 12.715055465698242, 15.972907066345215, 19.230758666992188, 22.488611221313477, 25.746463775634766, 29.004314422607422, 32.262168884277344, 35.52001953125, 38.777870178222656, 42.03572463989258, 45.293575286865234, 48.551429748535156, 51.80928039550781, 55.06713104248047, 58.324981689453125, 61.58283615112305, 64.84069061279297, 68.09854125976562, 71.35639190673828, 74.61424255371094, 77.87210083007812, 81.12994384765625, 84.38780212402344, 87.6456527709961]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 10.0, 13.0, 10.0, 6.0, 15.0, 14.0, 16.0, 25.0, 28.0, 26.0, 22.0, 33.0, 44.0, 31.0, 45.0, 40.0, 55.0, 53.0, 59.0, 53.0, 50.0, 30.0, 40.0, 35.0, 28.0, 41.0, 27.0, 24.0, 25.0, 19.0, 19.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.165245056152344, -39.78171157836914, -38.39817810058594, -37.01464080810547, -35.631107330322266, -34.24757385253906, -32.86404037475586, -31.480506896972656, -30.09697151184082, -28.713438034057617, -27.32990264892578, -25.946369171142578, -24.562835693359375, -23.17930030822754, -21.795766830444336, -20.4122314453125, -19.028697967529297, -17.645164489746094, -16.261629104614258, -14.878095626831055, -13.494561195373535, -12.111026763916016, -10.727493286132812, -9.343958854675293, -7.960424423217773, -6.576889991760254, -5.193356037139893, -3.8098220825195312, -2.4262876510620117, -1.0427532196044922, 0.34078025817871094, 1.7243146896362305, 3.10784912109375, 4.4913835525512695, 5.874917507171631, 7.258451461791992, 8.641985893249512, 10.025520324707031, 11.409053802490234, 12.792588233947754, 14.176122665405273, 15.559657096862793, 16.943191528320312, 18.326725006103516, 19.71025848388672, 21.093793869018555, 22.477327346801758, 23.860862731933594, 25.244396209716797, 26.6279296875, 28.011465072631836, 29.39499855041504, 30.778533935546875, 32.16206741333008, 33.54560089111328, 34.929134368896484, 36.31266784667969, 37.69620132446289, 39.079734802246094, 40.46327209472656, 41.846805572509766, 43.23033905029297, 44.61387252807617, 45.997406005859375, 47.380943298339844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 10.0, 9.0, 19.0, 28.0, 49.0, 53.0, 97.0, 142.0, 220.0, 379.0, 581.0, 1035.0, 1929.0, 3910.0, 8619.0, 22182.0, 69182.0, 299989.0, 489106.0, 99425.0, 30289.0, 11108.0, 4825.0, 2309.0, 1215.0, 731.0, 423.0, 254.0, 147.0, 103.0, 51.0, 38.0, 22.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.67108154296875, -4.5257568359375, -4.38043212890625, -4.235107421875, -4.08978271484375, -3.9444580078125, -3.79913330078125, -3.65380859375, -3.50848388671875, -3.3631591796875, -3.21783447265625, -3.072509765625, -2.92718505859375, -2.7818603515625, -2.63653564453125, -2.4912109375, -2.34588623046875, -2.2005615234375, -2.05523681640625, -1.909912109375, -1.76458740234375, -1.6192626953125, -1.47393798828125, -1.32861328125, -1.18328857421875, -1.0379638671875, -0.89263916015625, -0.747314453125, -0.60198974609375, -0.4566650390625, -0.31134033203125, -0.166015625, -0.02069091796875, 0.1246337890625, 0.26995849609375, 0.415283203125, 0.56060791015625, 0.7059326171875, 0.85125732421875, 0.99658203125, 1.14190673828125, 1.2872314453125, 1.43255615234375, 1.577880859375, 1.72320556640625, 1.8685302734375, 2.01385498046875, 2.1591796875, 2.30450439453125, 2.4498291015625, 2.59515380859375, 2.740478515625, 2.88580322265625, 3.0311279296875, 3.17645263671875, 3.32177734375, 3.46710205078125, 3.6124267578125, 3.75775146484375, 3.903076171875, 4.04840087890625, 4.1937255859375, 4.33905029296875, 4.484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 14.0, 9.0, 15.0, 13.0, 22.0, 18.0, 25.0, 19.0, 30.0, 37.0, 29.0, 33.0, 43.0, 40.0, 40.0, 52.0, 53.0, 57.0, 43.0, 43.0, 31.0, 42.0, 43.0, 40.0, 35.0, 35.0, 22.0, 17.0, 18.0, 10.0, 10.0, 17.0, 8.0, 5.0, 10.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.75390625, -3.6519775390625, -3.550048828125, -3.4481201171875, -3.34619140625, -3.2442626953125, -3.142333984375, -3.0404052734375, -2.9384765625, -2.8365478515625, -2.734619140625, -2.6326904296875, -2.53076171875, -2.4288330078125, -2.326904296875, -2.2249755859375, -2.123046875, -2.0211181640625, -1.919189453125, -1.8172607421875, -1.71533203125, -1.6134033203125, -1.511474609375, -1.4095458984375, -1.3076171875, -1.2056884765625, -1.103759765625, -1.0018310546875, -0.89990234375, -0.7979736328125, -0.696044921875, -0.5941162109375, -0.4921875, -0.3902587890625, -0.288330078125, -0.1864013671875, -0.08447265625, 0.0174560546875, 0.119384765625, 0.2213134765625, 0.3232421875, 0.4251708984375, 0.527099609375, 0.6290283203125, 0.73095703125, 0.8328857421875, 0.934814453125, 1.0367431640625, 1.138671875, 1.2406005859375, 1.342529296875, 1.4444580078125, 1.54638671875, 1.6483154296875, 1.750244140625, 1.8521728515625, 1.9541015625, 2.0560302734375, 2.157958984375, 2.2598876953125, 2.36181640625, 2.4637451171875, 2.565673828125, 2.6676025390625, 2.76953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 10.0, 8.0, 15.0, 19.0, 24.0, 36.0, 67.0, 105.0, 145.0, 210.0, 355.0, 688.0, 1402.0, 3529.0, 12128.0, 66453.0, 867013.0, 76273.0, 13190.0, 3706.0, 1431.0, 679.0, 361.0, 234.0, 140.0, 84.0, 69.0, 46.0, 29.0, 19.0, 24.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.53704833984375, -5.3201904296875, -5.10333251953125, -4.886474609375, -4.66961669921875, -4.4527587890625, -4.23590087890625, -4.01904296875, -3.80218505859375, -3.5853271484375, -3.36846923828125, -3.151611328125, -2.93475341796875, -2.7178955078125, -2.50103759765625, -2.2841796875, -2.06732177734375, -1.8504638671875, -1.63360595703125, -1.416748046875, -1.19989013671875, -0.9830322265625, -0.76617431640625, -0.54931640625, -0.33245849609375, -0.1156005859375, 0.10125732421875, 0.318115234375, 0.53497314453125, 0.7518310546875, 0.96868896484375, 1.185546875, 1.40240478515625, 1.6192626953125, 1.83612060546875, 2.052978515625, 2.26983642578125, 2.4866943359375, 2.70355224609375, 2.92041015625, 3.13726806640625, 3.3541259765625, 3.57098388671875, 3.787841796875, 4.00469970703125, 4.2215576171875, 4.43841552734375, 4.6552734375, 4.87213134765625, 5.0889892578125, 5.30584716796875, 5.522705078125, 5.73956298828125, 5.9564208984375, 6.17327880859375, 6.39013671875, 6.60699462890625, 6.8238525390625, 7.04071044921875, 7.257568359375, 7.47442626953125, 7.6912841796875, 7.90814208984375, 8.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 5.0, 11.0, 14.0, 16.0, 17.0, 19.0, 21.0, 30.0, 17.0, 29.0, 48.0, 48.0, 52.0, 80.0, 83.0, 84.0, 70.0, 67.0, 41.0, 47.0, 39.0, 20.0, 22.0, 20.0, 15.0, 15.0, 10.0, 9.0, 6.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.3917236328125, -11.947509765625, -11.5032958984375, -11.05908203125, -10.6148681640625, -10.170654296875, -9.7264404296875, -9.2822265625, -8.8380126953125, -8.393798828125, -7.9495849609375, -7.50537109375, -7.0611572265625, -6.616943359375, -6.1727294921875, -5.728515625, -5.2843017578125, -4.840087890625, -4.3958740234375, -3.95166015625, -3.5074462890625, -3.063232421875, -2.6190185546875, -2.1748046875, -1.7305908203125, -1.286376953125, -0.8421630859375, -0.39794921875, 0.0462646484375, 0.490478515625, 0.9346923828125, 1.37890625, 1.8231201171875, 2.267333984375, 2.7115478515625, 3.15576171875, 3.5999755859375, 4.044189453125, 4.4884033203125, 4.9326171875, 5.3768310546875, 5.821044921875, 6.2652587890625, 6.70947265625, 7.1536865234375, 7.597900390625, 8.0421142578125, 8.486328125, 8.9305419921875, 9.374755859375, 9.8189697265625, 10.26318359375, 10.7073974609375, 11.151611328125, 11.5958251953125, 12.0400390625, 12.4842529296875, 12.928466796875, 13.3726806640625, 13.81689453125, 14.2611083984375, 14.705322265625, 15.1495361328125, 15.59375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 12.0, 26.0, 21.0, 30.0, 50.0, 83.0, 155.0, 217.0, 377.0, 646.0, 1096.0, 2287.0, 4857.0, 11807.0, 33697.0, 147796.0, 747601.0, 63997.0, 19349.0, 7438.0, 3355.0, 1563.0, 786.0, 463.0, 286.0, 193.0, 107.0, 82.0, 50.0, 26.0, 21.0, 19.0, 10.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0741119384765625, -1.040802001953125, -1.0074920654296875, -0.97418212890625, -0.9408721923828125, -0.907562255859375, -0.8742523193359375, -0.8409423828125, -0.8076324462890625, -0.774322509765625, -0.7410125732421875, -0.70770263671875, -0.6743927001953125, -0.641082763671875, -0.6077728271484375, -0.574462890625, -0.5411529541015625, -0.507843017578125, -0.4745330810546875, -0.44122314453125, -0.4079132080078125, -0.374603271484375, -0.3412933349609375, -0.3079833984375, -0.2746734619140625, -0.241363525390625, -0.2080535888671875, -0.17474365234375, -0.1414337158203125, -0.108123779296875, -0.0748138427734375, -0.04150390625, -0.0081939697265625, 0.025115966796875, 0.0584259033203125, 0.09173583984375, 0.1250457763671875, 0.158355712890625, 0.1916656494140625, 0.2249755859375, 0.2582855224609375, 0.291595458984375, 0.3249053955078125, 0.35821533203125, 0.3915252685546875, 0.424835205078125, 0.4581451416015625, 0.491455078125, 0.5247650146484375, 0.558074951171875, 0.5913848876953125, 0.62469482421875, 0.6580047607421875, 0.691314697265625, 0.7246246337890625, 0.7579345703125, 0.7912445068359375, 0.824554443359375, 0.8578643798828125, 0.89117431640625, 0.9244842529296875, 0.957794189453125, 0.9911041259765625, 1.0244140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 4.0, 3.0, 5.0, 7.0, 12.0, 13.0, 16.0, 21.0, 24.0, 34.0, 53.0, 94.0, 119.0, 130.0, 122.0, 98.0, 55.0, 46.0, 28.0, 21.0, 16.0, 8.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004742145538330078, -0.000458691269159317, -0.0004431679844856262, -0.0004276446998119354, -0.00041212141513824463, -0.00039659813046455383, -0.00038107484579086304, -0.00036555156111717224, -0.00035002827644348145, -0.00033450499176979065, -0.00031898170709609985, -0.00030345842242240906, -0.00028793513774871826, -0.00027241185307502747, -0.00025688856840133667, -0.00024136528372764587, -0.00022584199905395508, -0.00021031871438026428, -0.00019479542970657349, -0.0001792721450328827, -0.0001637488603591919, -0.0001482255756855011, -0.0001327022910118103, -0.00011717900633811951, -0.00010165572166442871, -8.613243699073792e-05, -7.060915231704712e-05, -5.508586764335632e-05, -3.956258296966553e-05, -2.403929829597473e-05, -8.516013622283936e-06, 7.00727105140686e-06, 2.2530555725097656e-05, 3.805384039878845e-05, 5.357712507247925e-05, 6.910040974617004e-05, 8.462369441986084e-05, 0.00010014697909355164, 0.00011567026376724243, 0.00013119354844093323, 0.00014671683311462402, 0.00016224011778831482, 0.00017776340246200562, 0.0001932866871356964, 0.0002088099718093872, 0.000224333256483078, 0.0002398565411567688, 0.0002553798258304596, 0.0002709031105041504, 0.0002864263951778412, 0.000301949679851532, 0.0003174729645252228, 0.0003329962491989136, 0.00034851953387260437, 0.00036404281854629517, 0.00037956610321998596, 0.00039508938789367676, 0.00041061267256736755, 0.00042613595724105835, 0.00044165924191474915, 0.00045718252658843994, 0.00047270581126213074, 0.00048822909593582153, 0.0005037523806095123, 0.0005192756652832031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 11.0, 11.0, 10.0, 18.0, 36.0, 66.0, 93.0, 144.0, 293.0, 612.0, 1184.0, 2804.0, 6785.0, 18589.0, 69467.0, 785523.0, 119939.0, 27041.0, 9225.0, 3603.0, 1477.0, 722.0, 409.0, 194.0, 123.0, 70.0, 37.0, 21.0, 17.0, 6.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.580078125, -1.53448486328125, -1.4888916015625, -1.44329833984375, -1.397705078125, -1.35211181640625, -1.3065185546875, -1.26092529296875, -1.21533203125, -1.16973876953125, -1.1241455078125, -1.07855224609375, -1.032958984375, -0.98736572265625, -0.9417724609375, -0.89617919921875, -0.8505859375, -0.80499267578125, -0.7593994140625, -0.71380615234375, -0.668212890625, -0.62261962890625, -0.5770263671875, -0.53143310546875, -0.48583984375, -0.44024658203125, -0.3946533203125, -0.34906005859375, -0.303466796875, -0.25787353515625, -0.2122802734375, -0.16668701171875, -0.12109375, -0.07550048828125, -0.0299072265625, 0.01568603515625, 0.061279296875, 0.10687255859375, 0.1524658203125, 0.19805908203125, 0.24365234375, 0.28924560546875, 0.3348388671875, 0.38043212890625, 0.426025390625, 0.47161865234375, 0.5172119140625, 0.56280517578125, 0.6083984375, 0.65399169921875, 0.6995849609375, 0.74517822265625, 0.790771484375, 0.83636474609375, 0.8819580078125, 0.92755126953125, 0.97314453125, 1.01873779296875, 1.0643310546875, 1.10992431640625, 1.155517578125, 1.20111083984375, 1.2467041015625, 1.29229736328125, 1.337890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 2.0, 7.0, 5.0, 12.0, 22.0, 20.0, 36.0, 47.0, 87.0, 83.0, 127.0, 120.0, 83.0, 76.0, 76.0, 32.0, 27.0, 29.0, 20.0, 12.0, 10.0, 9.0, 4.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.71875, -1.67254638671875, -1.6263427734375, -1.58013916015625, -1.533935546875, -1.48773193359375, -1.4415283203125, -1.39532470703125, -1.34912109375, -1.30291748046875, -1.2567138671875, -1.21051025390625, -1.164306640625, -1.11810302734375, -1.0718994140625, -1.02569580078125, -0.9794921875, -0.93328857421875, -0.8870849609375, -0.84088134765625, -0.794677734375, -0.74847412109375, -0.7022705078125, -0.65606689453125, -0.60986328125, -0.56365966796875, -0.5174560546875, -0.47125244140625, -0.425048828125, -0.37884521484375, -0.3326416015625, -0.28643798828125, -0.240234375, -0.19403076171875, -0.1478271484375, -0.10162353515625, -0.055419921875, -0.00921630859375, 0.0369873046875, 0.08319091796875, 0.12939453125, 0.17559814453125, 0.2218017578125, 0.26800537109375, 0.314208984375, 0.36041259765625, 0.4066162109375, 0.45281982421875, 0.4990234375, 0.54522705078125, 0.5914306640625, 0.63763427734375, 0.683837890625, 0.73004150390625, 0.7762451171875, 0.82244873046875, 0.86865234375, 0.91485595703125, 0.9610595703125, 1.00726318359375, 1.053466796875, 1.09967041015625, 1.1458740234375, 1.19207763671875, 1.23828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 8.0, 19.0, 28.0, 54.0, 138.0, 399.0, 180.0, 70.0, 32.0, 34.0, 16.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.836883544921875, -42.853431701660156, -40.86997985839844, -38.88652801513672, -36.903076171875, -34.91962432861328, -32.93617248535156, -30.952722549438477, -28.969270706176758, -26.98581886291504, -25.00236701965332, -23.018917083740234, -21.035465240478516, -19.052013397216797, -17.068561553955078, -15.08510971069336, -13.10165786743164, -11.118206024169922, -9.134754180908203, -7.151303291320801, -5.167851448059082, -3.1843996047973633, -1.200948715209961, 0.7825031280517578, 2.7659549713134766, 4.749406814575195, 6.732858180999756, 8.716309547424316, 10.699761390686035, 12.683213233947754, 14.666664123535156, 16.650115966796875, 18.633567810058594, 20.617019653320312, 22.60047149658203, 24.58392333984375, 26.56737518310547, 28.550827026367188, 30.534276962280273, 32.517730712890625, 34.501182556152344, 36.48463439941406, 38.46808624267578, 40.4515380859375, 42.43498992919922, 44.41844177246094, 46.401893615722656, 48.385345458984375, 50.36879348754883, 52.35224533081055, 54.335697174072266, 56.319149017333984, 58.3026008605957, 60.28605270385742, 62.269500732421875, 64.2529525756836, 66.23640441894531, 68.21985626220703, 70.20330810546875, 72.18675994873047, 74.17021179199219, 76.1536636352539, 78.13711547851562, 80.12056732177734, 82.10401916503906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 4.0, 9.0, 14.0, 12.0, 10.0, 17.0, 21.0, 19.0, 11.0, 16.0, 20.0, 26.0, 38.0, 73.0, 101.0, 104.0, 116.0, 109.0, 64.0, 40.0, 20.0, 17.0, 10.0, 23.0, 24.0, 19.0, 11.0, 10.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46061325073242, -34.2375373840332, -33.014461517333984, -31.7913875579834, -30.56831169128418, -29.34523582458496, -28.122161865234375, -26.899085998535156, -25.676010131835938, -24.45293426513672, -23.2298583984375, -22.006784439086914, -20.783708572387695, -19.560632705688477, -18.33755874633789, -17.114482879638672, -15.891407012939453, -14.668331146240234, -13.445256233215332, -12.22218132019043, -10.999105453491211, -9.776029586791992, -8.55295467376709, -7.3298797607421875, -6.106803894042969, -4.883728504180908, -3.6606531143188477, -2.437577724456787, -1.2145023345947266, 0.008573055267333984, 1.2316484451293945, 2.454723358154297, 3.67779541015625, 4.9008708000183105, 6.123946189880371, 7.347021579742432, 8.570096969604492, 9.793172836303711, 11.016247749328613, 12.239322662353516, 13.462398529052734, 14.685474395751953, 15.908549308776855, 17.131624221801758, 18.354700088500977, 19.577775955200195, 20.80084991455078, 22.02392578125, 23.24700164794922, 24.470077514648438, 25.693153381347656, 26.916227340698242, 28.13930320739746, 29.36237907409668, 30.585453033447266, 31.808528900146484, 33.0316047668457, 34.25468063354492, 35.47775650024414, 36.70083236694336, 37.92390441894531, 39.14698028564453, 40.37005615234375, 41.59313201904297, 42.81620788574219]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 11.0, 6.0, 19.0, 18.0, 14.0, 13.0, 22.0, 30.0, 26.0, 37.0, 41.0, 29.0, 78.0, 174.0, 110.0, 67.0, 35.0, 26.0, 30.0, 21.0, 24.0, 23.0, 21.0, 24.0, 12.0, 14.0, 11.0, 9.0, 6.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.26806640625, -3.1650390625, -3.06201171875, -2.958984375, -2.85595703125, -2.7529296875, -2.64990234375, -2.546875, -2.44384765625, -2.3408203125, -2.23779296875, -2.134765625, -2.03173828125, -1.9287109375, -1.82568359375, -1.72265625, -1.61962890625, -1.5166015625, -1.41357421875, -1.310546875, -1.20751953125, -1.1044921875, -1.00146484375, -0.8984375, -0.79541015625, -0.6923828125, -0.58935546875, -0.486328125, -0.38330078125, -0.2802734375, -0.17724609375, -0.07421875, 0.02880859375, 0.1318359375, 0.23486328125, 0.337890625, 0.44091796875, 0.5439453125, 0.64697265625, 0.75, 0.85302734375, 0.9560546875, 1.05908203125, 1.162109375, 1.26513671875, 1.3681640625, 1.47119140625, 1.57421875, 1.67724609375, 1.7802734375, 1.88330078125, 1.986328125, 2.08935546875, 2.1923828125, 2.29541015625, 2.3984375, 2.50146484375, 2.6044921875, 2.70751953125, 2.810546875, 2.91357421875, 3.0166015625, 3.11962890625, 3.22265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 10.0, 13.0, 15.0, 36.0, 46.0, 124.0, 209.0, 713.0, 3524.0, 48867.0, 8326156.0, 6920.0, 1251.0, 379.0, 126.0, 74.0, 25.0, 21.0, 4.0, 6.0, 14.0, 16.0, 16.0, 3.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-37.74658966064453, -36.452911376953125, -35.15923309326172, -33.86555480957031, -32.571876525878906, -31.278196334838867, -29.98451805114746, -28.690837860107422, -27.397159576416016, -26.10348129272461, -24.809803009033203, -23.516124725341797, -22.222444534301758, -20.92876625061035, -19.635087966918945, -18.341407775878906, -17.047731399536133, -15.754053115844727, -14.460373878479004, -13.166695594787598, -11.873016357421875, -10.579338073730469, -9.285659790039062, -7.99198055267334, -6.698302268981934, -5.404623508453369, -4.110944747924805, -2.8172664642333984, -1.523587703704834, -0.22990894317626953, 1.0637693405151367, 2.3574485778808594, 3.6511268615722656, 4.94480562210083, 6.2384843826293945, 7.532162666320801, 8.825841903686523, 10.11952018737793, 11.413198471069336, 12.706877708435059, 14.000555992126465, 15.294234275817871, 16.587913513183594, 17.881591796875, 19.175270080566406, 20.468948364257812, 21.76262664794922, 23.056306838989258, 24.349985122680664, 25.64366340637207, 26.937341690063477, 28.231021881103516, 29.524700164794922, 30.818378448486328, 32.112056732177734, 33.40573501586914, 34.69941329956055, 35.99309158325195, 37.28676986694336, 38.580448150634766, 39.87412643432617, 41.167808532714844, 42.46148681640625, 43.755165100097656, 45.04884338378906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 9.0, 5.0, 8.0, 4.0, 8.0, 7.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.25182342529297, -41.656986236572266, -40.06214904785156, -38.46731185913086, -36.872474670410156, -35.27763748168945, -33.68280029296875, -32.08796310424805, -30.493125915527344, -28.89828872680664, -27.303451538085938, -25.708614349365234, -24.11377716064453, -22.518939971923828, -20.924102783203125, -19.329265594482422, -17.73443031311035, -16.13959312438965, -14.544755935668945, -12.949918746948242, -11.355081558227539, -9.760244369506836, -8.16540813446045, -6.570570945739746, -4.975733757019043, -3.38089656829834, -1.7860596179962158, -0.1912226676940918, 1.4036145210266113, 2.9984517097473145, 4.593288421630859, 6.1881256103515625, 7.782962799072266, 9.377799987792969, 10.972637176513672, 12.567474365234375, 14.162311553955078, 15.757148742675781, 17.351985931396484, 18.946823120117188, 20.54166030883789, 22.136497497558594, 23.731334686279297, 25.326171875, 26.921009063720703, 28.515846252441406, 30.11068344116211, 31.705520629882812, 33.30035400390625, 34.89519119262695, 36.490028381347656, 38.08486557006836, 39.67970275878906, 41.274539947509766, 42.86937713623047, 44.46421432495117, 46.059051513671875, 47.65388870239258, 49.24872589111328, 50.843563079833984, 52.43840026855469, 54.03323745727539, 55.628074645996094, 57.2229118347168, 58.8177490234375]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 8.0, 3.0, 8.0, 10.0, 12.0, 15.0, 20.0, 19.0, 11.0, 31.0, 37.0, 52.0, 51.0, 52.0, 62.0, 67.0, 73.0, 64.0, 60.0, 65.0, 42.0, 49.0, 42.0, 34.0, 32.0, 24.0, 12.0, 17.0, 9.0, 2.0, 5.0, 1.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.2191162109375, -2.135498046875, -2.0518798828125, -1.96826171875, -1.8846435546875, -1.801025390625, -1.7174072265625, -1.6337890625, -1.5501708984375, -1.466552734375, -1.3829345703125, -1.29931640625, -1.2156982421875, -1.132080078125, -1.0484619140625, -0.96484375, -0.8812255859375, -0.797607421875, -0.7139892578125, -0.63037109375, -0.5467529296875, -0.463134765625, -0.3795166015625, -0.2958984375, -0.2122802734375, -0.128662109375, -0.0450439453125, 0.03857421875, 0.1221923828125, 0.205810546875, 0.2894287109375, 0.373046875, 0.4566650390625, 0.540283203125, 0.6239013671875, 0.70751953125, 0.7911376953125, 0.874755859375, 0.9583740234375, 1.0419921875, 1.1256103515625, 1.209228515625, 1.2928466796875, 1.37646484375, 1.4600830078125, 1.543701171875, 1.6273193359375, 1.7109375, 1.7945556640625, 1.878173828125, 1.9617919921875, 2.04541015625, 2.1290283203125, 2.212646484375, 2.2962646484375, 2.3798828125, 2.4635009765625, 2.547119140625, 2.6307373046875, 2.71435546875, 2.7979736328125, 2.881591796875, 2.9652099609375, 3.048828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 13.0, 18.0, 39.0, 50.0, 80.0, 128.0, 183.0, 322.0, 579.0, 999.0, 2125.0, 4394.0, 9784.0, 22821.0, 53473.0, 119309.0, 157101.0, 86699.0, 36838.0, 15587.0, 6905.0, 3197.0, 1588.0, 823.0, 457.0, 264.0, 171.0, 102.0, 64.0, 50.0, 25.0, 18.0, 11.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.328125, -18.68994140625, -18.0517578125, -17.41357421875, -16.775390625, -16.13720703125, -15.4990234375, -14.86083984375, -14.22265625, -13.58447265625, -12.9462890625, -12.30810546875, -11.669921875, -11.03173828125, -10.3935546875, -9.75537109375, -9.1171875, -8.47900390625, -7.8408203125, -7.20263671875, -6.564453125, -5.92626953125, -5.2880859375, -4.64990234375, -4.01171875, -3.37353515625, -2.7353515625, -2.09716796875, -1.458984375, -0.82080078125, -0.1826171875, 0.45556640625, 1.09375, 1.73193359375, 2.3701171875, 3.00830078125, 3.646484375, 4.28466796875, 4.9228515625, 5.56103515625, 6.19921875, 6.83740234375, 7.4755859375, 8.11376953125, 8.751953125, 9.39013671875, 10.0283203125, 10.66650390625, 11.3046875, 11.94287109375, 12.5810546875, 13.21923828125, 13.857421875, 14.49560546875, 15.1337890625, 15.77197265625, 16.41015625, 17.04833984375, 17.6865234375, 18.32470703125, 18.962890625, 19.60107421875, 20.2392578125, 20.87744140625, 21.515625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 15.0, 9.0, 16.0, 17.0, 17.0, 23.0, 24.0, 21.0, 35.0, 28.0, 35.0, 46.0, 50.0, 48.0, 53.0, 46.0, 47.0, 64.0, 50.0, 47.0, 34.0, 28.0, 39.0, 27.0, 23.0, 21.0, 23.0, 23.0, 19.0, 5.0, 9.0, 9.0, 5.0, 8.0, 5.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.08648681640625, -2.9893798828125, -2.89227294921875, -2.795166015625, -2.69805908203125, -2.6009521484375, -2.50384521484375, -2.40673828125, -2.30963134765625, -2.2125244140625, -2.11541748046875, -2.018310546875, -1.92120361328125, -1.8240966796875, -1.72698974609375, -1.6298828125, -1.53277587890625, -1.4356689453125, -1.33856201171875, -1.241455078125, -1.14434814453125, -1.0472412109375, -0.95013427734375, -0.85302734375, -0.75592041015625, -0.6588134765625, -0.56170654296875, -0.464599609375, -0.36749267578125, -0.2703857421875, -0.17327880859375, -0.076171875, 0.02093505859375, 0.1180419921875, 0.21514892578125, 0.312255859375, 0.40936279296875, 0.5064697265625, 0.60357666015625, 0.70068359375, 0.79779052734375, 0.8948974609375, 0.99200439453125, 1.089111328125, 1.18621826171875, 1.2833251953125, 1.38043212890625, 1.4775390625, 1.57464599609375, 1.6717529296875, 1.76885986328125, 1.865966796875, 1.96307373046875, 2.0601806640625, 2.15728759765625, 2.25439453125, 2.35150146484375, 2.4486083984375, 2.54571533203125, 2.642822265625, 2.73992919921875, 2.8370361328125, 2.93414306640625, 3.03125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 21.0, 25.0, 62.0, 105.0, 105.0, 61.0, 31.0, 16.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.659820556640625, -30.639490127563477, -29.619159698486328, -28.598827362060547, -27.5784969329834, -26.55816650390625, -25.5378360748291, -24.517505645751953, -23.497173309326172, -22.476842880249023, -21.456512451171875, -20.436180114746094, -19.415849685668945, -18.395519256591797, -17.37518882751465, -16.3548583984375, -15.334527969360352, -14.314197540283203, -13.293866157531738, -12.27353572845459, -11.253204345703125, -10.232873916625977, -9.212543487548828, -8.19221305847168, -7.171881675720215, -6.151550769805908, -5.131219863891602, -4.110889434814453, -3.0905585289001465, -2.07022762298584, -1.0498971939086914, -0.029566287994384766, 0.9907646179199219, 2.0110955238342285, 3.031426191329956, 4.051756858825684, 5.07208776473999, 6.092418670654297, 7.112749099731445, 8.133079528808594, 9.153410911560059, 10.173741340637207, 11.194072723388672, 12.21440315246582, 13.234733581542969, 14.255064964294434, 15.275395393371582, 16.295726776123047, 17.316057205200195, 18.336387634277344, 19.356718063354492, 20.37704849243164, 21.397380828857422, 22.41771125793457, 23.43804168701172, 24.458372116088867, 25.478702545166016, 26.499032974243164, 27.519363403320312, 28.539695739746094, 29.560026168823242, 30.58035659790039, 31.60068702697754, 32.62101745605469, 33.64134979248047]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 9.0, 8.0, 9.0, 16.0, 21.0, 32.0, 58.0, 55.0, 72.0, 45.0, 27.0, 27.0, 18.0, 11.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.537559509277344, -15.982501029968262, -15.42744255065918, -14.872384071350098, -14.317325592041016, -13.76226806640625, -13.207209587097168, -12.652151107788086, -12.097092628479004, -11.542034149169922, -10.98697566986084, -10.431917190551758, -9.876859664916992, -9.321800231933594, -8.766742706298828, -8.211684226989746, -7.656625747680664, -7.101567268371582, -6.5465087890625, -5.991450786590576, -5.436392307281494, -4.881333827972412, -4.326275825500488, -3.7712173461914062, -3.216158866882324, -2.661100387573242, -2.1060421466827393, -1.5509837865829468, -0.9959254264831543, -0.44086694717407227, 0.11419129371643066, 0.6692495346069336, 1.2243061065673828, 1.7793644666671753, 2.3344228267669678, 2.8894810676574707, 3.4445395469665527, 3.9995980262756348, 4.554656028747559, 5.109714508056641, 5.664772987365723, 6.219831466674805, 6.774889945983887, 7.3299479484558105, 7.885006427764893, 8.440065383911133, 8.995122909545898, 9.55018138885498, 10.105239868164062, 10.660298347473145, 11.215356826782227, 11.770415306091309, 12.32547378540039, 12.880531311035156, 13.435589790344238, 13.99064826965332, 14.545706748962402, 15.100765228271484, 15.655823707580566, 16.21088218688965, 16.765939712524414, 17.320999145507812, 17.876056671142578, 18.431114196777344, 18.986173629760742]}, "eval/loss": 1.8941514492034912, "eval/wer": 1.1062871876239588, "eval/runtime": 910.08, "eval/samples_per_second": 2.903, "eval/steps_per_second": 0.364} \ No newline at end of file