diff --git "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" --- "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" +++ "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2069, "train/learning_rate": 1.9512195121951218e-06, "train/epoch": 5.0, "train/global_step": 1115, "_runtime": 26937, "_timestamp": 1648264065, "_step": 1118, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 13.0, 18.0, 25.0, 50.0, 74.0, 109.0, 157.0, 160.0, 161.0, 89.0, 56.0, 41.0, 23.0, 17.0, 7.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.614524245262146, -0.5559785962104797, -0.4974329471588135, -0.4388873279094696, -0.38034167885780334, -0.3217960298061371, -0.2632504105567932, -0.20470476150512695, -0.1461591124534607, -0.08761347085237503, -0.029067829251289368, 0.029477804899215698, 0.08802345395088196, 0.14656910300254822, 0.2051147222518921, 0.26366037130355835, 0.3222060203552246, 0.38075166940689087, 0.43929731845855713, 0.497842937707901, 0.5563886165618896, 0.6149342060089111, 0.6734798550605774, 0.7320255041122437, 0.7905711531639099, 0.8491168022155762, 0.9076624512672424, 0.9662081003189087, 1.0247536897659302, 1.0832993984222412, 1.1418449878692627, 1.2003905773162842, 1.2589364051818848, 1.3174819946289062, 1.3760277032852173, 1.4345732927322388, 1.4931190013885498, 1.5516645908355713, 1.6102101802825928, 1.6687558889389038, 1.7273015975952148, 1.7858471870422363, 1.8443928956985474, 1.9029384851455688, 1.9614841938018799, 2.0200297832489014, 2.078575372695923, 2.1371212005615234, 2.195666790008545, 2.2542123794555664, 2.312757968902588, 2.3713037967681885, 2.42984938621521, 2.4883949756622314, 2.546940565109253, 2.6054863929748535, 2.664031744003296, 2.7225773334503174, 2.781122922897339, 2.8396687507629395, 2.898214340209961, 2.9567599296569824, 3.015305519104004, 3.0738511085510254, 3.132396936416626]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 8.0, 16.0, 17.0, 13.0, 14.0, 24.0, 20.0, 25.0, 31.0, 27.0, 24.0, 39.0, 29.0, 38.0, 51.0, 40.0, 46.0, 41.0, 32.0, 36.0, 41.0, 34.0, 39.0, 27.0, 32.0, 14.0, 23.0, 25.0, 27.0, 19.0, 19.0, 13.0, 9.0, 15.0, 14.0, 10.0, 5.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0], "bins": [-0.7400795221328735, -0.7190272808074951, -0.6979750990867615, -0.6769228577613831, -0.6558706760406494, -0.634818434715271, -0.6137662529945374, -0.5927140116691589, -0.5716618299484253, -0.5506095886230469, -0.5295574069023132, -0.5085051655769348, -0.48745298385620117, -0.46640077233314514, -0.4453485608100891, -0.4242963194847107, -0.40324410796165466, -0.38219189643859863, -0.3611396849155426, -0.3400874733924866, -0.31903526186943054, -0.2979830503463745, -0.2769308090209961, -0.25587862730026245, -0.23482640087604523, -0.2137741893529892, -0.19272197782993317, -0.17166975140571594, -0.1506175398826599, -0.12956532835960388, -0.10851311683654785, -0.08746090531349182, -0.06640869379043579, -0.04535648226737976, -0.024304267019033432, -0.0032520517706871033, 0.017800159752368927, 0.03885237127542496, 0.059904590249061584, 0.08095680177211761, 0.10200901329517365, 0.12306122481822968, 0.1441134363412857, 0.16516566276550293, 0.18621787428855896, 0.207270085811615, 0.22832229733467102, 0.24937450885772705, 0.2704267203807831, 0.2914789319038391, 0.31253114342689514, 0.33358335494995117, 0.3546355664730072, 0.37568777799606323, 0.39674001932144165, 0.4177922010421753, 0.4388444423675537, 0.45989665389060974, 0.48094886541366577, 0.5020011067390442, 0.5230532884597778, 0.5441055297851562, 0.5651577115058899, 0.5862099528312683, 0.607262134552002]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 17.0, 15.0, 26.0, 30.0, 35.0, 63.0, 97.0, 128.0, 188.0, 280.0, 440.0, 788.0, 1307.0, 2487.0, 5555.0, 14801.0, 99328.0, 1248391.0, 2544552.0, 235525.0, 25350.0, 7514.0, 3245.0, 1628.0, 850.0, 515.0, 345.0, 222.0, 156.0, 135.0, 69.0, 52.0, 37.0, 32.0, 17.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0], "bins": [-3.935546875, -3.829681396484375, -3.72381591796875, -3.617950439453125, -3.5120849609375, -3.406219482421875, -3.30035400390625, -3.194488525390625, -3.088623046875, -2.982757568359375, -2.87689208984375, -2.771026611328125, -2.6651611328125, -2.559295654296875, -2.45343017578125, -2.347564697265625, -2.24169921875, -2.135833740234375, -2.02996826171875, -1.924102783203125, -1.8182373046875, -1.712371826171875, -1.60650634765625, -1.500640869140625, -1.394775390625, -1.288909912109375, -1.18304443359375, -1.077178955078125, -0.9713134765625, -0.865447998046875, -0.75958251953125, -0.653717041015625, -0.5478515625, -0.441986083984375, -0.33612060546875, -0.230255126953125, -0.1243896484375, -0.018524169921875, 0.08734130859375, 0.193206787109375, 0.299072265625, 0.404937744140625, 0.51080322265625, 0.616668701171875, 0.7225341796875, 0.828399658203125, 0.93426513671875, 1.040130615234375, 1.14599609375, 1.251861572265625, 1.35772705078125, 1.463592529296875, 1.5694580078125, 1.675323486328125, 1.78118896484375, 1.887054443359375, 1.992919921875, 2.098785400390625, 2.20465087890625, 2.310516357421875, 2.4163818359375, 2.522247314453125, 2.62811279296875, 2.733978271484375, 2.83984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 9.0, 10.0, 8.0, 20.0, 18.0, 26.0, 21.0, 22.0, 34.0, 32.0, 29.0, 33.0, 45.0, 34.0, 57.0, 56.0, 54.0, 32.0, 41.0, 46.0, 38.0, 50.0, 33.0, 23.0, 30.0, 22.0, 29.0, 18.0, 22.0, 15.0, 10.0, 8.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.7158203125, -1.6680145263671875, -1.620208740234375, -1.5724029541015625, -1.52459716796875, -1.4767913818359375, -1.428985595703125, -1.3811798095703125, -1.3333740234375, -1.2855682373046875, -1.237762451171875, -1.1899566650390625, -1.14215087890625, -1.0943450927734375, -1.046539306640625, -0.9987335205078125, -0.950927734375, -0.9031219482421875, -0.855316162109375, -0.8075103759765625, -0.75970458984375, -0.7118988037109375, -0.664093017578125, -0.6162872314453125, -0.5684814453125, -0.5206756591796875, -0.472869873046875, -0.4250640869140625, -0.37725830078125, -0.3294525146484375, -0.281646728515625, -0.2338409423828125, -0.18603515625, -0.1382293701171875, -0.090423583984375, -0.0426177978515625, 0.00518798828125, 0.0529937744140625, 0.100799560546875, 0.1486053466796875, 0.1964111328125, 0.2442169189453125, 0.292022705078125, 0.3398284912109375, 0.38763427734375, 0.4354400634765625, 0.483245849609375, 0.5310516357421875, 0.578857421875, 0.6266632080078125, 0.674468994140625, 0.7222747802734375, 0.77008056640625, 0.8178863525390625, 0.865692138671875, 0.9134979248046875, 0.9613037109375, 1.0091094970703125, 1.056915283203125, 1.1047210693359375, 1.15252685546875, 1.2003326416015625, 1.248138427734375, 1.2959442138671875, 1.34375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 13.0, 22.0, 17.0, 39.0, 74.0, 132.0, 333.0, 1811.0, 55303.0, 4126606.0, 8398.0, 912.0, 313.0, 113.0, 58.0, 41.0, 24.0, 17.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.533203125, -12.10546875, -11.677734375, -11.25, -10.822265625, -10.39453125, -9.966796875, -9.5390625, -9.111328125, -8.68359375, -8.255859375, -7.828125, -7.400390625, -6.97265625, -6.544921875, -6.1171875, -5.689453125, -5.26171875, -4.833984375, -4.40625, -3.978515625, -3.55078125, -3.123046875, -2.6953125, -2.267578125, -1.83984375, -1.412109375, -0.984375, -0.556640625, -0.12890625, 0.298828125, 0.7265625, 1.154296875, 1.58203125, 2.009765625, 2.4375, 2.865234375, 3.29296875, 3.720703125, 4.1484375, 4.576171875, 5.00390625, 5.431640625, 5.859375, 6.287109375, 6.71484375, 7.142578125, 7.5703125, 7.998046875, 8.42578125, 8.853515625, 9.28125, 9.708984375, 10.13671875, 10.564453125, 10.9921875, 11.419921875, 11.84765625, 12.275390625, 12.703125, 13.130859375, 13.55859375, 13.986328125, 14.4140625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 10.0, 24.0, 21.0, 44.0, 79.0, 118.0, 221.0, 658.0, 1295.0, 822.0, 338.0, 165.0, 90.0, 63.0, 32.0, 25.0, 15.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8875885009765625, -0.854278564453125, -0.8209686279296875, -0.78765869140625, -0.7543487548828125, -0.721038818359375, -0.6877288818359375, -0.6544189453125, -0.6211090087890625, -0.587799072265625, -0.5544891357421875, -0.52117919921875, -0.4878692626953125, -0.454559326171875, -0.4212493896484375, -0.387939453125, -0.3546295166015625, -0.321319580078125, -0.2880096435546875, -0.25469970703125, -0.2213897705078125, -0.188079833984375, -0.1547698974609375, -0.1214599609375, -0.0881500244140625, -0.054840087890625, -0.0215301513671875, 0.01177978515625, 0.0450897216796875, 0.078399658203125, 0.1117095947265625, 0.14501953125, 0.1783294677734375, 0.211639404296875, 0.2449493408203125, 0.27825927734375, 0.3115692138671875, 0.344879150390625, 0.3781890869140625, 0.4114990234375, 0.4448089599609375, 0.478118896484375, 0.5114288330078125, 0.54473876953125, 0.5780487060546875, 0.611358642578125, 0.6446685791015625, 0.677978515625, 0.7112884521484375, 0.744598388671875, 0.7779083251953125, 0.81121826171875, 0.8445281982421875, 0.877838134765625, 0.9111480712890625, 0.9444580078125, 0.9777679443359375, 1.011077880859375, 1.0443878173828125, 1.07769775390625, 1.1110076904296875, 1.144317626953125, 1.1776275634765625, 1.2109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 11.0, 17.0, 15.0, 18.0, 14.0, 20.0, 32.0, 35.0, 61.0, 62.0, 76.0, 86.0, 81.0, 95.0, 81.0, 64.0, 50.0, 33.0, 34.0, 23.0, 23.0, 12.0, 14.0, 11.0, 7.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.188549280166626, -2.1190285682678223, -2.0495080947875977, -1.979987382888794, -1.9104666709899902, -1.840946078300476, -1.771425485610962, -1.7019047737121582, -1.632384181022644, -1.5628635883331299, -1.4933428764343262, -1.423822283744812, -1.3543016910552979, -1.2847809791564941, -1.21526038646698, -1.1457397937774658, -1.076219081878662, -1.006698489189148, -0.9371777772903442, -0.8676571846008301, -0.7981365323066711, -0.7286158800125122, -0.659095287322998, -0.5895746350288391, -0.5200539827346802, -0.45053333044052124, -0.3810127079486847, -0.31149208545684814, -0.2419714331626892, -0.17245078086853027, -0.10293015837669373, -0.03340953588485718, 0.03611111640930176, 0.1056317538022995, 0.17515239119529724, 0.24467302858829498, 0.3141936659812927, 0.38371431827545166, 0.4532349407672882, 0.5227555632591248, 0.5922762155532837, 0.6617968678474426, 0.7313175201416016, 0.8008381128311157, 0.8703587651252747, 0.9398794174194336, 1.0094000101089478, 1.078920602798462, 1.1484413146972656, 1.2179619073867798, 1.2874826192855835, 1.3570032119750977, 1.4265239238739014, 1.4960445165634155, 1.5655651092529297, 1.6350858211517334, 1.7046064138412476, 1.7741270065307617, 1.8436477184295654, 1.9131683111190796, 1.9826889038085938, 2.0522096157073975, 2.121730327606201, 2.191250801086426, 2.2607715129852295]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 5.0, 14.0, 12.0, 11.0, 14.0, 19.0, 16.0, 28.0, 35.0, 36.0, 40.0, 39.0, 38.0, 44.0, 50.0, 42.0, 38.0, 56.0, 36.0, 38.0, 51.0, 35.0, 32.0, 40.0, 25.0, 32.0, 25.0, 25.0, 22.0, 16.0, 18.0, 9.0, 15.0, 8.0, 8.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7684389352798462, -1.720792293548584, -1.6731456518173218, -1.6254990100860596, -1.5778523683547974, -1.5302057266235352, -1.482559084892273, -1.4349124431610107, -1.3872658014297485, -1.3396191596984863, -1.2919725179672241, -1.244325876235962, -1.1966792345046997, -1.1490325927734375, -1.1013859510421753, -1.053739309310913, -1.0060926675796509, -0.9584460258483887, -0.9107993841171265, -0.8631527423858643, -0.815506100654602, -0.7678594589233398, -0.7202128171920776, -0.6725661754608154, -0.6249195337295532, -0.577272891998291, -0.5296262502670288, -0.4819796085357666, -0.4343329668045044, -0.3866863250732422, -0.33903968334198, -0.2913930416107178, -0.24374651908874512, -0.1960998773574829, -0.1484532356262207, -0.1008065938949585, -0.05315995216369629, -0.005513310432434082, 0.042133331298828125, 0.08977997303009033, 0.13742661476135254, 0.18507325649261475, 0.23271989822387695, 0.28036653995513916, 0.32801318168640137, 0.3756598234176636, 0.4233064651489258, 0.470953106880188, 0.5185997486114502, 0.5662463903427124, 0.6138930320739746, 0.6615396738052368, 0.709186315536499, 0.7568329572677612, 0.8044795989990234, 0.8521262407302856, 0.8997728824615479, 0.9474195241928101, 0.9950661659240723, 1.0427128076553345, 1.0903594493865967, 1.1380060911178589, 1.185652732849121, 1.2332993745803833, 1.2809460163116455]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 6.0, 12.0, 14.0, 30.0, 32.0, 40.0, 67.0, 108.0, 162.0, 249.0, 372.0, 607.0, 898.0, 1588.0, 2695.0, 5145.0, 9935.0, 21051.0, 46848.0, 108909.0, 254478.0, 324257.0, 151142.0, 64048.0, 27879.0, 13056.0, 6534.0, 3393.0, 1934.0, 1120.0, 672.0, 438.0, 292.0, 169.0, 120.0, 70.0, 46.0, 38.0, 32.0, 26.0, 17.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.755859375, -0.7308197021484375, -0.705780029296875, -0.6807403564453125, -0.65570068359375, -0.6306610107421875, -0.605621337890625, -0.5805816650390625, -0.5555419921875, -0.5305023193359375, -0.505462646484375, -0.4804229736328125, -0.45538330078125, -0.4303436279296875, -0.405303955078125, -0.3802642822265625, -0.355224609375, -0.3301849365234375, -0.305145263671875, -0.2801055908203125, -0.25506591796875, -0.2300262451171875, -0.204986572265625, -0.1799468994140625, -0.1549072265625, -0.1298675537109375, -0.104827880859375, -0.0797882080078125, -0.05474853515625, -0.0297088623046875, -0.004669189453125, 0.0203704833984375, 0.04541015625, 0.0704498291015625, 0.095489501953125, 0.1205291748046875, 0.14556884765625, 0.1706085205078125, 0.195648193359375, 0.2206878662109375, 0.2457275390625, 0.2707672119140625, 0.295806884765625, 0.3208465576171875, 0.34588623046875, 0.3709259033203125, 0.395965576171875, 0.4210052490234375, 0.446044921875, 0.4710845947265625, 0.496124267578125, 0.5211639404296875, 0.54620361328125, 0.5712432861328125, 0.596282958984375, 0.6213226318359375, 0.6463623046875, 0.6714019775390625, 0.696441650390625, 0.7214813232421875, 0.74652099609375, 0.7715606689453125, 0.796600341796875, 0.8216400146484375, 0.8466796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 23.0, 10.0, 16.0, 19.0, 30.0, 30.0, 38.0, 42.0, 45.0, 43.0, 32.0, 37.0, 54.0, 42.0, 37.0, 43.0, 49.0, 38.0, 43.0, 39.0, 39.0, 27.0, 31.0, 26.0, 19.0, 21.0, 17.0, 9.0, 12.0, 9.0, 12.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.998291015625, -0.96826171875, -0.938232421875, -0.908203125, -0.878173828125, -0.84814453125, -0.818115234375, -0.7880859375, -0.758056640625, -0.72802734375, -0.697998046875, -0.66796875, -0.637939453125, -0.60791015625, -0.577880859375, -0.5478515625, -0.517822265625, -0.48779296875, -0.457763671875, -0.427734375, -0.397705078125, -0.36767578125, -0.337646484375, -0.3076171875, -0.277587890625, -0.24755859375, -0.217529296875, -0.1875, -0.157470703125, -0.12744140625, -0.097412109375, -0.0673828125, -0.037353515625, -0.00732421875, 0.022705078125, 0.052734375, 0.082763671875, 0.11279296875, 0.142822265625, 0.1728515625, 0.202880859375, 0.23291015625, 0.262939453125, 0.29296875, 0.322998046875, 0.35302734375, 0.383056640625, 0.4130859375, 0.443115234375, 0.47314453125, 0.503173828125, 0.533203125, 0.563232421875, 0.59326171875, 0.623291015625, 0.6533203125, 0.683349609375, 0.71337890625, 0.743408203125, 0.7734375, 0.803466796875, 0.83349609375, 0.863525390625, 0.8935546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 13.0, 17.0, 28.0, 52.0, 85.0, 107.0, 175.0, 312.0, 434.0, 930.0, 1738.0, 3460.0, 8021.0, 20772.0, 64294.0, 239131.0, 472048.0, 163144.0, 45991.0, 15690.0, 6183.0, 2696.0, 1385.0, 761.0, 396.0, 246.0, 149.0, 87.0, 65.0, 33.0, 31.0, 19.0, 15.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8739700317382812, -0.8431549072265625, -0.8123397827148438, -0.781524658203125, -0.7507095336914062, -0.7198944091796875, -0.6890792846679688, -0.65826416015625, -0.6274490356445312, -0.5966339111328125, -0.5658187866210938, -0.535003662109375, -0.5041885375976562, -0.4733734130859375, -0.44255828857421875, -0.4117431640625, -0.38092803955078125, -0.3501129150390625, -0.31929779052734375, -0.288482666015625, -0.25766754150390625, -0.2268524169921875, -0.19603729248046875, -0.16522216796875, -0.13440704345703125, -0.1035919189453125, -0.07277679443359375, -0.041961669921875, -0.01114654541015625, 0.0196685791015625, 0.05048370361328125, 0.081298828125, 0.11211395263671875, 0.1429290771484375, 0.17374420166015625, 0.204559326171875, 0.23537445068359375, 0.2661895751953125, 0.29700469970703125, 0.32781982421875, 0.35863494873046875, 0.3894500732421875, 0.42026519775390625, 0.451080322265625, 0.48189544677734375, 0.5127105712890625, 0.5435256958007812, 0.5743408203125, 0.6051559448242188, 0.6359710693359375, 0.6667861938476562, 0.697601318359375, 0.7284164428710938, 0.7592315673828125, 0.7900466918945312, 0.82086181640625, 0.8516769409179688, 0.8824920654296875, 0.9133071899414062, 0.944122314453125, 0.9749374389648438, 1.0057525634765625, 1.0365676879882812, 1.0673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 16.0, 15.0, 13.0, 10.0, 22.0, 20.0, 16.0, 32.0, 44.0, 43.0, 35.0, 49.0, 47.0, 51.0, 32.0, 48.0, 46.0, 51.0, 33.0, 51.0, 42.0, 29.0, 29.0, 25.0, 22.0, 16.0, 18.0, 19.0, 11.0, 9.0, 11.0, 14.0, 6.0, 8.0, 7.0, 4.0, 3.0, 8.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9306640625, -1.8682098388671875, -1.805755615234375, -1.7433013916015625, -1.68084716796875, -1.6183929443359375, -1.555938720703125, -1.4934844970703125, -1.4310302734375, -1.3685760498046875, -1.306121826171875, -1.2436676025390625, -1.18121337890625, -1.1187591552734375, -1.056304931640625, -0.9938507080078125, -0.931396484375, -0.8689422607421875, -0.806488037109375, -0.7440338134765625, -0.68157958984375, -0.6191253662109375, -0.556671142578125, -0.4942169189453125, -0.4317626953125, -0.3693084716796875, -0.306854248046875, -0.2444000244140625, -0.18194580078125, -0.1194915771484375, -0.057037353515625, 0.0054168701171875, 0.06787109375, 0.1303253173828125, 0.192779541015625, 0.2552337646484375, 0.31768798828125, 0.3801422119140625, 0.442596435546875, 0.5050506591796875, 0.5675048828125, 0.6299591064453125, 0.692413330078125, 0.7548675537109375, 0.81732177734375, 0.8797760009765625, 0.942230224609375, 1.0046844482421875, 1.067138671875, 1.1295928955078125, 1.192047119140625, 1.2545013427734375, 1.31695556640625, 1.3794097900390625, 1.441864013671875, 1.5043182373046875, 1.5667724609375, 1.6292266845703125, 1.691680908203125, 1.7541351318359375, 1.81658935546875, 1.8790435791015625, 1.941497802734375, 2.0039520263671875, 2.06640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 15.0, 35.0, 54.0, 45.0, 76.0, 145.0, 205.0, 311.0, 530.0, 876.0, 1483.0, 2792.0, 5473.0, 12108.0, 30805.0, 131137.0, 624842.0, 174003.0, 36964.0, 13422.0, 6118.0, 2921.0, 1680.0, 1002.0, 531.0, 346.0, 207.0, 121.0, 92.0, 54.0, 37.0, 25.0, 25.0, 12.0, 12.0, 10.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2384033203125, -0.23130226135253906, -0.22420120239257812, -0.2171001434326172, -0.20999908447265625, -0.2028980255126953, -0.19579696655273438, -0.18869590759277344, -0.1815948486328125, -0.17449378967285156, -0.16739273071289062, -0.1602916717529297, -0.15319061279296875, -0.1460895538330078, -0.13898849487304688, -0.13188743591308594, -0.124786376953125, -0.11768531799316406, -0.11058425903320312, -0.10348320007324219, -0.09638214111328125, -0.08928108215332031, -0.08218002319335938, -0.07507896423339844, -0.0679779052734375, -0.06087684631347656, -0.053775787353515625, -0.04667472839355469, -0.03957366943359375, -0.03247261047363281, -0.025371551513671875, -0.018270492553710938, -0.01116943359375, -0.0040683746337890625, 0.003032684326171875, 0.010133743286132812, 0.01723480224609375, 0.024335861206054688, 0.031436920166015625, 0.03853797912597656, 0.0456390380859375, 0.05274009704589844, 0.059841156005859375, 0.06694221496582031, 0.07404327392578125, 0.08114433288574219, 0.08824539184570312, 0.09534645080566406, 0.102447509765625, 0.10954856872558594, 0.11664962768554688, 0.12375068664550781, 0.13085174560546875, 0.1379528045654297, 0.14505386352539062, 0.15215492248535156, 0.1592559814453125, 0.16635704040527344, 0.17345809936523438, 0.1805591583251953, 0.18766021728515625, 0.1947612762451172, 0.20186233520507812, 0.20896339416503906, 0.216064453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 6.0, 10.0, 18.0, 15.0, 39.0, 41.0, 103.0, 150.0, 203.0, 140.0, 85.0, 47.0, 30.0, 23.0, 21.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020241737365722656, -0.0001963600516319275, -0.00019030272960662842, -0.00018424540758132935, -0.00017818808555603027, -0.0001721307635307312, -0.00016607344150543213, -0.00016001611948013306, -0.00015395879745483398, -0.0001479014754295349, -0.00014184415340423584, -0.00013578683137893677, -0.0001297295093536377, -0.00012367218732833862, -0.00011761486530303955, -0.00011155754327774048, -0.0001055002212524414, -9.944289922714233e-05, -9.338557720184326e-05, -8.732825517654419e-05, -8.127093315124512e-05, -7.521361112594604e-05, -6.915628910064697e-05, -6.30989670753479e-05, -5.704164505004883e-05, -5.0984323024749756e-05, -4.4927000999450684e-05, -3.886967897415161e-05, -3.281235694885254e-05, -2.6755034923553467e-05, -2.0697712898254395e-05, -1.4640390872955322e-05, -8.58306884765625e-06, -2.5257468223571777e-06, 3.5315752029418945e-06, 9.588897228240967e-06, 1.564621925354004e-05, 2.170354127883911e-05, 2.7760863304138184e-05, 3.3818185329437256e-05, 3.987550735473633e-05, 4.59328293800354e-05, 5.199015140533447e-05, 5.8047473430633545e-05, 6.410479545593262e-05, 7.016211748123169e-05, 7.621943950653076e-05, 8.227676153182983e-05, 8.83340835571289e-05, 9.439140558242798e-05, 0.00010044872760772705, 0.00010650604963302612, 0.0001125633716583252, 0.00011862069368362427, 0.00012467801570892334, 0.0001307353377342224, 0.00013679265975952148, 0.00014284998178482056, 0.00014890730381011963, 0.0001549646258354187, 0.00016102194786071777, 0.00016707926988601685, 0.00017313659191131592, 0.000179193913936615, 0.00018525123596191406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 13.0, 14.0, 24.0, 28.0, 41.0, 96.0, 135.0, 308.0, 653.0, 1396.0, 3181.0, 8031.0, 24139.0, 112015.0, 642628.0, 202067.0, 35427.0, 10828.0, 4172.0, 1705.0, 808.0, 386.0, 180.0, 86.0, 48.0, 37.0, 25.0, 12.0, 15.0, 6.0, 10.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.287109375, -0.2785758972167969, -0.27004241943359375, -0.2615089416503906, -0.2529754638671875, -0.24444198608398438, -0.23590850830078125, -0.22737503051757812, -0.218841552734375, -0.21030807495117188, -0.20177459716796875, -0.19324111938476562, -0.1847076416015625, -0.17617416381835938, -0.16764068603515625, -0.15910720825195312, -0.15057373046875, -0.14204025268554688, -0.13350677490234375, -0.12497329711914062, -0.1164398193359375, -0.10790634155273438, -0.09937286376953125, -0.09083938598632812, -0.082305908203125, -0.07377243041992188, -0.06523895263671875, -0.056705474853515625, -0.0481719970703125, -0.039638519287109375, -0.03110504150390625, -0.022571563720703125, -0.0140380859375, -0.005504608154296875, 0.00302886962890625, 0.011562347412109375, 0.0200958251953125, 0.028629302978515625, 0.03716278076171875, 0.045696258544921875, 0.054229736328125, 0.06276321411132812, 0.07129669189453125, 0.07983016967773438, 0.0883636474609375, 0.09689712524414062, 0.10543060302734375, 0.11396408081054688, 0.12249755859375, 0.13103103637695312, 0.13956451416015625, 0.14809799194335938, 0.1566314697265625, 0.16516494750976562, 0.17369842529296875, 0.18223190307617188, 0.190765380859375, 0.19929885864257812, 0.20783233642578125, 0.21636581420898438, 0.2248992919921875, 0.23343276977539062, 0.24196624755859375, 0.2504997253417969, 0.259033203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 10.0, 8.0, 15.0, 15.0, 18.0, 27.0, 44.0, 43.0, 61.0, 75.0, 82.0, 101.0, 95.0, 86.0, 59.0, 53.0, 30.0, 36.0, 27.0, 23.0, 7.0, 10.0, 13.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0701904296875, -0.0681161880493164, -0.06604194641113281, -0.06396770477294922, -0.061893463134765625, -0.05981922149658203, -0.05774497985839844, -0.055670738220214844, -0.05359649658203125, -0.051522254943847656, -0.04944801330566406, -0.04737377166748047, -0.045299530029296875, -0.04322528839111328, -0.04115104675292969, -0.039076805114746094, -0.0370025634765625, -0.034928321838378906, -0.03285408020019531, -0.03077983856201172, -0.028705596923828125, -0.02663135528564453, -0.024557113647460938, -0.022482872009277344, -0.02040863037109375, -0.018334388732910156, -0.016260147094726562, -0.014185905456542969, -0.012111663818359375, -0.010037422180175781, -0.007963180541992188, -0.005888938903808594, -0.003814697265625, -0.0017404556274414062, 0.0003337860107421875, 0.0024080276489257812, 0.004482269287109375, 0.006556510925292969, 0.008630752563476562, 0.010704994201660156, 0.01277923583984375, 0.014853477478027344, 0.016927719116210938, 0.01900196075439453, 0.021076202392578125, 0.02315044403076172, 0.025224685668945312, 0.027298927307128906, 0.0293731689453125, 0.031447410583496094, 0.03352165222167969, 0.03559589385986328, 0.037670135498046875, 0.03974437713623047, 0.04181861877441406, 0.043892860412597656, 0.04596710205078125, 0.048041343688964844, 0.05011558532714844, 0.05218982696533203, 0.054264068603515625, 0.05633831024169922, 0.05841255187988281, 0.060486793518066406, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 13.0, 33.0, 42.0, 62.0, 98.0, 145.0, 196.0, 152.0, 105.0, 47.0, 40.0, 29.0, 10.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.620237350463867, -2.541998863220215, -2.4637603759765625, -2.385521650314331, -2.3072831630706787, -2.2290446758270264, -2.150806188583374, -2.0725677013397217, -1.9943290948867798, -1.9160906076431274, -1.8378520011901855, -1.7596135139465332, -1.6813750267028809, -1.603136420249939, -1.5248979330062866, -1.4466593265533447, -1.3684208393096924, -1.29018235206604, -1.2119437456130981, -1.1337052583694458, -1.055466651916504, -0.9772281646728516, -0.8989896774291992, -0.8207511305809021, -0.742512583732605, -0.6642740368843079, -0.5860354900360107, -0.5077970027923584, -0.4295584559440613, -0.35131990909576416, -0.27308139204978943, -0.1948428750038147, -0.11660432815551758, -0.03836579620838165, 0.03987273573875427, 0.1181112676858902, 0.19634979963302612, 0.27458834648132324, 0.352826863527298, 0.4310653805732727, 0.5093039274215698, 0.5875424742698669, 0.6657810211181641, 0.7440195083618164, 0.8222580552101135, 0.9004966020584106, 0.978735089302063, 1.0569736957550049, 1.1352121829986572, 1.2134506702423096, 1.2916892766952515, 1.3699277639389038, 1.4481663703918457, 1.526404857635498, 1.6046433448791504, 1.6828818321228027, 1.7611204385757446, 1.839358925819397, 1.9175975322723389, 1.9958360195159912, 2.0740745067596436, 2.152313232421875, 2.2305517196655273, 2.3087902069091797, 2.387028694152832]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 3.0, 7.0, 12.0, 21.0, 21.0, 18.0, 17.0, 27.0, 28.0, 34.0, 37.0, 38.0, 35.0, 38.0, 47.0, 43.0, 41.0, 41.0, 27.0, 46.0, 40.0, 49.0, 34.0, 33.0, 30.0, 30.0, 31.0, 27.0, 21.0, 20.0, 9.0, 7.0, 20.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9393354058265686, -0.9121330976486206, -0.8849307894706726, -0.8577284812927246, -0.8305262327194214, -0.8033239245414734, -0.7761216163635254, -0.7489193081855774, -0.7217170000076294, -0.6945146918296814, -0.6673123836517334, -0.6401101350784302, -0.6129078269004822, -0.5857055187225342, -0.5585032105445862, -0.5313009023666382, -0.504098653793335, -0.47689634561538696, -0.44969406723976135, -0.42249175906181335, -0.39528948068618774, -0.36808717250823975, -0.34088486433029175, -0.31368255615234375, -0.28648027777671814, -0.25927796959877014, -0.23207569122314453, -0.20487338304519653, -0.17767108976840973, -0.15046879649162292, -0.12326648831367493, -0.09606419503688812, -0.06886190176010132, -0.041659604758024216, -0.014457307755947113, 0.012744992971420288, 0.03994728624820709, 0.0671495795249939, 0.0943518877029419, 0.1215541809797287, 0.1487564742565155, 0.1759587675333023, 0.2031610608100891, 0.2303633689880371, 0.2575656771659851, 0.2847679555416107, 0.3119702637195587, 0.3391725420951843, 0.3663748502731323, 0.3935771584510803, 0.42077943682670593, 0.44798174500465393, 0.47518402338027954, 0.5023863315582275, 0.5295886397361755, 0.5567909479141235, 0.5839931964874268, 0.6111955046653748, 0.6383978128433228, 0.665600061416626, 0.692802369594574, 0.720004677772522, 0.74720698595047, 0.774409294128418, 0.801611602306366]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 7.0, 16.0, 12.0, 33.0, 37.0, 41.0, 50.0, 69.0, 115.0, 182.0, 279.0, 471.0, 820.0, 1381.0, 2596.0, 5119.0, 10773.0, 24766.0, 60498.0, 157344.0, 343180.0, 261970.0, 104436.0, 40859.0, 17267.0, 7853.0, 3695.0, 1915.0, 1006.0, 600.0, 358.0, 242.0, 179.0, 122.0, 76.0, 58.0, 33.0, 22.0, 21.0, 14.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3674583435058594, -0.35552215576171875, -0.3435859680175781, -0.3316497802734375, -0.3197135925292969, -0.30777740478515625, -0.2958412170410156, -0.283905029296875, -0.2719688415527344, -0.26003265380859375, -0.24809646606445312, -0.2361602783203125, -0.22422409057617188, -0.21228790283203125, -0.20035171508789062, -0.18841552734375, -0.17647933959960938, -0.16454315185546875, -0.15260696411132812, -0.1406707763671875, -0.12873458862304688, -0.11679840087890625, -0.10486221313476562, -0.092926025390625, -0.08098983764648438, -0.06905364990234375, -0.057117462158203125, -0.0451812744140625, -0.033245086669921875, -0.02130889892578125, -0.009372711181640625, 0.0025634765625, 0.014499664306640625, 0.02643585205078125, 0.038372039794921875, 0.0503082275390625, 0.062244415283203125, 0.07418060302734375, 0.08611679077148438, 0.098052978515625, 0.10998916625976562, 0.12192535400390625, 0.13386154174804688, 0.1457977294921875, 0.15773391723632812, 0.16967010498046875, 0.18160629272460938, 0.19354248046875, 0.20547866821289062, 0.21741485595703125, 0.22935104370117188, 0.2412872314453125, 0.2532234191894531, 0.26515960693359375, 0.2770957946777344, 0.289031982421875, 0.3009681701660156, 0.31290435791015625, 0.3248405456542969, 0.3367767333984375, 0.3487129211425781, 0.36064910888671875, 0.3725852966308594, 0.384521484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 11.0, 12.0, 11.0, 20.0, 15.0, 14.0, 23.0, 19.0, 30.0, 37.0, 36.0, 36.0, 40.0, 29.0, 44.0, 36.0, 39.0, 54.0, 48.0, 47.0, 31.0, 45.0, 42.0, 37.0, 37.0, 29.0, 31.0, 19.0, 16.0, 16.0, 14.0, 11.0, 13.0, 6.0, 8.0, 5.0, 4.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.45703125, -5.3033447265625, -5.149658203125, -4.9959716796875, -4.84228515625, -4.6885986328125, -4.534912109375, -4.3812255859375, -4.2275390625, -4.0738525390625, -3.920166015625, -3.7664794921875, -3.61279296875, -3.4591064453125, -3.305419921875, -3.1517333984375, -2.998046875, -2.8443603515625, -2.690673828125, -2.5369873046875, -2.38330078125, -2.2296142578125, -2.075927734375, -1.9222412109375, -1.7685546875, -1.6148681640625, -1.461181640625, -1.3074951171875, -1.15380859375, -1.0001220703125, -0.846435546875, -0.6927490234375, -0.5390625, -0.3853759765625, -0.231689453125, -0.0780029296875, 0.07568359375, 0.2293701171875, 0.383056640625, 0.5367431640625, 0.6904296875, 0.8441162109375, 0.997802734375, 1.1514892578125, 1.30517578125, 1.4588623046875, 1.612548828125, 1.7662353515625, 1.919921875, 2.0736083984375, 2.227294921875, 2.3809814453125, 2.53466796875, 2.6883544921875, 2.842041015625, 2.9957275390625, 3.1494140625, 3.3031005859375, 3.456787109375, 3.6104736328125, 3.76416015625, 3.9178466796875, 4.071533203125, 4.2252197265625, 4.37890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 10.0, 6.0, 9.0, 22.0, 13.0, 21.0, 29.0, 31.0, 41.0, 52.0, 58.0, 85.0, 124.0, 210.0, 385.0, 1213.0, 10878.0, 1012088.0, 20779.0, 1371.0, 450.0, 189.0, 108.0, 70.0, 62.0, 47.0, 42.0, 37.0, 22.0, 15.0, 14.0, 12.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.157867431640625, -3.06378173828125, -2.969696044921875, -2.8756103515625, -2.781524658203125, -2.68743896484375, -2.593353271484375, -2.499267578125, -2.405181884765625, -2.31109619140625, -2.217010498046875, -2.1229248046875, -2.028839111328125, -1.93475341796875, -1.840667724609375, -1.74658203125, -1.652496337890625, -1.55841064453125, -1.464324951171875, -1.3702392578125, -1.276153564453125, -1.18206787109375, -1.087982177734375, -0.993896484375, -0.899810791015625, -0.80572509765625, -0.711639404296875, -0.6175537109375, -0.523468017578125, -0.42938232421875, -0.335296630859375, -0.2412109375, -0.147125244140625, -0.05303955078125, 0.041046142578125, 0.1351318359375, 0.229217529296875, 0.32330322265625, 0.417388916015625, 0.511474609375, 0.605560302734375, 0.69964599609375, 0.793731689453125, 0.8878173828125, 0.981903076171875, 1.07598876953125, 1.170074462890625, 1.26416015625, 1.358245849609375, 1.45233154296875, 1.546417236328125, 1.6405029296875, 1.734588623046875, 1.82867431640625, 1.922760009765625, 2.016845703125, 2.110931396484375, 2.20501708984375, 2.299102783203125, 2.3931884765625, 2.487274169921875, 2.58135986328125, 2.675445556640625, 2.76953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 11.0, 5.0, 7.0, 20.0, 11.0, 18.0, 25.0, 26.0, 34.0, 34.0, 35.0, 33.0, 52.0, 40.0, 36.0, 46.0, 51.0, 51.0, 49.0, 43.0, 35.0, 34.0, 35.0, 35.0, 34.0, 24.0, 31.0, 29.0, 16.0, 16.0, 13.0, 10.0, 11.0, 10.0, 12.0, 5.0, 2.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99945068359375, -4.8504638671875, -4.70147705078125, -4.552490234375, -4.40350341796875, -4.2545166015625, -4.10552978515625, -3.95654296875, -3.80755615234375, -3.6585693359375, -3.50958251953125, -3.360595703125, -3.21160888671875, -3.0626220703125, -2.91363525390625, -2.7646484375, -2.61566162109375, -2.4666748046875, -2.31768798828125, -2.168701171875, -2.01971435546875, -1.8707275390625, -1.72174072265625, -1.57275390625, -1.42376708984375, -1.2747802734375, -1.12579345703125, -0.976806640625, -0.82781982421875, -0.6788330078125, -0.52984619140625, -0.380859375, -0.23187255859375, -0.0828857421875, 0.06610107421875, 0.215087890625, 0.36407470703125, 0.5130615234375, 0.66204833984375, 0.81103515625, 0.96002197265625, 1.1090087890625, 1.25799560546875, 1.406982421875, 1.55596923828125, 1.7049560546875, 1.85394287109375, 2.0029296875, 2.15191650390625, 2.3009033203125, 2.44989013671875, 2.598876953125, 2.74786376953125, 2.8968505859375, 3.04583740234375, 3.19482421875, 3.34381103515625, 3.4927978515625, 3.64178466796875, 3.790771484375, 3.93975830078125, 4.0887451171875, 4.23773193359375, 4.38671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 8.0, 13.0, 9.0, 17.0, 14.0, 33.0, 31.0, 56.0, 62.0, 98.0, 164.0, 239.0, 396.0, 774.0, 1334.0, 2655.0, 5988.0, 16645.0, 92354.0, 818880.0, 81647.0, 15690.0, 5710.0, 2542.0, 1323.0, 694.0, 411.0, 244.0, 146.0, 118.0, 74.0, 46.0, 37.0, 26.0, 15.0, 16.0, 10.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.14990234375, -0.1451396942138672, -0.14037704467773438, -0.13561439514160156, -0.13085174560546875, -0.12608909606933594, -0.12132644653320312, -0.11656379699707031, -0.1118011474609375, -0.10703849792480469, -0.10227584838867188, -0.09751319885253906, -0.09275054931640625, -0.08798789978027344, -0.08322525024414062, -0.07846260070800781, -0.073699951171875, -0.06893730163574219, -0.06417465209960938, -0.05941200256347656, -0.05464935302734375, -0.04988670349121094, -0.045124053955078125, -0.04036140441894531, -0.0355987548828125, -0.030836105346679688, -0.026073455810546875, -0.021310806274414062, -0.01654815673828125, -0.011785507202148438, -0.007022857666015625, -0.0022602081298828125, 0.00250244140625, 0.0072650909423828125, 0.012027740478515625, 0.016790390014648438, 0.02155303955078125, 0.026315689086914062, 0.031078338623046875, 0.03584098815917969, 0.0406036376953125, 0.04536628723144531, 0.050128936767578125, 0.05489158630371094, 0.05965423583984375, 0.06441688537597656, 0.06917953491210938, 0.07394218444824219, 0.078704833984375, 0.08346748352050781, 0.08823013305664062, 0.09299278259277344, 0.09775543212890625, 0.10251808166503906, 0.10728073120117188, 0.11204338073730469, 0.1168060302734375, 0.12156867980957031, 0.12633132934570312, 0.13109397888183594, 0.13585662841796875, 0.14061927795410156, 0.14538192749023438, 0.1501445770263672, 0.1549072265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 29.0, 115.0, 453.0, 266.0, 61.0, 21.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.128715515136719e-05, -6.92959874868393e-05, -6.73048198223114e-05, -6.531365215778351e-05, -6.332248449325562e-05, -6.133131682872772e-05, -5.934014916419983e-05, -5.7348981499671936e-05, -5.535781383514404e-05, -5.336664617061615e-05, -5.137547850608826e-05, -4.9384310841560364e-05, -4.739314317703247e-05, -4.540197551250458e-05, -4.3410807847976685e-05, -4.141964018344879e-05, -3.94284725189209e-05, -3.7437304854393005e-05, -3.544613718986511e-05, -3.345496952533722e-05, -3.1463801860809326e-05, -2.9472634196281433e-05, -2.748146653175354e-05, -2.5490298867225647e-05, -2.3499131202697754e-05, -2.150796353816986e-05, -1.9516795873641968e-05, -1.7525628209114075e-05, -1.553446054458618e-05, -1.3543292880058289e-05, -1.1552125215530396e-05, -9.560957551002502e-06, -7.569789886474609e-06, -5.578622221946716e-06, -3.5874545574188232e-06, -1.5962868928909302e-06, 3.948807716369629e-07, 2.386048436164856e-06, 4.377216100692749e-06, 6.368383765220642e-06, 8.359551429748535e-06, 1.0350719094276428e-05, 1.2341886758804321e-05, 1.4333054423332214e-05, 1.6324222087860107e-05, 1.8315389752388e-05, 2.0306557416915894e-05, 2.2297725081443787e-05, 2.428889274597168e-05, 2.6280060410499573e-05, 2.8271228075027466e-05, 3.026239573955536e-05, 3.225356340408325e-05, 3.4244731068611145e-05, 3.623589873313904e-05, 3.822706639766693e-05, 4.0218234062194824e-05, 4.220940172672272e-05, 4.420056939125061e-05, 4.6191737055778503e-05, 4.8182904720306396e-05, 5.017407238483429e-05, 5.216524004936218e-05, 5.4156407713890076e-05, 5.614757537841797e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 5.0, 10.0, 10.0, 31.0, 40.0, 55.0, 91.0, 161.0, 300.0, 612.0, 1469.0, 4791.0, 21665.0, 666509.0, 329105.0, 17157.0, 3995.0, 1339.0, 558.0, 259.0, 163.0, 84.0, 52.0, 27.0, 20.0, 17.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17557525634765625, -0.1685333251953125, -0.16149139404296875, -0.154449462890625, -0.14740753173828125, -0.1403656005859375, -0.13332366943359375, -0.12628173828125, -0.11923980712890625, -0.1121978759765625, -0.10515594482421875, -0.098114013671875, -0.09107208251953125, -0.0840301513671875, -0.07698822021484375, -0.0699462890625, -0.06290435791015625, -0.0558624267578125, -0.04882049560546875, -0.041778564453125, -0.03473663330078125, -0.0276947021484375, -0.02065277099609375, -0.01361083984375, -0.00656890869140625, 0.0004730224609375, 0.00751495361328125, 0.014556884765625, 0.02159881591796875, 0.0286407470703125, 0.03568267822265625, 0.042724609375, 0.04976654052734375, 0.0568084716796875, 0.06385040283203125, 0.070892333984375, 0.07793426513671875, 0.0849761962890625, 0.09201812744140625, 0.09906005859375, 0.10610198974609375, 0.1131439208984375, 0.12018585205078125, 0.127227783203125, 0.13426971435546875, 0.1413116455078125, 0.14835357666015625, 0.1553955078125, 0.16243743896484375, 0.1694793701171875, 0.17652130126953125, 0.183563232421875, 0.19060516357421875, 0.1976470947265625, 0.20468902587890625, 0.21173095703125, 0.21877288818359375, 0.2258148193359375, 0.23285675048828125, 0.239898681640625, 0.24694061279296875, 0.2539825439453125, 0.26102447509765625, 0.26806640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 9.0, 15.0, 29.0, 43.0, 90.0, 198.0, 237.0, 145.0, 87.0, 43.0, 29.0, 23.0, 13.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1058349609375, -0.10308170318603516, -0.10032844543457031, -0.09757518768310547, -0.09482192993164062, -0.09206867218017578, -0.08931541442871094, -0.0865621566772461, -0.08380889892578125, -0.0810556411743164, -0.07830238342285156, -0.07554912567138672, -0.07279586791992188, -0.07004261016845703, -0.06728935241699219, -0.06453609466552734, -0.0617828369140625, -0.059029579162597656, -0.05627632141113281, -0.05352306365966797, -0.050769805908203125, -0.04801654815673828, -0.04526329040527344, -0.042510032653808594, -0.03975677490234375, -0.037003517150878906, -0.03425025939941406, -0.03149700164794922, -0.028743743896484375, -0.02599048614501953, -0.023237228393554688, -0.020483970642089844, -0.017730712890625, -0.014977455139160156, -0.012224197387695312, -0.009470939636230469, -0.006717681884765625, -0.003964424133300781, -0.0012111663818359375, 0.0015420913696289062, 0.00429534912109375, 0.007048606872558594, 0.009801864624023438, 0.012555122375488281, 0.015308380126953125, 0.01806163787841797, 0.020814895629882812, 0.023568153381347656, 0.0263214111328125, 0.029074668884277344, 0.03182792663574219, 0.03458118438720703, 0.037334442138671875, 0.04008769989013672, 0.04284095764160156, 0.045594215393066406, 0.04834747314453125, 0.051100730895996094, 0.05385398864746094, 0.05660724639892578, 0.059360504150390625, 0.06211376190185547, 0.06486701965332031, 0.06762027740478516, 0.07037353515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 19.0, 17.0, 16.0, 34.0, 53.0, 49.0, 66.0, 102.0, 119.0, 116.0, 97.0, 82.0, 57.0, 44.0, 28.0, 26.0, 21.0, 13.0, 6.0, 10.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.479384660720825, -2.399658441543579, -2.319932460784912, -2.240206241607666, -2.16048002243042, -2.080754041671753, -2.001027822494507, -1.9213017225265503, -1.8415756225585938, -1.7618495225906372, -1.6821233034133911, -1.6023972034454346, -1.522671103477478, -1.4429450035095215, -1.3632187843322754, -1.2834926843643188, -1.2037664651870728, -1.1240403652191162, -1.0443141460418701, -0.9645880460739136, -0.884861946105957, -0.8051357865333557, -0.7254096269607544, -0.6456835269927979, -0.5659573674201965, -0.4862312376499176, -0.40650510787963867, -0.32677894830703735, -0.24705281853675842, -0.1673266887664795, -0.08760052919387817, -0.00787442922592163, 0.07185173034667969, 0.15157786011695862, 0.23130400478839874, 0.31103014945983887, 0.3907562792301178, 0.47048240900039673, 0.550208568572998, 0.6299346685409546, 0.7096608281135559, 0.7893869876861572, 0.8691130876541138, 0.9488392472267151, 1.0285654067993164, 1.108291506767273, 1.1880176067352295, 1.2677438259124756, 1.3474699258804321, 1.4271960258483887, 1.5069222450256348, 1.5866483449935913, 1.6663744449615479, 1.746100664138794, 1.8258267641067505, 1.905552864074707, 1.9852790832519531, 2.065005302429199, 2.144731283187866, 2.2244575023651123, 2.3041837215423584, 2.3839097023010254, 2.4636359214782715, 2.5433621406555176, 2.6230881214141846]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 11.0, 6.0, 6.0, 9.0, 13.0, 9.0, 9.0, 22.0, 21.0, 28.0, 28.0, 25.0, 28.0, 37.0, 26.0, 38.0, 31.0, 35.0, 27.0, 53.0, 40.0, 33.0, 34.0, 36.0, 43.0, 39.0, 29.0, 34.0, 28.0, 25.0, 29.0, 25.0, 24.0, 13.0, 21.0, 21.0, 11.0, 9.0, 9.0, 13.0, 3.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.507295608520508, -6.283201217651367, -6.059106349945068, -5.8350114822387695, -5.610917091369629, -5.386822700500488, -5.1627278327941895, -4.938632965087891, -4.71453857421875, -4.490444183349609, -4.2663493156433105, -4.042254447937012, -3.818160057067871, -3.5940654277801514, -3.3699707984924316, -3.145876169204712, -2.921781539916992, -2.6976869106292725, -2.4735922813415527, -2.249497652053833, -2.0254030227661133, -1.8013083934783936, -1.5772137641906738, -1.353119134902954, -1.1290245056152344, -0.9049298763275146, -0.6808352470397949, -0.4567406177520752, -0.23264598846435547, -0.008551359176635742, 0.21554327011108398, 0.4396378993988037, 0.6637330055236816, 0.8878276348114014, 1.111922264099121, 1.3360168933868408, 1.5601115226745605, 1.7842061519622803, 2.00830078125, 2.2323954105377197, 2.4564900398254395, 2.680584669113159, 2.904679298400879, 3.1287739276885986, 3.3528685569763184, 3.576963186264038, 3.801057815551758, 4.025152206420898, 4.249247074127197, 4.473341941833496, 4.697436332702637, 4.921530723571777, 5.145625591278076, 5.369720458984375, 5.593814849853516, 5.817909240722656, 6.042004108428955, 6.266098976135254, 6.4901933670043945, 6.714287757873535, 6.938382625579834, 7.162477493286133, 7.386571884155273, 7.610666275024414, 7.834761142730713]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 12.0, 9.0, 8.0, 21.0, 22.0, 26.0, 48.0, 99.0, 156.0, 277.0, 616.0, 1469.0, 3742.0, 10691.0, 59128.0, 2125065.0, 1921191.0, 54649.0, 10837.0, 3561.0, 1409.0, 583.0, 268.0, 130.0, 69.0, 59.0, 16.0, 20.0, 13.0, 11.0, 13.0, 18.0, 7.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.009429931640625, -2.91534423828125, -2.821258544921875, -2.7271728515625, -2.633087158203125, -2.53900146484375, -2.444915771484375, -2.350830078125, -2.256744384765625, -2.16265869140625, -2.068572998046875, -1.9744873046875, -1.880401611328125, -1.78631591796875, -1.692230224609375, -1.59814453125, -1.504058837890625, -1.40997314453125, -1.315887451171875, -1.2218017578125, -1.127716064453125, -1.03363037109375, -0.939544677734375, -0.845458984375, -0.751373291015625, -0.65728759765625, -0.563201904296875, -0.4691162109375, -0.375030517578125, -0.28094482421875, -0.186859130859375, -0.0927734375, 0.001312255859375, 0.09539794921875, 0.189483642578125, 0.2835693359375, 0.377655029296875, 0.47174072265625, 0.565826416015625, 0.659912109375, 0.753997802734375, 0.84808349609375, 0.942169189453125, 1.0362548828125, 1.130340576171875, 1.22442626953125, 1.318511962890625, 1.41259765625, 1.506683349609375, 1.60076904296875, 1.694854736328125, 1.7889404296875, 1.883026123046875, 1.97711181640625, 2.071197509765625, 2.165283203125, 2.259368896484375, 2.35345458984375, 2.447540283203125, 2.5416259765625, 2.635711669921875, 2.72979736328125, 2.823883056640625, 2.91796875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 7.0, 19.0, 9.0, 15.0, 23.0, 23.0, 28.0, 26.0, 37.0, 36.0, 37.0, 32.0, 39.0, 43.0, 48.0, 50.0, 44.0, 49.0, 42.0, 55.0, 44.0, 31.0, 33.0, 29.0, 32.0, 28.0, 25.0, 20.0, 19.0, 13.0, 9.0, 6.0, 7.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.2216796875, -1.1895370483398438, -1.1573944091796875, -1.1252517700195312, -1.093109130859375, -1.0609664916992188, -1.0288238525390625, -0.9966812133789062, -0.96453857421875, -0.9323959350585938, -0.9002532958984375, -0.8681106567382812, -0.835968017578125, -0.8038253784179688, -0.7716827392578125, -0.7395401000976562, -0.7073974609375, -0.6752548217773438, -0.6431121826171875, -0.6109695434570312, -0.578826904296875, -0.5466842651367188, -0.5145416259765625, -0.48239898681640625, -0.45025634765625, -0.41811370849609375, -0.3859710693359375, -0.35382843017578125, -0.321685791015625, -0.28954315185546875, -0.2574005126953125, -0.22525787353515625, -0.193115234375, -0.16097259521484375, -0.1288299560546875, -0.09668731689453125, -0.064544677734375, -0.03240203857421875, -0.0002593994140625, 0.03188323974609375, 0.06402587890625, 0.09616851806640625, 0.1283111572265625, 0.16045379638671875, 0.192596435546875, 0.22473907470703125, 0.2568817138671875, 0.28902435302734375, 0.3211669921875, 0.35330963134765625, 0.3854522705078125, 0.41759490966796875, 0.449737548828125, 0.48188018798828125, 0.5140228271484375, 0.5461654663085938, 0.57830810546875, 0.6104507446289062, 0.6425933837890625, 0.6747360229492188, 0.706878662109375, 0.7390213012695312, 0.7711639404296875, 0.8033065795898438, 0.83544921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 20.0, 37.0, 114.0, 1006.0, 4192238.0, 634.0, 114.0, 40.0, 27.0, 8.0, 14.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -21.9296875, -20.953125, -19.9765625, -19.0, -18.0234375, -17.046875, -16.0703125, -15.09375, -14.1171875, -13.140625, -12.1640625, -11.1875, -10.2109375, -9.234375, -8.2578125, -7.28125, -6.3046875, -5.328125, -4.3515625, -3.375, -2.3984375, -1.421875, -0.4453125, 0.53125, 1.5078125, 2.484375, 3.4609375, 4.4375, 5.4140625, 6.390625, 7.3671875, 8.34375, 9.3203125, 10.296875, 11.2734375, 12.25, 13.2265625, 14.203125, 15.1796875, 16.15625, 17.1328125, 18.109375, 19.0859375, 20.0625, 21.0390625, 22.015625, 22.9921875, 23.96875, 24.9453125, 25.921875, 26.8984375, 27.875, 28.8515625, 29.828125, 30.8046875, 31.78125, 32.7578125, 33.734375, 34.7109375, 35.6875, 36.6640625, 37.640625, 38.6171875, 39.59375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 5.0, 15.0, 15.0, 37.0, 27.0, 49.0, 65.0, 106.0, 157.0, 351.0, 758.0, 1122.0, 624.0, 294.0, 138.0, 85.0, 54.0, 45.0, 29.0, 23.0, 21.0, 9.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71826171875, -0.6973495483398438, -0.6764373779296875, -0.6555252075195312, -0.634613037109375, -0.6137008666992188, -0.5927886962890625, -0.5718765258789062, -0.55096435546875, -0.5300521850585938, -0.5091400146484375, -0.48822784423828125, -0.467315673828125, -0.44640350341796875, -0.4254913330078125, -0.40457916259765625, -0.3836669921875, -0.36275482177734375, -0.3418426513671875, -0.32093048095703125, -0.300018310546875, -0.27910614013671875, -0.2581939697265625, -0.23728179931640625, -0.21636962890625, -0.19545745849609375, -0.1745452880859375, -0.15363311767578125, -0.132720947265625, -0.11180877685546875, -0.0908966064453125, -0.06998443603515625, -0.049072265625, -0.02816009521484375, -0.0072479248046875, 0.01366424560546875, 0.034576416015625, 0.05548858642578125, 0.0764007568359375, 0.09731292724609375, 0.11822509765625, 0.13913726806640625, 0.1600494384765625, 0.18096160888671875, 0.201873779296875, 0.22278594970703125, 0.2436981201171875, 0.26461029052734375, 0.2855224609375, 0.30643463134765625, 0.3273468017578125, 0.34825897216796875, 0.369171142578125, 0.39008331298828125, 0.4109954833984375, 0.43190765380859375, 0.45281982421875, 0.47373199462890625, 0.4946441650390625, 0.5155563354492188, 0.536468505859375, 0.5573806762695312, 0.5782928466796875, 0.5992050170898438, 0.6201171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 18.0, 18.0, 28.0, 27.0, 32.0, 61.0, 96.0, 105.0, 97.0, 135.0, 85.0, 73.0, 53.0, 37.0, 34.0, 19.0, 16.0, 11.0, 9.0, 6.0, 8.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5102577209472656, -2.450434684753418, -2.3906118869781494, -2.3307888507843018, -2.270966053009033, -2.2111430168151855, -2.151320219039917, -2.0914971828460693, -2.031674385070801, -1.9718514680862427, -1.9120285511016846, -1.8522056341171265, -1.7923827171325684, -1.7325596809387207, -1.6727367639541626, -1.6129138469696045, -1.5530908107757568, -1.4932678937911987, -1.4334449768066406, -1.3736220598220825, -1.3137991428375244, -1.2539761066436768, -1.1941531896591187, -1.1343302726745605, -1.0745073556900024, -1.0146844387054443, -0.9548615217208862, -0.8950385451316833, -0.8352156281471252, -0.7753927111625671, -0.7155697345733643, -0.6557468175888062, -0.5959240198135376, -0.5361011028289795, -0.476278156042099, -0.4164552092552185, -0.3566322922706604, -0.2968093752861023, -0.2369864284992218, -0.1771634817123413, -0.1173405647277832, -0.057517632842063904, 0.0023052990436553955, 0.062128230929374695, 0.121951162815094, 0.1817740797996521, 0.2415970265865326, 0.3014199733734131, 0.3612428903579712, 0.4210658073425293, 0.4808887541294098, 0.5407117009162903, 0.6005346179008484, 0.6603575348854065, 0.7201805114746094, 0.7800034284591675, 0.8398263454437256, 0.8996492624282837, 0.9594721794128418, 1.0192950963974, 1.079118013381958, 1.1389410495758057, 1.1987639665603638, 1.2585868835449219, 1.31840980052948]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 15.0, 13.0, 14.0, 19.0, 28.0, 32.0, 31.0, 35.0, 33.0, 27.0, 25.0, 27.0, 33.0, 45.0, 51.0, 53.0, 46.0, 39.0, 42.0, 42.0, 32.0, 33.0, 37.0, 29.0, 23.0, 30.0, 26.0, 26.0, 11.0, 15.0, 7.0, 12.0, 6.0, 6.0, 4.0, 8.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1077584028244019, -1.0767717361450195, -1.0457850694656372, -1.0147982835769653, -0.983811616897583, -0.9528249502182007, -0.9218382835388184, -0.8908515572547913, -0.8598648309707642, -0.8288781642913818, -0.7978914380073547, -0.7669047713279724, -0.7359180450439453, -0.704931378364563, -0.6739447116851807, -0.6429579854011536, -0.6119713187217712, -0.5809846520423889, -0.5499979257583618, -0.5190112590789795, -0.4880245327949524, -0.45703786611557007, -0.42605116963386536, -0.39506447315216064, -0.36407777667045593, -0.3330910801887512, -0.3021043837070465, -0.2711176872253418, -0.24013100564479828, -0.20914430916309357, -0.17815762758255005, -0.14717093110084534, -0.11618417501449585, -0.08519747853279114, -0.05421078950166702, -0.023224100470542908, 0.007762596011161804, 0.038749292492866516, 0.06973597407341003, 0.10072267055511475, 0.13170936703681946, 0.16269606351852417, 0.19368276000022888, 0.2246694415807724, 0.2556561231613159, 0.286642849445343, 0.31762951612472534, 0.34861621260643005, 0.37960290908813477, 0.4105896055698395, 0.4415763020515442, 0.4725629687309265, 0.5035496950149536, 0.5345363616943359, 0.5655230283737183, 0.5965097546577454, 0.6274964809417725, 0.6584831476211548, 0.6894698739051819, 0.7204565405845642, 0.7514432668685913, 0.7824299335479736, 0.813416600227356, 0.8444033265113831, 0.8753899931907654]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 45.0, 82.0, 82.0, 114.0, 158.0, 217.0, 304.0, 486.0, 743.0, 1149.0, 1955.0, 3142.0, 5618.0, 10458.0, 22197.0, 51631.0, 140810.0, 387232.0, 264109.0, 87930.0, 35092.0, 15674.0, 7851.0, 4342.0, 2573.0, 1562.0, 984.0, 584.0, 417.0, 260.0, 188.0, 149.0, 102.0, 70.0, 50.0, 22.0, 28.0, 16.0, 17.0, 11.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.488037109375, -0.4731483459472656, -0.45825958251953125, -0.4433708190917969, -0.4284820556640625, -0.4135932922363281, -0.39870452880859375, -0.3838157653808594, -0.368927001953125, -0.3540382385253906, -0.33914947509765625, -0.3242607116699219, -0.3093719482421875, -0.2944831848144531, -0.27959442138671875, -0.2647056579589844, -0.24981689453125, -0.23492813110351562, -0.22003936767578125, -0.20515060424804688, -0.1902618408203125, -0.17537307739257812, -0.16048431396484375, -0.14559555053710938, -0.130706787109375, -0.11581802368164062, -0.10092926025390625, -0.08604049682617188, -0.0711517333984375, -0.056262969970703125, -0.04137420654296875, -0.026485443115234375, -0.0115966796875, 0.003292083740234375, 0.01818084716796875, 0.033069610595703125, 0.0479583740234375, 0.06284713745117188, 0.07773590087890625, 0.09262466430664062, 0.107513427734375, 0.12240219116210938, 0.13729095458984375, 0.15217971801757812, 0.1670684814453125, 0.18195724487304688, 0.19684600830078125, 0.21173477172851562, 0.22662353515625, 0.24151229858398438, 0.25640106201171875, 0.2712898254394531, 0.2861785888671875, 0.3010673522949219, 0.31595611572265625, 0.3308448791503906, 0.345733642578125, 0.3606224060058594, 0.37551116943359375, 0.3903999328613281, 0.4052886962890625, 0.4201774597167969, 0.43506622314453125, 0.4499549865722656, 0.46484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 6.0, 10.0, 11.0, 5.0, 10.0, 14.0, 23.0, 35.0, 33.0, 22.0, 43.0, 37.0, 34.0, 27.0, 39.0, 37.0, 57.0, 47.0, 45.0, 51.0, 49.0, 39.0, 46.0, 29.0, 33.0, 23.0, 26.0, 29.0, 24.0, 21.0, 12.0, 16.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 9.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.796875, -0.774658203125, -0.75244140625, -0.730224609375, -0.7080078125, -0.685791015625, -0.66357421875, -0.641357421875, -0.619140625, -0.596923828125, -0.57470703125, -0.552490234375, -0.5302734375, -0.508056640625, -0.48583984375, -0.463623046875, -0.44140625, -0.419189453125, -0.39697265625, -0.374755859375, -0.3525390625, -0.330322265625, -0.30810546875, -0.285888671875, -0.263671875, -0.241455078125, -0.21923828125, -0.197021484375, -0.1748046875, -0.152587890625, -0.13037109375, -0.108154296875, -0.0859375, -0.063720703125, -0.04150390625, -0.019287109375, 0.0029296875, 0.025146484375, 0.04736328125, 0.069580078125, 0.091796875, 0.114013671875, 0.13623046875, 0.158447265625, 0.1806640625, 0.202880859375, 0.22509765625, 0.247314453125, 0.26953125, 0.291748046875, 0.31396484375, 0.336181640625, 0.3583984375, 0.380615234375, 0.40283203125, 0.425048828125, 0.447265625, 0.469482421875, 0.49169921875, 0.513916015625, 0.5361328125, 0.558349609375, 0.58056640625, 0.602783203125, 0.625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 8.0, 10.0, 13.0, 19.0, 19.0, 24.0, 50.0, 72.0, 74.0, 136.0, 177.0, 270.0, 450.0, 604.0, 1059.0, 1822.0, 3393.0, 6704.0, 14834.0, 38305.0, 115876.0, 385495.0, 326855.0, 93807.0, 31969.0, 12940.0, 5936.0, 3014.0, 1744.0, 1015.0, 614.0, 361.0, 275.0, 168.0, 127.0, 86.0, 67.0, 48.0, 34.0, 17.0, 18.0, 13.0, 6.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.487060546875, -0.4722633361816406, -0.45746612548828125, -0.4426689147949219, -0.4278717041015625, -0.4130744934082031, -0.39827728271484375, -0.3834800720214844, -0.368682861328125, -0.3538856506347656, -0.33908843994140625, -0.3242912292480469, -0.3094940185546875, -0.2946968078613281, -0.27989959716796875, -0.2651023864746094, -0.25030517578125, -0.23550796508789062, -0.22071075439453125, -0.20591354370117188, -0.1911163330078125, -0.17631912231445312, -0.16152191162109375, -0.14672470092773438, -0.131927490234375, -0.11713027954101562, -0.10233306884765625, -0.08753585815429688, -0.0727386474609375, -0.057941436767578125, -0.04314422607421875, -0.028347015380859375, -0.0135498046875, 0.001247406005859375, 0.01604461669921875, 0.030841827392578125, 0.0456390380859375, 0.060436248779296875, 0.07523345947265625, 0.09003067016601562, 0.104827880859375, 0.11962509155273438, 0.13442230224609375, 0.14921951293945312, 0.1640167236328125, 0.17881393432617188, 0.19361114501953125, 0.20840835571289062, 0.22320556640625, 0.23800277709960938, 0.25279998779296875, 0.2675971984863281, 0.2823944091796875, 0.2971916198730469, 0.31198883056640625, 0.3267860412597656, 0.341583251953125, 0.3563804626464844, 0.37117767333984375, 0.3859748840332031, 0.4007720947265625, 0.4155693054199219, 0.43036651611328125, 0.4451637268066406, 0.4599609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 16.0, 12.0, 22.0, 23.0, 22.0, 37.0, 29.0, 47.0, 42.0, 42.0, 63.0, 55.0, 64.0, 60.0, 68.0, 62.0, 57.0, 34.0, 45.0, 40.0, 41.0, 28.0, 13.0, 18.0, 19.0, 7.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9990234375, -1.9416961669921875, -1.884368896484375, -1.8270416259765625, -1.76971435546875, -1.7123870849609375, -1.655059814453125, -1.5977325439453125, -1.5404052734375, -1.4830780029296875, -1.425750732421875, -1.3684234619140625, -1.31109619140625, -1.2537689208984375, -1.196441650390625, -1.1391143798828125, -1.081787109375, -1.0244598388671875, -0.967132568359375, -0.9098052978515625, -0.85247802734375, -0.7951507568359375, -0.737823486328125, -0.6804962158203125, -0.6231689453125, -0.5658416748046875, -0.508514404296875, -0.4511871337890625, -0.39385986328125, -0.3365325927734375, -0.279205322265625, -0.2218780517578125, -0.16455078125, -0.1072235107421875, -0.049896240234375, 0.0074310302734375, 0.06475830078125, 0.1220855712890625, 0.179412841796875, 0.2367401123046875, 0.2940673828125, 0.3513946533203125, 0.408721923828125, 0.4660491943359375, 0.52337646484375, 0.5807037353515625, 0.638031005859375, 0.6953582763671875, 0.752685546875, 0.8100128173828125, 0.867340087890625, 0.9246673583984375, 0.98199462890625, 1.0393218994140625, 1.096649169921875, 1.1539764404296875, 1.2113037109375, 1.2686309814453125, 1.325958251953125, 1.3832855224609375, 1.44061279296875, 1.4979400634765625, 1.555267333984375, 1.6125946044921875, 1.669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 16.0, 18.0, 27.0, 33.0, 70.0, 124.0, 163.0, 284.0, 531.0, 960.0, 2233.0, 5241.0, 16280.0, 63873.0, 369235.0, 476382.0, 81931.0, 20028.0, 6236.0, 2441.0, 1108.0, 590.0, 315.0, 168.0, 94.0, 49.0, 42.0, 19.0, 12.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12181282043457031, -0.11789321899414062, -0.11397361755371094, -0.11005401611328125, -0.10613441467285156, -0.10221481323242188, -0.09829521179199219, -0.0943756103515625, -0.09045600891113281, -0.08653640747070312, -0.08261680603027344, -0.07869720458984375, -0.07477760314941406, -0.07085800170898438, -0.06693840026855469, -0.063018798828125, -0.05909919738769531, -0.055179595947265625, -0.05125999450683594, -0.04734039306640625, -0.04342079162597656, -0.039501190185546875, -0.03558158874511719, -0.0316619873046875, -0.027742385864257812, -0.023822784423828125, -0.019903182983398438, -0.01598358154296875, -0.012063980102539062, -0.008144378662109375, -0.0042247772216796875, -0.00030517578125, 0.0036144256591796875, 0.007534027099609375, 0.011453628540039062, 0.01537322998046875, 0.019292831420898438, 0.023212432861328125, 0.027132034301757812, 0.0310516357421875, 0.03497123718261719, 0.038890838623046875, 0.04281044006347656, 0.04673004150390625, 0.05064964294433594, 0.054569244384765625, 0.05848884582519531, 0.062408447265625, 0.06632804870605469, 0.07024765014648438, 0.07416725158691406, 0.07808685302734375, 0.08200645446777344, 0.08592605590820312, 0.08984565734863281, 0.0937652587890625, 0.09768486022949219, 0.10160446166992188, 0.10552406311035156, 0.10944366455078125, 0.11336326599121094, 0.11728286743164062, 0.12120246887207031, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 10.0, 12.0, 16.0, 19.0, 27.0, 32.0, 44.0, 58.0, 63.0, 77.0, 122.0, 100.0, 97.0, 79.0, 57.0, 39.0, 30.0, 28.0, 16.0, 15.0, 9.0, 8.0, 12.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.975101470947266e-05, -7.766392081975937e-05, -7.557682693004608e-05, -7.34897330403328e-05, -7.140263915061951e-05, -6.931554526090622e-05, -6.722845137119293e-05, -6.514135748147964e-05, -6.305426359176636e-05, -6.096716970205307e-05, -5.888007581233978e-05, -5.6792981922626495e-05, -5.470588803291321e-05, -5.261879414319992e-05, -5.053170025348663e-05, -4.8444606363773346e-05, -4.635751247406006e-05, -4.427041858434677e-05, -4.2183324694633484e-05, -4.0096230804920197e-05, -3.800913691520691e-05, -3.592204302549362e-05, -3.3834949135780334e-05, -3.174785524606705e-05, -2.966076135635376e-05, -2.7573667466640472e-05, -2.5486573576927185e-05, -2.3399479687213898e-05, -2.131238579750061e-05, -1.9225291907787323e-05, -1.7138198018074036e-05, -1.5051104128360748e-05, -1.2964010238647461e-05, -1.0876916348934174e-05, -8.789822459220886e-06, -6.702728569507599e-06, -4.6156346797943115e-06, -2.528540790081024e-06, -4.414469003677368e-07, 1.6456469893455505e-06, 3.732740879058838e-06, 5.819834768772125e-06, 7.906928658485413e-06, 9.9940225481987e-06, 1.2081116437911987e-05, 1.4168210327625275e-05, 1.6255304217338562e-05, 1.834239810705185e-05, 2.0429491996765137e-05, 2.2516585886478424e-05, 2.460367977619171e-05, 2.6690773665905e-05, 2.8777867555618286e-05, 3.0864961445331573e-05, 3.295205533504486e-05, 3.503914922475815e-05, 3.7126243114471436e-05, 3.921333700418472e-05, 4.130043089389801e-05, 4.33875247836113e-05, 4.5474618673324585e-05, 4.756171256303787e-05, 4.964880645275116e-05, 5.173590034246445e-05, 5.3822994232177734e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 9.0, 13.0, 5.0, 17.0, 25.0, 29.0, 36.0, 55.0, 128.0, 328.0, 835.0, 2394.0, 7607.0, 30121.0, 180654.0, 665984.0, 127269.0, 23585.0, 6176.0, 1971.0, 700.0, 278.0, 120.0, 81.0, 39.0, 23.0, 21.0, 10.0, 6.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13149642944335938, -0.12651824951171875, -0.12154006958007812, -0.1165618896484375, -0.11158370971679688, -0.10660552978515625, -0.10162734985351562, -0.096649169921875, -0.09167098999023438, -0.08669281005859375, -0.08171463012695312, -0.0767364501953125, -0.07175827026367188, -0.06678009033203125, -0.061801910400390625, -0.05682373046875, -0.051845550537109375, -0.04686737060546875, -0.041889190673828125, -0.0369110107421875, -0.031932830810546875, -0.02695465087890625, -0.021976470947265625, -0.016998291015625, -0.012020111083984375, -0.00704193115234375, -0.002063751220703125, 0.0029144287109375, 0.007892608642578125, 0.01287078857421875, 0.017848968505859375, 0.0228271484375, 0.027805328369140625, 0.03278350830078125, 0.037761688232421875, 0.0427398681640625, 0.047718048095703125, 0.05269622802734375, 0.057674407958984375, 0.062652587890625, 0.06763076782226562, 0.07260894775390625, 0.07758712768554688, 0.0825653076171875, 0.08754348754882812, 0.09252166748046875, 0.09749984741210938, 0.10247802734375, 0.10745620727539062, 0.11243438720703125, 0.11741256713867188, 0.1223907470703125, 0.12736892700195312, 0.13234710693359375, 0.13732528686523438, 0.142303466796875, 0.14728164672851562, 0.15225982666015625, 0.15723800659179688, 0.1622161865234375, 0.16719436645507812, 0.17217254638671875, 0.17715072631835938, 0.18212890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 0.0, 5.0, 7.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 27.0, 28.0, 39.0, 56.0, 55.0, 55.0, 62.0, 71.0, 83.0, 92.0, 68.0, 63.0, 28.0, 35.0, 27.0, 28.0, 29.0, 7.0, 12.0, 10.0, 13.0, 7.0, 8.0, 6.0, 7.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032318115234375, -0.031420230865478516, -0.03052234649658203, -0.029624462127685547, -0.028726577758789062, -0.027828693389892578, -0.026930809020996094, -0.02603292465209961, -0.025135040283203125, -0.02423715591430664, -0.023339271545410156, -0.022441387176513672, -0.021543502807617188, -0.020645618438720703, -0.01974773406982422, -0.018849849700927734, -0.01795196533203125, -0.017054080963134766, -0.01615619659423828, -0.015258312225341797, -0.014360427856445312, -0.013462543487548828, -0.012564659118652344, -0.01166677474975586, -0.010768890380859375, -0.00987100601196289, -0.008973121643066406, -0.008075237274169922, -0.0071773529052734375, -0.006279468536376953, -0.005381584167480469, -0.004483699798583984, -0.0035858154296875, -0.0026879310607910156, -0.0017900466918945312, -0.0008921623229980469, 5.7220458984375e-06, 0.0009036064147949219, 0.0018014907836914062, 0.0026993751525878906, 0.003597259521484375, 0.004495143890380859, 0.005393028259277344, 0.006290912628173828, 0.0071887969970703125, 0.008086681365966797, 0.008984565734863281, 0.009882450103759766, 0.01078033447265625, 0.011678218841552734, 0.012576103210449219, 0.013473987579345703, 0.014371871948242188, 0.015269756317138672, 0.016167640686035156, 0.01706552505493164, 0.017963409423828125, 0.01886129379272461, 0.019759178161621094, 0.020657062530517578, 0.021554946899414062, 0.022452831268310547, 0.02335071563720703, 0.024248600006103516, 0.025146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 23.0, 37.0, 29.0, 68.0, 137.0, 200.0, 207.0, 105.0, 73.0, 37.0, 26.0, 17.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.530160665512085, -2.473973512649536, -2.4177865982055664, -2.3615994453430176, -2.305412530899048, -2.249225378036499, -2.1930384635925293, -2.1368513107299805, -2.0806641578674316, -2.024477005004883, -1.968290090560913, -1.9121030569076538, -1.8559160232543945, -1.7997288703918457, -1.7435418367385864, -1.6873548030853271, -1.6311678886413574, -1.5749808549880981, -1.5187938213348389, -1.4626067876815796, -1.4064197540283203, -1.3502326011657715, -1.2940455675125122, -1.237858533859253, -1.1816715002059937, -1.1254844665527344, -1.069297432899475, -1.0131103992462158, -0.9569233059883118, -0.9007362723350525, -0.8445491790771484, -0.7883621454238892, -0.7321751117706299, -0.6759880781173706, -0.6198010444641113, -0.5636139512062073, -0.507426917552948, -0.4512398838996887, -0.39505282044410706, -0.3388657569885254, -0.2826787233352661, -0.22649167478084564, -0.17030462622642517, -0.1141175776720047, -0.05793052911758423, -0.0017434954643249512, 0.054443567991256714, 0.11063063144683838, 0.16681766510009766, 0.22300471365451813, 0.2791917622089386, 0.33537882566452026, 0.39156585931777954, 0.4477528929710388, 0.5039399862289429, 0.5601270198822021, 0.6163140535354614, 0.6725010871887207, 0.72868812084198, 0.784875214099884, 0.8410622477531433, 0.8972492814064026, 0.9534363746643066, 1.009623408317566, 1.0658104419708252]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 5.0, 6.0, 18.0, 9.0, 15.0, 20.0, 27.0, 30.0, 32.0, 38.0, 33.0, 29.0, 18.0, 36.0, 53.0, 33.0, 49.0, 47.0, 31.0, 63.0, 37.0, 36.0, 41.0, 34.0, 40.0, 25.0, 31.0, 22.0, 27.0, 20.0, 12.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 9.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7298775911331177, -0.708768367767334, -0.6876590847969055, -0.666549801826477, -0.6454405784606934, -0.6243313550949097, -0.6032220721244812, -0.5821127891540527, -0.561003565788269, -0.5398943424224854, -0.5187850594520569, -0.4976758062839508, -0.4765665531158447, -0.45545729994773865, -0.43434804677963257, -0.4132387936115265, -0.3921295404434204, -0.37102028727531433, -0.34991103410720825, -0.3288017809391022, -0.3076925277709961, -0.28658327460289, -0.26547402143478394, -0.24436476826667786, -0.22325551509857178, -0.2021462619304657, -0.18103700876235962, -0.15992775559425354, -0.13881850242614746, -0.11770924925804138, -0.0965999960899353, -0.07549074292182922, -0.054381489753723145, -0.033272236585617065, -0.012162983417510986, 0.008946269750595093, 0.030055522918701172, 0.05116477608680725, 0.07227402925491333, 0.09338328242301941, 0.11449253559112549, 0.13560178875923157, 0.15671104192733765, 0.17782029509544373, 0.1989295482635498, 0.22003880143165588, 0.24114805459976196, 0.26225730776786804, 0.2833665609359741, 0.3044758141040802, 0.3255850672721863, 0.34669432044029236, 0.36780357360839844, 0.3889128267765045, 0.4100220799446106, 0.4311313331127167, 0.45224058628082275, 0.47334983944892883, 0.4944590926170349, 0.5155683755874634, 0.5366775989532471, 0.5577868223190308, 0.5788961052894592, 0.6000053882598877, 0.6211146116256714]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 12.0, 19.0, 23.0, 34.0, 45.0, 68.0, 107.0, 118.0, 188.0, 259.0, 394.0, 541.0, 890.0, 1363.0, 2385.0, 5039.0, 12823.0, 47464.0, 290005.0, 557730.0, 92988.0, 20907.0, 7014.0, 3245.0, 1678.0, 1074.0, 622.0, 440.0, 308.0, 205.0, 148.0, 105.0, 69.0, 62.0, 46.0, 39.0, 23.0, 15.0, 9.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.491943359375, -0.47509765625, -0.458251953125, -0.44140625, -0.424560546875, -0.40771484375, -0.390869140625, -0.3740234375, -0.357177734375, -0.34033203125, -0.323486328125, -0.306640625, -0.289794921875, -0.27294921875, -0.256103515625, -0.2392578125, -0.222412109375, -0.20556640625, -0.188720703125, -0.171875, -0.155029296875, -0.13818359375, -0.121337890625, -0.1044921875, -0.087646484375, -0.07080078125, -0.053955078125, -0.037109375, -0.020263671875, -0.00341796875, 0.013427734375, 0.0302734375, 0.047119140625, 0.06396484375, 0.080810546875, 0.09765625, 0.114501953125, 0.13134765625, 0.148193359375, 0.1650390625, 0.181884765625, 0.19873046875, 0.215576171875, 0.232421875, 0.249267578125, 0.26611328125, 0.282958984375, 0.2998046875, 0.316650390625, 0.33349609375, 0.350341796875, 0.3671875, 0.384033203125, 0.40087890625, 0.417724609375, 0.4345703125, 0.451416015625, 0.46826171875, 0.485107421875, 0.501953125, 0.518798828125, 0.53564453125, 0.552490234375, 0.5693359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 6.0, 4.0, 11.0, 8.0, 14.0, 8.0, 12.0, 19.0, 23.0, 31.0, 26.0, 35.0, 35.0, 28.0, 42.0, 36.0, 43.0, 44.0, 48.0, 43.0, 46.0, 56.0, 44.0, 43.0, 42.0, 25.0, 28.0, 24.0, 31.0, 28.0, 24.0, 22.0, 18.0, 17.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.01220703125, -1.9541015625, -1.89599609375, -1.837890625, -1.77978515625, -1.7216796875, -1.66357421875, -1.60546875, -1.54736328125, -1.4892578125, -1.43115234375, -1.373046875, -1.31494140625, -1.2568359375, -1.19873046875, -1.140625, -1.08251953125, -1.0244140625, -0.96630859375, -0.908203125, -0.85009765625, -0.7919921875, -0.73388671875, -0.67578125, -0.61767578125, -0.5595703125, -0.50146484375, -0.443359375, -0.38525390625, -0.3271484375, -0.26904296875, -0.2109375, -0.15283203125, -0.0947265625, -0.03662109375, 0.021484375, 0.07958984375, 0.1376953125, 0.19580078125, 0.25390625, 0.31201171875, 0.3701171875, 0.42822265625, 0.486328125, 0.54443359375, 0.6025390625, 0.66064453125, 0.71875, 0.77685546875, 0.8349609375, 0.89306640625, 0.951171875, 1.00927734375, 1.0673828125, 1.12548828125, 1.18359375, 1.24169921875, 1.2998046875, 1.35791015625, 1.416015625, 1.47412109375, 1.5322265625, 1.59033203125, 1.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 12.0, 15.0, 25.0, 24.0, 22.0, 30.0, 36.0, 47.0, 68.0, 122.0, 487.0, 989194.0, 57705.0, 306.0, 98.0, 60.0, 46.0, 50.0, 32.0, 39.0, 29.0, 22.0, 20.0, 14.0, 15.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.5701904296875, -5.355224609375, -5.1402587890625, -4.92529296875, -4.7103271484375, -4.495361328125, -4.2803955078125, -4.0654296875, -3.8504638671875, -3.635498046875, -3.4205322265625, -3.20556640625, -2.9906005859375, -2.775634765625, -2.5606689453125, -2.345703125, -2.1307373046875, -1.915771484375, -1.7008056640625, -1.48583984375, -1.2708740234375, -1.055908203125, -0.8409423828125, -0.6259765625, -0.4110107421875, -0.196044921875, 0.0189208984375, 0.23388671875, 0.4488525390625, 0.663818359375, 0.8787841796875, 1.09375, 1.3087158203125, 1.523681640625, 1.7386474609375, 1.95361328125, 2.1685791015625, 2.383544921875, 2.5985107421875, 2.8134765625, 3.0284423828125, 3.243408203125, 3.4583740234375, 3.67333984375, 3.8883056640625, 4.103271484375, 4.3182373046875, 4.533203125, 4.7481689453125, 4.963134765625, 5.1781005859375, 5.39306640625, 5.6080322265625, 5.822998046875, 6.0379638671875, 6.2529296875, 6.4678955078125, 6.682861328125, 6.8978271484375, 7.11279296875, 7.3277587890625, 7.542724609375, 7.7576904296875, 7.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 9.0, 11.0, 15.0, 28.0, 24.0, 23.0, 30.0, 38.0, 37.0, 63.0, 68.0, 62.0, 84.0, 58.0, 54.0, 56.0, 47.0, 43.0, 51.0, 39.0, 30.0, 30.0, 23.0, 24.0, 8.0, 17.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.218841552734375, -2.13299560546875, -2.047149658203125, -1.9613037109375, -1.875457763671875, -1.78961181640625, -1.703765869140625, -1.617919921875, -1.532073974609375, -1.44622802734375, -1.360382080078125, -1.2745361328125, -1.188690185546875, -1.10284423828125, -1.016998291015625, -0.93115234375, -0.845306396484375, -0.75946044921875, -0.673614501953125, -0.5877685546875, -0.501922607421875, -0.41607666015625, -0.330230712890625, -0.244384765625, -0.158538818359375, -0.07269287109375, 0.013153076171875, 0.0989990234375, 0.184844970703125, 0.27069091796875, 0.356536865234375, 0.4423828125, 0.528228759765625, 0.61407470703125, 0.699920654296875, 0.7857666015625, 0.871612548828125, 0.95745849609375, 1.043304443359375, 1.129150390625, 1.214996337890625, 1.30084228515625, 1.386688232421875, 1.4725341796875, 1.558380126953125, 1.64422607421875, 1.730072021484375, 1.81591796875, 1.901763916015625, 1.98760986328125, 2.073455810546875, 2.1593017578125, 2.245147705078125, 2.33099365234375, 2.416839599609375, 2.502685546875, 2.588531494140625, 2.67437744140625, 2.760223388671875, 2.8460693359375, 2.931915283203125, 3.01776123046875, 3.103607177734375, 3.189453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 10.0, 21.0, 38.0, 145.0, 925.0, 151996.0, 893694.0, 1468.0, 156.0, 47.0, 16.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6500625610351562, -0.6140899658203125, -0.5781173706054688, -0.542144775390625, -0.5061721801757812, -0.4701995849609375, -0.43422698974609375, -0.39825439453125, -0.36228179931640625, -0.3263092041015625, -0.29033660888671875, -0.254364013671875, -0.21839141845703125, -0.1824188232421875, -0.14644622802734375, -0.1104736328125, -0.07450103759765625, -0.0385284423828125, -0.00255584716796875, 0.033416748046875, 0.06938934326171875, 0.1053619384765625, 0.14133453369140625, 0.17730712890625, 0.21327972412109375, 0.2492523193359375, 0.28522491455078125, 0.321197509765625, 0.35717010498046875, 0.3931427001953125, 0.42911529541015625, 0.465087890625, 0.5010604858398438, 0.5370330810546875, 0.5730056762695312, 0.608978271484375, 0.6449508666992188, 0.6809234619140625, 0.7168960571289062, 0.75286865234375, 0.7888412475585938, 0.8248138427734375, 0.8607864379882812, 0.896759033203125, 0.9327316284179688, 0.9687042236328125, 1.0046768188476562, 1.0406494140625, 1.0766220092773438, 1.1125946044921875, 1.1485671997070312, 1.184539794921875, 1.2205123901367188, 1.2564849853515625, 1.2924575805664062, 1.32843017578125, 1.3644027709960938, 1.4003753662109375, 1.4363479614257812, 1.472320556640625, 1.5082931518554688, 1.5442657470703125, 1.5802383422851562, 1.6162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 2.0, 12.0, 14.0, 7.0, 10.0, 19.0, 18.0, 36.0, 43.0, 82.0, 124.0, 213.0, 145.0, 102.0, 49.0, 22.0, 30.0, 17.0, 8.0, 16.0, 2.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.637932240962982e-05, -3.526732325553894e-05, -3.415532410144806e-05, -3.304332494735718e-05, -3.1931325793266296e-05, -3.0819326639175415e-05, -2.9707327485084534e-05, -2.8595328330993652e-05, -2.748332917690277e-05, -2.637133002281189e-05, -2.5259330868721008e-05, -2.4147331714630127e-05, -2.3035332560539246e-05, -2.1923333406448364e-05, -2.0811334252357483e-05, -1.96993350982666e-05, -1.858733594417572e-05, -1.747533679008484e-05, -1.6363337635993958e-05, -1.5251338481903076e-05, -1.4139339327812195e-05, -1.3027340173721313e-05, -1.1915341019630432e-05, -1.080334186553955e-05, -9.69134271144867e-06, -8.579343557357788e-06, -7.467344403266907e-06, -6.355345249176025e-06, -5.243346095085144e-06, -4.131346940994263e-06, -3.0193477869033813e-06, -1.9073486328125e-06, -7.953494787216187e-07, 3.166496753692627e-07, 1.428648829460144e-06, 2.5406479835510254e-06, 3.6526471376419067e-06, 4.764646291732788e-06, 5.8766454458236694e-06, 6.988644599914551e-06, 8.100643754005432e-06, 9.212642908096313e-06, 1.0324642062187195e-05, 1.1436641216278076e-05, 1.2548640370368958e-05, 1.3660639524459839e-05, 1.477263867855072e-05, 1.58846378326416e-05, 1.6996636986732483e-05, 1.8108636140823364e-05, 1.9220635294914246e-05, 2.0332634449005127e-05, 2.1444633603096008e-05, 2.255663275718689e-05, 2.366863191127777e-05, 2.4780631065368652e-05, 2.5892630219459534e-05, 2.7004629373550415e-05, 2.8116628527641296e-05, 2.9228627681732178e-05, 3.034062683582306e-05, 3.145262598991394e-05, 3.256462514400482e-05, 3.36766242980957e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 17.0, 18.0, 52.0, 203.0, 1307.0, 34506.0, 1005344.0, 6271.0, 600.0, 121.0, 41.0, 19.0, 14.0, 6.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0888671875, -1.0625, -1.0361328125, -1.009765625, -0.9833984375, -0.95703125, -0.9306640625, -0.904296875, -0.8779296875, -0.8515625, -0.8251953125, -0.798828125, -0.7724609375, -0.74609375, -0.7197265625, -0.693359375, -0.6669921875, -0.640625, -0.6142578125, -0.587890625, -0.5615234375, -0.53515625, -0.5087890625, -0.482421875, -0.4560546875, -0.4296875, -0.4033203125, -0.376953125, -0.3505859375, -0.32421875, -0.2978515625, -0.271484375, -0.2451171875, -0.21875, -0.1923828125, -0.166015625, -0.1396484375, -0.11328125, -0.0869140625, -0.060546875, -0.0341796875, -0.0078125, 0.0185546875, 0.044921875, 0.0712890625, 0.09765625, 0.1240234375, 0.150390625, 0.1767578125, 0.203125, 0.2294921875, 0.255859375, 0.2822265625, 0.30859375, 0.3349609375, 0.361328125, 0.3876953125, 0.4140625, 0.4404296875, 0.466796875, 0.4931640625, 0.51953125, 0.5458984375, 0.572265625, 0.5986328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 18.0, 32.0, 46.0, 69.0, 128.0, 232.0, 189.0, 111.0, 57.0, 36.0, 25.0, 11.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.0897207260131836, -0.08624076843261719, -0.08276081085205078, -0.07928085327148438, -0.07580089569091797, -0.07232093811035156, -0.06884098052978516, -0.06536102294921875, -0.061881065368652344, -0.05840110778808594, -0.05492115020751953, -0.051441192626953125, -0.04796123504638672, -0.04448127746582031, -0.041001319885253906, -0.0375213623046875, -0.034041404724121094, -0.030561447143554688, -0.02708148956298828, -0.023601531982421875, -0.02012157440185547, -0.016641616821289062, -0.013161659240722656, -0.00968170166015625, -0.006201744079589844, -0.0027217864990234375, 0.0007581710815429688, 0.004238128662109375, 0.007718086242675781, 0.011198043823242188, 0.014678001403808594, 0.018157958984375, 0.021637916564941406, 0.025117874145507812, 0.02859783172607422, 0.032077789306640625, 0.03555774688720703, 0.03903770446777344, 0.042517662048339844, 0.04599761962890625, 0.049477577209472656, 0.05295753479003906, 0.05643749237060547, 0.059917449951171875, 0.06339740753173828, 0.06687736511230469, 0.0703573226928711, 0.0738372802734375, 0.0773172378540039, 0.08079719543457031, 0.08427715301513672, 0.08775711059570312, 0.09123706817626953, 0.09471702575683594, 0.09819698333740234, 0.10167694091796875, 0.10515689849853516, 0.10863685607910156, 0.11211681365966797, 0.11559677124023438, 0.11907672882080078, 0.12255668640136719, 0.1260366439819336, 0.1295166015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 11.0, 23.0, 27.0, 48.0, 63.0, 116.0, 168.0, 193.0, 128.0, 74.0, 48.0, 28.0, 26.0, 11.0, 12.0, 4.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.985243320465088, -2.889725923538208, -2.7942087650299072, -2.6986913681030273, -2.6031739711761475, -2.5076565742492676, -2.412139415740967, -2.316622018814087, -2.221104621887207, -2.125587224960327, -2.0300700664520264, -1.9345526695251465, -1.8390352725982666, -1.7435179948806763, -1.648000717163086, -1.552483320236206, -1.4569661617279053, -1.361448884010315, -1.265931487083435, -1.1704142093658447, -1.0748968124389648, -0.9793795347213745, -0.8838622570037842, -0.7883449196815491, -0.692827582359314, -0.5973102450370789, -0.5017929077148438, -0.4062756299972534, -0.3107582926750183, -0.2152409553527832, -0.11972367763519287, -0.024206340312957764, 0.07131099700927734, 0.16682831943035126, 0.26234564185142517, 0.3578629493713379, 0.453380286693573, 0.5488976240158081, 0.6444149017333984, 0.7399322390556335, 0.8354495763778687, 0.9309669137001038, 1.0264842510223389, 1.1220015287399292, 1.2175188064575195, 1.3130362033843994, 1.4085534811019897, 1.50407075881958, 1.59958815574646, 1.6951054334640503, 1.7906228303909302, 1.8861401081085205, 1.9816575050354004, 2.077174663543701, 2.172692060470581, 2.268209457397461, 2.3637266159057617, 2.4592440128326416, 2.5547611713409424, 2.6502785682678223, 2.745795965194702, 2.841313362121582, 2.936830520629883, 3.0323479175567627, 3.1278653144836426]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 14.0, 21.0, 24.0, 36.0, 22.0, 26.0, 34.0, 21.0, 39.0, 50.0, 45.0, 47.0, 39.0, 36.0, 46.0, 49.0, 42.0, 40.0, 37.0, 33.0, 33.0, 31.0, 28.0, 21.0, 20.0, 19.0, 12.0, 11.0, 14.0, 14.0, 10.0, 9.0, 5.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6409285068511963, -2.5557265281677246, -2.470524311065674, -2.385322332382202, -2.3001201152801514, -2.2149181365966797, -2.129715919494629, -2.0445139408111572, -1.959311842918396, -1.8741097450256348, -1.7889076471328735, -1.7037055492401123, -1.6185035705566406, -1.5333013534545898, -1.4480993747711182, -1.362897276878357, -1.2776951789855957, -1.1924930810928345, -1.1072909832000732, -1.0220890045166016, -0.9368868470191956, -0.8516847491264343, -0.7664827108383179, -0.6812806129455566, -0.5960785150527954, -0.5108764171600342, -0.42567434906959534, -0.3404722809791565, -0.25527018308639526, -0.17006808519363403, -0.08486604690551758, 0.00033605098724365234, 0.08553814888000488, 0.17074023187160492, 0.25594231486320496, 0.3411443829536438, 0.42634648084640503, 0.5115485787391663, 0.5967506170272827, 0.681952714920044, 0.7671548128128052, 0.8523569107055664, 0.9375590085983276, 1.0227611064910889, 1.1079630851745605, 1.1931653022766113, 1.278367280960083, 1.3635693788528442, 1.4487714767456055, 1.5339735746383667, 1.619175672531128, 1.7043776512145996, 1.7895798683166504, 1.874781847000122, 1.9599839448928833, 2.0451860427856445, 2.1303882598876953, 2.215590238571167, 2.3007924556732178, 2.3859944343566895, 2.4711966514587402, 2.556398630142212, 2.6416006088256836, 2.7268028259277344, 2.812004804611206]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 8.0, 10.0, 10.0, 18.0, 13.0, 20.0, 15.0, 25.0, 34.0, 53.0, 58.0, 93.0, 131.0, 242.0, 390.0, 740.0, 1479.0, 3821.0, 12624.0, 107838.0, 3489281.0, 544494.0, 22975.0, 5720.0, 2053.0, 895.0, 439.0, 246.0, 159.0, 112.0, 77.0, 55.0, 28.0, 28.0, 23.0, 17.0, 21.0, 8.0, 9.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.671722412109375, -2.58172607421875, -2.491729736328125, -2.4017333984375, -2.311737060546875, -2.22174072265625, -2.131744384765625, -2.041748046875, -1.951751708984375, -1.86175537109375, -1.771759033203125, -1.6817626953125, -1.591766357421875, -1.50177001953125, -1.411773681640625, -1.32177734375, -1.231781005859375, -1.14178466796875, -1.051788330078125, -0.9617919921875, -0.871795654296875, -0.78179931640625, -0.691802978515625, -0.601806640625, -0.511810302734375, -0.42181396484375, -0.331817626953125, -0.2418212890625, -0.151824951171875, -0.06182861328125, 0.028167724609375, 0.1181640625, 0.208160400390625, 0.29815673828125, 0.388153076171875, 0.4781494140625, 0.568145751953125, 0.65814208984375, 0.748138427734375, 0.838134765625, 0.928131103515625, 1.01812744140625, 1.108123779296875, 1.1981201171875, 1.288116455078125, 1.37811279296875, 1.468109130859375, 1.55810546875, 1.648101806640625, 1.73809814453125, 1.828094482421875, 1.9180908203125, 2.008087158203125, 2.09808349609375, 2.188079833984375, 2.278076171875, 2.368072509765625, 2.45806884765625, 2.548065185546875, 2.6380615234375, 2.728057861328125, 2.81805419921875, 2.908050537109375, 2.998046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 12.0, 24.0, 17.0, 16.0, 34.0, 24.0, 29.0, 41.0, 34.0, 31.0, 39.0, 41.0, 50.0, 52.0, 58.0, 49.0, 58.0, 49.0, 34.0, 38.0, 33.0, 21.0, 29.0, 27.0, 20.0, 19.0, 25.0, 10.0, 10.0, 8.0, 11.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.800506591796875, -0.77630615234375, -0.752105712890625, -0.7279052734375, -0.703704833984375, -0.67950439453125, -0.655303955078125, -0.631103515625, -0.606903076171875, -0.58270263671875, -0.558502197265625, -0.5343017578125, -0.510101318359375, -0.48590087890625, -0.461700439453125, -0.4375, -0.413299560546875, -0.38909912109375, -0.364898681640625, -0.3406982421875, -0.316497802734375, -0.29229736328125, -0.268096923828125, -0.243896484375, -0.219696044921875, -0.19549560546875, -0.171295166015625, -0.1470947265625, -0.122894287109375, -0.09869384765625, -0.074493408203125, -0.05029296875, -0.026092529296875, -0.00189208984375, 0.022308349609375, 0.0465087890625, 0.070709228515625, 0.09490966796875, 0.119110107421875, 0.143310546875, 0.167510986328125, 0.19171142578125, 0.215911865234375, 0.2401123046875, 0.264312744140625, 0.28851318359375, 0.312713623046875, 0.3369140625, 0.361114501953125, 0.38531494140625, 0.409515380859375, 0.4337158203125, 0.457916259765625, 0.48211669921875, 0.506317138671875, 0.530517578125, 0.554718017578125, 0.57891845703125, 0.603118896484375, 0.6273193359375, 0.651519775390625, 0.67572021484375, 0.699920654296875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 16.0, 14.0, 30.0, 63.0, 95.0, 248.0, 669.0, 14865.0, 4169179.0, 8108.0, 550.0, 201.0, 93.0, 50.0, 34.0, 16.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.605224609375, -7.28076171875, -6.956298828125, -6.6318359375, -6.307373046875, -5.98291015625, -5.658447265625, -5.333984375, -5.009521484375, -4.68505859375, -4.360595703125, -4.0361328125, -3.711669921875, -3.38720703125, -3.062744140625, -2.73828125, -2.413818359375, -2.08935546875, -1.764892578125, -1.4404296875, -1.115966796875, -0.79150390625, -0.467041015625, -0.142578125, 0.181884765625, 0.50634765625, 0.830810546875, 1.1552734375, 1.479736328125, 1.80419921875, 2.128662109375, 2.453125, 2.777587890625, 3.10205078125, 3.426513671875, 3.7509765625, 4.075439453125, 4.39990234375, 4.724365234375, 5.048828125, 5.373291015625, 5.69775390625, 6.022216796875, 6.3466796875, 6.671142578125, 6.99560546875, 7.320068359375, 7.64453125, 7.968994140625, 8.29345703125, 8.617919921875, 8.9423828125, 9.266845703125, 9.59130859375, 9.915771484375, 10.240234375, 10.564697265625, 10.88916015625, 11.213623046875, 11.5380859375, 11.862548828125, 12.18701171875, 12.511474609375, 12.8359375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 9.0, 14.0, 14.0, 15.0, 20.0, 31.0, 44.0, 57.0, 87.0, 147.0, 216.0, 438.0, 737.0, 772.0, 573.0, 288.0, 166.0, 98.0, 85.0, 57.0, 36.0, 30.0, 23.0, 15.0, 20.0, 12.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49462890625, -0.48095703125, -0.46728515625, -0.45361328125, -0.43994140625, -0.42626953125, -0.41259765625, -0.39892578125, -0.38525390625, -0.37158203125, -0.35791015625, -0.34423828125, -0.33056640625, -0.31689453125, -0.30322265625, -0.28955078125, -0.27587890625, -0.26220703125, -0.24853515625, -0.23486328125, -0.22119140625, -0.20751953125, -0.19384765625, -0.18017578125, -0.16650390625, -0.15283203125, -0.13916015625, -0.12548828125, -0.11181640625, -0.09814453125, -0.08447265625, -0.07080078125, -0.05712890625, -0.04345703125, -0.02978515625, -0.01611328125, -0.00244140625, 0.01123046875, 0.02490234375, 0.03857421875, 0.05224609375, 0.06591796875, 0.07958984375, 0.09326171875, 0.10693359375, 0.12060546875, 0.13427734375, 0.14794921875, 0.16162109375, 0.17529296875, 0.18896484375, 0.20263671875, 0.21630859375, 0.22998046875, 0.24365234375, 0.25732421875, 0.27099609375, 0.28466796875, 0.29833984375, 0.31201171875, 0.32568359375, 0.33935546875, 0.35302734375, 0.36669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 2.0, 12.0, 13.0, 20.0, 30.0, 57.0, 69.0, 76.0, 91.0, 112.0, 134.0, 100.0, 75.0, 61.0, 38.0, 24.0, 14.0, 12.0, 8.0, 11.0, 8.0, 4.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296356439590454, -1.8824702501296997, -1.835304856300354, -1.7881394624710083, -1.7409741878509521, -1.6938087940216064, -1.6466434001922607, -1.599478006362915, -1.5523126125335693, -1.5051472187042236, -1.457981824874878, -1.4108164310455322, -1.3636510372161865, -1.3164857625961304, -1.2693203687667847, -1.222154974937439, -1.1749895811080933, -1.1278241872787476, -1.0806587934494019, -1.0334933996200562, -0.9863280653953552, -0.9391626715660095, -0.8919973373413086, -0.8448319435119629, -0.7976665496826172, -0.7505011558532715, -0.7033357620239258, -0.6561704277992249, -0.6090050339698792, -0.5618396401405334, -0.5146743059158325, -0.4675089120864868, -0.42034363746643066, -0.37317824363708496, -0.32601287961006165, -0.27884751558303833, -0.23168212175369263, -0.18451674282550812, -0.1373513638973236, -0.09018599987030029, -0.04302060604095459, 0.004144772887229919, 0.05131015181541443, 0.09847553074359894, 0.14564090967178345, 0.19280628859996796, 0.23997166752815247, 0.2871370315551758, 0.3343024253845215, 0.3814678192138672, 0.4286331832408905, 0.4757985472679138, 0.5229639410972595, 0.5701293349266052, 0.6172946691513062, 0.6644600629806519, 0.7116254568099976, 0.7587908506393433, 0.805956244468689, 0.8531215786933899, 0.9002869725227356, 0.9474523663520813, 0.9946177005767822, 1.041783094406128, 1.0889484882354736]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 5.0, 6.0, 8.0, 6.0, 13.0, 12.0, 17.0, 16.0, 26.0, 24.0, 30.0, 20.0, 30.0, 22.0, 28.0, 26.0, 40.0, 44.0, 38.0, 38.0, 46.0, 31.0, 36.0, 40.0, 38.0, 28.0, 24.0, 25.0, 35.0, 24.0, 28.0, 25.0, 19.0, 15.0, 12.0, 17.0, 16.0, 13.0, 11.0, 7.0, 8.0, 14.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0], "bins": [-0.7717801332473755, -0.7501706480979919, -0.7285611629486084, -0.7069516181945801, -0.6853421330451965, -0.663732647895813, -0.6421231031417847, -0.6205136179924011, -0.5989041328430176, -0.577294647693634, -0.5556851625442505, -0.5340756177902222, -0.5124661326408386, -0.4908566474914551, -0.46924713253974915, -0.4476376175880432, -0.42602813243865967, -0.4044186472892761, -0.3828091323375702, -0.36119961738586426, -0.3395901322364807, -0.31798064708709717, -0.29637113213539124, -0.2747616171836853, -0.25315213203430176, -0.23154263198375702, -0.20993313193321228, -0.18832363188266754, -0.1667141318321228, -0.14510463178157806, -0.12349513173103333, -0.10188563168048859, -0.08027607202529907, -0.058666571974754333, -0.037057071924209595, -0.015447571873664856, 0.006161928176879883, 0.02777142822742462, 0.04938092827796936, 0.0709904283285141, 0.09259992837905884, 0.11420942842960358, 0.13581892848014832, 0.15742842853069305, 0.1790379285812378, 0.20064742863178253, 0.22225692868232727, 0.243866428732872, 0.26547592878341675, 0.2870854139328003, 0.3086949288845062, 0.33030444383621216, 0.3519139289855957, 0.37352341413497925, 0.3951329290866852, 0.4167424440383911, 0.43835192918777466, 0.4599614143371582, 0.48157092928886414, 0.5031804442405701, 0.5247899293899536, 0.5463994145393372, 0.5680088996887207, 0.589618444442749, 0.6112279295921326]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 11.0, 9.0, 25.0, 36.0, 33.0, 51.0, 73.0, 120.0, 190.0, 230.0, 336.0, 505.0, 803.0, 1343.0, 1999.0, 3467.0, 6014.0, 11069.0, 21877.0, 49651.0, 155043.0, 503256.0, 184399.0, 56062.0, 23777.0, 11867.0, 6509.0, 3623.0, 2182.0, 1281.0, 881.0, 584.0, 408.0, 258.0, 173.0, 128.0, 80.0, 55.0, 38.0, 31.0, 22.0, 17.0, 11.0, 3.0, 2.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.36767578125, -0.356719970703125, -0.34576416015625, -0.334808349609375, -0.3238525390625, -0.312896728515625, -0.30194091796875, -0.290985107421875, -0.280029296875, -0.269073486328125, -0.25811767578125, -0.247161865234375, -0.2362060546875, -0.225250244140625, -0.21429443359375, -0.203338623046875, -0.1923828125, -0.181427001953125, -0.17047119140625, -0.159515380859375, -0.1485595703125, -0.137603759765625, -0.12664794921875, -0.115692138671875, -0.104736328125, -0.093780517578125, -0.08282470703125, -0.071868896484375, -0.0609130859375, -0.049957275390625, -0.03900146484375, -0.028045654296875, -0.01708984375, -0.006134033203125, 0.00482177734375, 0.015777587890625, 0.0267333984375, 0.037689208984375, 0.04864501953125, 0.059600830078125, 0.070556640625, 0.081512451171875, 0.09246826171875, 0.103424072265625, 0.1143798828125, 0.125335693359375, 0.13629150390625, 0.147247314453125, 0.158203125, 0.169158935546875, 0.18011474609375, 0.191070556640625, 0.2020263671875, 0.212982177734375, 0.22393798828125, 0.234893798828125, 0.245849609375, 0.256805419921875, 0.26776123046875, 0.278717041015625, 0.2896728515625, 0.300628662109375, 0.31158447265625, 0.322540283203125, 0.33349609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 8.0, 14.0, 10.0, 13.0, 9.0, 17.0, 22.0, 25.0, 25.0, 22.0, 28.0, 27.0, 36.0, 35.0, 46.0, 53.0, 46.0, 41.0, 35.0, 46.0, 49.0, 36.0, 39.0, 21.0, 38.0, 29.0, 40.0, 25.0, 26.0, 18.0, 12.0, 14.0, 11.0, 13.0, 10.0, 6.0, 7.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.51904296875, -0.5046348571777344, -0.49022674560546875, -0.4758186340332031, -0.4614105224609375, -0.4470024108886719, -0.43259429931640625, -0.4181861877441406, -0.403778076171875, -0.3893699645996094, -0.37496185302734375, -0.3605537414550781, -0.3461456298828125, -0.3317375183105469, -0.31732940673828125, -0.3029212951660156, -0.28851318359375, -0.2741050720214844, -0.25969696044921875, -0.24528884887695312, -0.2308807373046875, -0.21647262573242188, -0.20206451416015625, -0.18765640258789062, -0.173248291015625, -0.15884017944335938, -0.14443206787109375, -0.13002395629882812, -0.1156158447265625, -0.10120773315429688, -0.08679962158203125, -0.07239151000976562, -0.0579833984375, -0.043575286865234375, -0.02916717529296875, -0.014759063720703125, -0.0003509521484375, 0.014057159423828125, 0.02846527099609375, 0.042873382568359375, 0.057281494140625, 0.07168960571289062, 0.08609771728515625, 0.10050582885742188, 0.1149139404296875, 0.12932205200195312, 0.14373016357421875, 0.15813827514648438, 0.17254638671875, 0.18695449829101562, 0.20136260986328125, 0.21577072143554688, 0.2301788330078125, 0.24458694458007812, 0.25899505615234375, 0.2734031677246094, 0.287811279296875, 0.3022193908691406, 0.31662750244140625, 0.3310356140136719, 0.3454437255859375, 0.3598518371582031, 0.37425994873046875, 0.3886680603027344, 0.403076171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 12.0, 11.0, 16.0, 32.0, 56.0, 62.0, 89.0, 162.0, 219.0, 400.0, 698.0, 1205.0, 2160.0, 4256.0, 9319.0, 22358.0, 66622.0, 278490.0, 482237.0, 118759.0, 35235.0, 13476.0, 6018.0, 3011.0, 1536.0, 816.0, 491.0, 307.0, 165.0, 96.0, 80.0, 43.0, 27.0, 24.0, 12.0, 12.0, 12.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2923927307128906, -0.28302764892578125, -0.2736625671386719, -0.2642974853515625, -0.2549324035644531, -0.24556732177734375, -0.23620223999023438, -0.226837158203125, -0.21747207641601562, -0.20810699462890625, -0.19874191284179688, -0.1893768310546875, -0.18001174926757812, -0.17064666748046875, -0.16128158569335938, -0.15191650390625, -0.14255142211914062, -0.13318634033203125, -0.12382125854492188, -0.1144561767578125, -0.10509109497070312, -0.09572601318359375, -0.08636093139648438, -0.076995849609375, -0.06763076782226562, -0.05826568603515625, -0.048900604248046875, -0.0395355224609375, -0.030170440673828125, -0.02080535888671875, -0.011440277099609375, -0.0020751953125, 0.007289886474609375, 0.01665496826171875, 0.026020050048828125, 0.0353851318359375, 0.044750213623046875, 0.05411529541015625, 0.06348037719726562, 0.072845458984375, 0.08221054077148438, 0.09157562255859375, 0.10094070434570312, 0.1103057861328125, 0.11967086791992188, 0.12903594970703125, 0.13840103149414062, 0.14776611328125, 0.15713119506835938, 0.16649627685546875, 0.17586135864257812, 0.1852264404296875, 0.19459152221679688, 0.20395660400390625, 0.21332168579101562, 0.222686767578125, 0.23205184936523438, 0.24141693115234375, 0.2507820129394531, 0.2601470947265625, 0.2695121765136719, 0.27887725830078125, 0.2882423400878906, 0.297607421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 10.0, 6.0, 7.0, 10.0, 16.0, 9.0, 29.0, 21.0, 25.0, 23.0, 28.0, 24.0, 43.0, 29.0, 38.0, 47.0, 35.0, 50.0, 32.0, 41.0, 37.0, 50.0, 40.0, 44.0, 38.0, 31.0, 33.0, 28.0, 21.0, 22.0, 13.0, 17.0, 17.0, 16.0, 11.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.89453125, -0.868927001953125, -0.84332275390625, -0.817718505859375, -0.7921142578125, -0.766510009765625, -0.74090576171875, -0.715301513671875, -0.689697265625, -0.664093017578125, -0.63848876953125, -0.612884521484375, -0.5872802734375, -0.561676025390625, -0.53607177734375, -0.510467529296875, -0.48486328125, -0.459259033203125, -0.43365478515625, -0.408050537109375, -0.3824462890625, -0.356842041015625, -0.33123779296875, -0.305633544921875, -0.280029296875, -0.254425048828125, -0.22882080078125, -0.203216552734375, -0.1776123046875, -0.152008056640625, -0.12640380859375, -0.100799560546875, -0.0751953125, -0.049591064453125, -0.02398681640625, 0.001617431640625, 0.0272216796875, 0.052825927734375, 0.07843017578125, 0.104034423828125, 0.129638671875, 0.155242919921875, 0.18084716796875, 0.206451416015625, 0.2320556640625, 0.257659912109375, 0.28326416015625, 0.308868408203125, 0.33447265625, 0.360076904296875, 0.38568115234375, 0.411285400390625, 0.4368896484375, 0.462493896484375, 0.48809814453125, 0.513702392578125, 0.539306640625, 0.564910888671875, 0.59051513671875, 0.616119384765625, 0.6417236328125, 0.667327880859375, 0.69293212890625, 0.718536376953125, 0.744140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 10.0, 17.0, 22.0, 41.0, 70.0, 91.0, 129.0, 175.0, 254.0, 393.0, 643.0, 1107.0, 1989.0, 3899.0, 8491.0, 20573.0, 60794.0, 221003.0, 469716.0, 175889.0, 50035.0, 17564.0, 7359.0, 3583.0, 1833.0, 1042.0, 646.0, 389.0, 233.0, 158.0, 123.0, 82.0, 53.0, 32.0, 31.0, 16.0, 20.0, 12.0, 3.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.05379343032836914, -0.05183124542236328, -0.04986906051635742, -0.04790687561035156, -0.0459446907043457, -0.043982505798339844, -0.042020320892333984, -0.040058135986328125, -0.038095951080322266, -0.036133766174316406, -0.03417158126831055, -0.03220939636230469, -0.030247211456298828, -0.02828502655029297, -0.02632284164428711, -0.02436065673828125, -0.02239847183227539, -0.02043628692626953, -0.018474102020263672, -0.016511917114257812, -0.014549732208251953, -0.012587547302246094, -0.010625362396240234, -0.008663177490234375, -0.006700992584228516, -0.004738807678222656, -0.002776622772216797, -0.0008144378662109375, 0.0011477470397949219, 0.0031099319458007812, 0.005072116851806641, 0.0070343017578125, 0.00899648666381836, 0.010958671569824219, 0.012920856475830078, 0.014883041381835938, 0.016845226287841797, 0.018807411193847656, 0.020769596099853516, 0.022731781005859375, 0.024693965911865234, 0.026656150817871094, 0.028618335723876953, 0.030580520629882812, 0.03254270553588867, 0.03450489044189453, 0.03646707534790039, 0.03842926025390625, 0.04039144515991211, 0.04235363006591797, 0.04431581497192383, 0.04627799987792969, 0.04824018478393555, 0.050202369689941406, 0.052164554595947266, 0.054126739501953125, 0.056088924407958984, 0.058051109313964844, 0.0600132942199707, 0.06197547912597656, 0.06393766403198242, 0.06589984893798828, 0.06786203384399414, 0.06982421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 12.0, 14.0, 26.0, 42.0, 65.0, 120.0, 170.0, 193.0, 116.0, 76.0, 54.0, 32.0, 20.0, 10.0, 10.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.347056478261948e-05, -6.083957850933075e-05, -5.820859223604202e-05, -5.5577605962753296e-05, -5.294661968946457e-05, -5.031563341617584e-05, -4.7684647142887115e-05, -4.505366086959839e-05, -4.242267459630966e-05, -3.9791688323020935e-05, -3.716070204973221e-05, -3.452971577644348e-05, -3.1898729503154755e-05, -2.9267743229866028e-05, -2.66367569565773e-05, -2.4005770683288574e-05, -2.1374784409999847e-05, -1.874379813671112e-05, -1.6112811863422394e-05, -1.3481825590133667e-05, -1.085083931684494e-05, -8.219853043556213e-06, -5.5888667702674866e-06, -2.9578804969787598e-06, -3.2689422369003296e-07, 2.304092049598694e-06, 4.935078322887421e-06, 7.5660645961761475e-06, 1.0197050869464874e-05, 1.2828037142753601e-05, 1.5459023416042328e-05, 1.8090009689331055e-05, 2.072099596261978e-05, 2.3351982235908508e-05, 2.5982968509197235e-05, 2.8613954782485962e-05, 3.124494105577469e-05, 3.3875927329063416e-05, 3.650691360235214e-05, 3.913789987564087e-05, 4.1768886148929596e-05, 4.439987242221832e-05, 4.703085869550705e-05, 4.9661844968795776e-05, 5.22928312420845e-05, 5.492381751537323e-05, 5.755480378866196e-05, 6.0185790061950684e-05, 6.281677633523941e-05, 6.544776260852814e-05, 6.807874888181686e-05, 7.070973515510559e-05, 7.334072142839432e-05, 7.597170770168304e-05, 7.860269397497177e-05, 8.12336802482605e-05, 8.386466652154922e-05, 8.649565279483795e-05, 8.912663906812668e-05, 9.17576253414154e-05, 9.438861161470413e-05, 9.701959788799286e-05, 9.965058416128159e-05, 0.00010228157043457031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 16.0, 18.0, 18.0, 40.0, 91.0, 179.0, 369.0, 1203.0, 4064.0, 19456.0, 188405.0, 739131.0, 80440.0, 10998.0, 2724.0, 803.0, 291.0, 129.0, 60.0, 28.0, 20.0, 16.0, 4.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.12993621826171875, -0.1253509521484375, -0.12076568603515625, -0.116180419921875, -0.11159515380859375, -0.1070098876953125, -0.10242462158203125, -0.09783935546875, -0.09325408935546875, -0.0886688232421875, -0.08408355712890625, -0.079498291015625, -0.07491302490234375, -0.0703277587890625, -0.06574249267578125, -0.0611572265625, -0.05657196044921875, -0.0519866943359375, -0.04740142822265625, -0.042816162109375, -0.03823089599609375, -0.0336456298828125, -0.02906036376953125, -0.02447509765625, -0.01988983154296875, -0.0153045654296875, -0.01071929931640625, -0.006134033203125, -0.00154876708984375, 0.0030364990234375, 0.00762176513671875, 0.01220703125, 0.01679229736328125, 0.0213775634765625, 0.02596282958984375, 0.030548095703125, 0.03513336181640625, 0.0397186279296875, 0.04430389404296875, 0.04888916015625, 0.05347442626953125, 0.0580596923828125, 0.06264495849609375, 0.067230224609375, 0.07181549072265625, 0.0764007568359375, 0.08098602294921875, 0.0855712890625, 0.09015655517578125, 0.0947418212890625, 0.09932708740234375, 0.103912353515625, 0.10849761962890625, 0.1130828857421875, 0.11766815185546875, 0.12225341796875, 0.12683868408203125, 0.1314239501953125, 0.13600921630859375, 0.140594482421875, 0.14517974853515625, 0.1497650146484375, 0.15435028076171875, 0.158935546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 8.0, 12.0, 9.0, 10.0, 17.0, 22.0, 33.0, 37.0, 56.0, 63.0, 70.0, 65.0, 76.0, 74.0, 80.0, 52.0, 60.0, 64.0, 49.0, 28.0, 25.0, 23.0, 8.0, 11.0, 12.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0187530517578125, -0.01811075210571289, -0.01746845245361328, -0.016826152801513672, -0.016183853149414062, -0.015541553497314453, -0.014899253845214844, -0.014256954193115234, -0.013614654541015625, -0.012972354888916016, -0.012330055236816406, -0.011687755584716797, -0.011045455932617188, -0.010403156280517578, -0.009760856628417969, -0.00911855697631836, -0.00847625732421875, -0.00783395767211914, -0.007191658020019531, -0.006549358367919922, -0.0059070587158203125, -0.005264759063720703, -0.004622459411621094, -0.003980159759521484, -0.003337860107421875, -0.0026955604553222656, -0.0020532608032226562, -0.0014109611511230469, -0.0007686614990234375, -0.00012636184692382812, 0.0005159378051757812, 0.0011582374572753906, 0.001800537109375, 0.0024428367614746094, 0.0030851364135742188, 0.003727436065673828, 0.0043697357177734375, 0.005012035369873047, 0.005654335021972656, 0.006296634674072266, 0.006938934326171875, 0.007581233978271484, 0.008223533630371094, 0.008865833282470703, 0.009508132934570312, 0.010150432586669922, 0.010792732238769531, 0.01143503189086914, 0.01207733154296875, 0.01271963119506836, 0.013361930847167969, 0.014004230499267578, 0.014646530151367188, 0.015288829803466797, 0.015931129455566406, 0.016573429107666016, 0.017215728759765625, 0.017858028411865234, 0.018500328063964844, 0.019142627716064453, 0.019784927368164062, 0.020427227020263672, 0.02106952667236328, 0.02171182632446289, 0.0223541259765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 6.0, 7.0, 13.0, 15.0, 42.0, 38.0, 86.0, 109.0, 127.0, 181.0, 139.0, 76.0, 56.0, 32.0, 21.0, 17.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0980820655822754, -1.062807559967041, -1.027532935142517, -0.9922583699226379, -0.9569838047027588, -0.9217092990875244, -0.8864347338676453, -0.8511601686477661, -0.815885603427887, -0.7806110382080078, -0.7453364729881287, -0.7100619077682495, -0.6747874021530151, -0.6395127773284912, -0.6042382717132568, -0.5689637064933777, -0.5336891412734985, -0.4984145760536194, -0.46314001083374023, -0.42786547541618347, -0.3925909101963043, -0.35731634497642517, -0.3220418095588684, -0.28676724433898926, -0.2514926791191101, -0.21621811389923096, -0.180943563580513, -0.14566901326179504, -0.1103944480419159, -0.07511988282203674, -0.03984533250331879, -0.00457078218460083, 0.03070366382598877, 0.06597822159528732, 0.10125277936458588, 0.13652732968330383, 0.17180189490318298, 0.20707646012306213, 0.2423510104417801, 0.27762556076049805, 0.3129001259803772, 0.34817469120025635, 0.3834492564201355, 0.41872379183769226, 0.4539983570575714, 0.48927292227745056, 0.5245474576950073, 0.5598220229148865, 0.5950965881347656, 0.6303711533546448, 0.6656457185745239, 0.7009202837944031, 0.7361948490142822, 0.7714693546295166, 0.8067439198493958, 0.8420184850692749, 0.877293050289154, 0.9125676155090332, 0.9478421807289124, 0.9831167459487915, 1.0183912515640259, 1.0536658763885498, 1.0889403820037842, 1.1242148876190186, 1.1594895124435425]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 6.0, 7.0, 11.0, 17.0, 21.0, 11.0, 19.0, 21.0, 28.0, 29.0, 24.0, 19.0, 37.0, 26.0, 31.0, 34.0, 40.0, 51.0, 37.0, 51.0, 26.0, 38.0, 34.0, 25.0, 31.0, 30.0, 27.0, 35.0, 40.0, 17.0, 17.0, 19.0, 12.0, 18.0, 12.0, 9.0, 9.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0], "bins": [-0.449985146522522, -0.43745124340057373, -0.4249173402786255, -0.41238343715667725, -0.399849534034729, -0.38731563091278076, -0.37478169798851013, -0.3622477948665619, -0.34971389174461365, -0.3371799886226654, -0.32464608550071716, -0.3121121823787689, -0.2995782494544983, -0.28704434633255005, -0.2745104432106018, -0.26197654008865356, -0.24944263696670532, -0.23690873384475708, -0.22437483072280884, -0.2118409126996994, -0.19930700957775116, -0.18677310645580292, -0.17423918843269348, -0.16170528531074524, -0.149171382188797, -0.13663747906684875, -0.12410356849431992, -0.11156965792179108, -0.09903575479984283, -0.08650185167789459, -0.07396794110536575, -0.061434030532836914, -0.04890015721321106, -0.03636625036597252, -0.02383234351873398, -0.011298436671495438, 0.001235470175743103, 0.013769373297691345, 0.026303283870220184, 0.03883719444274902, 0.051371097564697266, 0.06390500068664551, 0.07643891125917435, 0.08897282183170319, 0.10150672495365143, 0.11404062807559967, 0.1265745460987091, 0.13910844922065735, 0.1516423523426056, 0.16417625546455383, 0.17671015858650208, 0.1892440766096115, 0.20177797973155975, 0.214311882853508, 0.22684580087661743, 0.23937970399856567, 0.2519136071205139, 0.26444751024246216, 0.2769814133644104, 0.28951531648635864, 0.3020492196083069, 0.3145831227302551, 0.32711705565452576, 0.339650958776474, 0.35218486189842224]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 13.0, 7.0, 13.0, 18.0, 21.0, 41.0, 62.0, 84.0, 155.0, 225.0, 370.0, 610.0, 1039.0, 1703.0, 2921.0, 5265.0, 10224.0, 21580.0, 59373.0, 283376.0, 500742.0, 100783.0, 31189.0, 13224.0, 6711.0, 3583.0, 2081.0, 1248.0, 662.0, 430.0, 275.0, 208.0, 100.0, 73.0, 52.0, 30.0, 23.0, 15.0, 5.0, 3.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2526664733886719, -0.24263763427734375, -0.23260879516601562, -0.2225799560546875, -0.21255111694335938, -0.20252227783203125, -0.19249343872070312, -0.182464599609375, -0.17243576049804688, -0.16240692138671875, -0.15237808227539062, -0.1423492431640625, -0.13232040405273438, -0.12229156494140625, -0.11226272583007812, -0.10223388671875, -0.09220504760742188, -0.08217620849609375, -0.07214736938476562, -0.0621185302734375, -0.052089691162109375, -0.04206085205078125, -0.032032012939453125, -0.022003173828125, -0.011974334716796875, -0.00194549560546875, 0.008083343505859375, 0.0181121826171875, 0.028141021728515625, 0.03816986083984375, 0.048198699951171875, 0.0582275390625, 0.06825637817382812, 0.07828521728515625, 0.08831405639648438, 0.0983428955078125, 0.10837173461914062, 0.11840057373046875, 0.12842941284179688, 0.138458251953125, 0.14848709106445312, 0.15851593017578125, 0.16854476928710938, 0.1785736083984375, 0.18860244750976562, 0.19863128662109375, 0.20866012573242188, 0.21868896484375, 0.22871780395507812, 0.23874664306640625, 0.24877548217773438, 0.2588043212890625, 0.2688331604003906, 0.27886199951171875, 0.2888908386230469, 0.298919677734375, 0.3089485168457031, 0.31897735595703125, 0.3290061950683594, 0.3390350341796875, 0.3490638732910156, 0.35909271240234375, 0.3691215515136719, 0.379150390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 5.0, 17.0, 20.0, 12.0, 15.0, 24.0, 17.0, 43.0, 30.0, 19.0, 32.0, 41.0, 39.0, 40.0, 48.0, 46.0, 50.0, 43.0, 40.0, 37.0, 44.0, 32.0, 35.0, 30.0, 29.0, 29.0, 31.0, 21.0, 22.0, 11.0, 12.0, 14.0, 13.0, 8.0, 5.0, 7.0, 4.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0517578125, -1.0185546875, -0.9853515625, -0.9521484375, -0.9189453125, -0.8857421875, -0.8525390625, -0.8193359375, -0.7861328125, -0.7529296875, -0.7197265625, -0.6865234375, -0.6533203125, -0.6201171875, -0.5869140625, -0.5537109375, -0.5205078125, -0.4873046875, -0.4541015625, -0.4208984375, -0.3876953125, -0.3544921875, -0.3212890625, -0.2880859375, -0.2548828125, -0.2216796875, -0.1884765625, -0.1552734375, -0.1220703125, -0.0888671875, -0.0556640625, -0.0224609375, 0.0107421875, 0.0439453125, 0.0771484375, 0.1103515625, 0.1435546875, 0.1767578125, 0.2099609375, 0.2431640625, 0.2763671875, 0.3095703125, 0.3427734375, 0.3759765625, 0.4091796875, 0.4423828125, 0.4755859375, 0.5087890625, 0.5419921875, 0.5751953125, 0.6083984375, 0.6416015625, 0.6748046875, 0.7080078125, 0.7412109375, 0.7744140625, 0.8076171875, 0.8408203125, 0.8740234375, 0.9072265625, 0.9404296875, 0.9736328125, 1.0068359375, 1.0400390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 4.0, 10.0, 10.0, 9.0, 17.0, 20.0, 17.0, 20.0, 30.0, 22.0, 33.0, 53.0, 41.0, 35.0, 55.0, 131.0, 844078.0, 203443.0, 124.0, 47.0, 44.0, 46.0, 34.0, 36.0, 27.0, 27.0, 22.0, 18.0, 17.0, 12.0, 12.0, 6.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.29296875, -5.1416015625, -4.990234375, -4.8388671875, -4.6875, -4.5361328125, -4.384765625, -4.2333984375, -4.08203125, -3.9306640625, -3.779296875, -3.6279296875, -3.4765625, -3.3251953125, -3.173828125, -3.0224609375, -2.87109375, -2.7197265625, -2.568359375, -2.4169921875, -2.265625, -2.1142578125, -1.962890625, -1.8115234375, -1.66015625, -1.5087890625, -1.357421875, -1.2060546875, -1.0546875, -0.9033203125, -0.751953125, -0.6005859375, -0.44921875, -0.2978515625, -0.146484375, 0.0048828125, 0.15625, 0.3076171875, 0.458984375, 0.6103515625, 0.76171875, 0.9130859375, 1.064453125, 1.2158203125, 1.3671875, 1.5185546875, 1.669921875, 1.8212890625, 1.97265625, 2.1240234375, 2.275390625, 2.4267578125, 2.578125, 2.7294921875, 2.880859375, 3.0322265625, 3.18359375, 3.3349609375, 3.486328125, 3.6376953125, 3.7890625, 3.9404296875, 4.091796875, 4.2431640625, 4.39453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 16.0, 19.0, 19.0, 20.0, 18.0, 29.0, 29.0, 32.0, 46.0, 46.0, 28.0, 54.0, 37.0, 62.0, 49.0, 55.0, 49.0, 42.0, 39.0, 38.0, 32.0, 26.0, 31.0, 22.0, 28.0, 14.0, 15.0, 10.0, 10.0, 8.0, 8.0, 4.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1552734375, -1.1223373413085938, -1.0894012451171875, -1.0564651489257812, -1.023529052734375, -0.9905929565429688, -0.9576568603515625, -0.9247207641601562, -0.89178466796875, -0.8588485717773438, -0.8259124755859375, -0.7929763793945312, -0.760040283203125, -0.7271041870117188, -0.6941680908203125, -0.6612319946289062, -0.6282958984375, -0.5953598022460938, -0.5624237060546875, -0.5294876098632812, -0.496551513671875, -0.46361541748046875, -0.4306793212890625, -0.39774322509765625, -0.36480712890625, -0.33187103271484375, -0.2989349365234375, -0.26599884033203125, -0.233062744140625, -0.20012664794921875, -0.1671905517578125, -0.13425445556640625, -0.101318359375, -0.06838226318359375, -0.0354461669921875, -0.00251007080078125, 0.030426025390625, 0.06336212158203125, 0.0962982177734375, 0.12923431396484375, 0.16217041015625, 0.19510650634765625, 0.2280426025390625, 0.26097869873046875, 0.293914794921875, 0.32685089111328125, 0.3597869873046875, 0.39272308349609375, 0.4256591796875, 0.45859527587890625, 0.4915313720703125, 0.5244674682617188, 0.557403564453125, 0.5903396606445312, 0.6232757568359375, 0.6562118530273438, 0.68914794921875, 0.7220840454101562, 0.7550201416015625, 0.7879562377929688, 0.820892333984375, 0.8538284301757812, 0.8867645263671875, 0.9197006225585938, 0.95263671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 22.0, 14.0, 23.0, 28.0, 60.0, 125.0, 324.0, 979.0, 4664.0, 38956.0, 947680.0, 48448.0, 5403.0, 1191.0, 344.0, 113.0, 60.0, 35.0, 20.0, 15.0, 9.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43497467041015625, -0.4207305908203125, -0.40648651123046875, -0.392242431640625, -0.37799835205078125, -0.3637542724609375, -0.34951019287109375, -0.33526611328125, -0.32102203369140625, -0.3067779541015625, -0.29253387451171875, -0.278289794921875, -0.26404571533203125, -0.2498016357421875, -0.23555755615234375, -0.2213134765625, -0.20706939697265625, -0.1928253173828125, -0.17858123779296875, -0.164337158203125, -0.15009307861328125, -0.1358489990234375, -0.12160491943359375, -0.10736083984375, -0.09311676025390625, -0.0788726806640625, -0.06462860107421875, -0.050384521484375, -0.03614044189453125, -0.0218963623046875, -0.00765228271484375, 0.006591796875, 0.02083587646484375, 0.0350799560546875, 0.04932403564453125, 0.063568115234375, 0.07781219482421875, 0.0920562744140625, 0.10630035400390625, 0.12054443359375, 0.13478851318359375, 0.1490325927734375, 0.16327667236328125, 0.177520751953125, 0.19176483154296875, 0.2060089111328125, 0.22025299072265625, 0.2344970703125, 0.24874114990234375, 0.2629852294921875, 0.27722930908203125, 0.291473388671875, 0.30571746826171875, 0.3199615478515625, 0.33420562744140625, 0.34844970703125, 0.36269378662109375, 0.3769378662109375, 0.39118194580078125, 0.405426025390625, 0.41967010498046875, 0.4339141845703125, 0.44815826416015625, 0.46240234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 10.0, 19.0, 26.0, 25.0, 32.0, 86.0, 173.0, 266.0, 123.0, 65.0, 45.0, 21.0, 22.0, 11.0, 7.0, 7.0, 4.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.855675458908081e-05, -3.723800182342529e-05, -3.5919249057769775e-05, -3.460049629211426e-05, -3.328174352645874e-05, -3.196299076080322e-05, -3.0644237995147705e-05, -2.9325485229492188e-05, -2.800673246383667e-05, -2.6687979698181152e-05, -2.5369226932525635e-05, -2.4050474166870117e-05, -2.27317214012146e-05, -2.1412968635559082e-05, -2.0094215869903564e-05, -1.8775463104248047e-05, -1.745671033859253e-05, -1.6137957572937012e-05, -1.4819204807281494e-05, -1.3500452041625977e-05, -1.2181699275970459e-05, -1.0862946510314941e-05, -9.544193744659424e-06, -8.225440979003906e-06, -6.906688213348389e-06, -5.587935447692871e-06, -4.2691826820373535e-06, -2.950429916381836e-06, -1.6316771507263184e-06, -3.129243850708008e-07, 1.0058283805847168e-06, 2.3245811462402344e-06, 3.643333911895752e-06, 4.9620866775512695e-06, 6.280839443206787e-06, 7.599592208862305e-06, 8.918344974517822e-06, 1.023709774017334e-05, 1.1555850505828857e-05, 1.2874603271484375e-05, 1.4193356037139893e-05, 1.551210880279541e-05, 1.6830861568450928e-05, 1.8149614334106445e-05, 1.9468367099761963e-05, 2.078711986541748e-05, 2.2105872631072998e-05, 2.3424625396728516e-05, 2.4743378162384033e-05, 2.606213092803955e-05, 2.738088369369507e-05, 2.8699636459350586e-05, 3.0018389225006104e-05, 3.133714199066162e-05, 3.265589475631714e-05, 3.3974647521972656e-05, 3.5293400287628174e-05, 3.661215305328369e-05, 3.793090581893921e-05, 3.9249658584594727e-05, 4.0568411350250244e-05, 4.188716411590576e-05, 4.320591688156128e-05, 4.45246696472168e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 9.0, 9.0, 20.0, 15.0, 34.0, 66.0, 126.0, 209.0, 333.0, 764.0, 1625.0, 3873.0, 12032.0, 59014.0, 825269.0, 117966.0, 18042.0, 5222.0, 2013.0, 946.0, 436.0, 219.0, 118.0, 66.0, 42.0, 22.0, 15.0, 15.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19244766235351562, -0.18494415283203125, -0.17744064331054688, -0.1699371337890625, -0.16243362426757812, -0.15493011474609375, -0.14742660522460938, -0.139923095703125, -0.13241958618164062, -0.12491607666015625, -0.11741256713867188, -0.1099090576171875, -0.10240554809570312, -0.09490203857421875, -0.08739852905273438, -0.07989501953125, -0.07239151000976562, -0.06488800048828125, -0.057384490966796875, -0.0498809814453125, -0.042377471923828125, -0.03487396240234375, -0.027370452880859375, -0.019866943359375, -0.012363433837890625, -0.00485992431640625, 0.002643585205078125, 0.0101470947265625, 0.017650604248046875, 0.02515411376953125, 0.032657623291015625, 0.0401611328125, 0.047664642333984375, 0.05516815185546875, 0.06267166137695312, 0.0701751708984375, 0.07767868041992188, 0.08518218994140625, 0.09268569946289062, 0.100189208984375, 0.10769271850585938, 0.11519622802734375, 0.12269973754882812, 0.1302032470703125, 0.13770675659179688, 0.14521026611328125, 0.15271377563476562, 0.16021728515625, 0.16772079467773438, 0.17522430419921875, 0.18272781372070312, 0.1902313232421875, 0.19773483276367188, 0.20523834228515625, 0.21274185180664062, 0.220245361328125, 0.22774887084960938, 0.23525238037109375, 0.24275588989257812, 0.2502593994140625, 0.2577629089355469, 0.26526641845703125, 0.2727699279785156, 0.2802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 8.0, 12.0, 9.0, 15.0, 19.0, 15.0, 30.0, 49.0, 59.0, 78.0, 207.0, 192.0, 90.0, 62.0, 42.0, 23.0, 21.0, 16.0, 14.0, 11.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1019287109375, -0.09931182861328125, -0.0966949462890625, -0.09407806396484375, -0.091461181640625, -0.08884429931640625, -0.0862274169921875, -0.08361053466796875, -0.08099365234375, -0.07837677001953125, -0.0757598876953125, -0.07314300537109375, -0.070526123046875, -0.06790924072265625, -0.0652923583984375, -0.06267547607421875, -0.06005859375, -0.05744171142578125, -0.0548248291015625, -0.05220794677734375, -0.049591064453125, -0.04697418212890625, -0.0443572998046875, -0.04174041748046875, -0.03912353515625, -0.03650665283203125, -0.0338897705078125, -0.03127288818359375, -0.028656005859375, -0.02603912353515625, -0.0234222412109375, -0.02080535888671875, -0.0181884765625, -0.01557159423828125, -0.0129547119140625, -0.01033782958984375, -0.007720947265625, -0.00510406494140625, -0.0024871826171875, 0.00012969970703125, 0.00274658203125, 0.00536346435546875, 0.0079803466796875, 0.01059722900390625, 0.013214111328125, 0.01583099365234375, 0.0184478759765625, 0.02106475830078125, 0.023681640625, 0.02629852294921875, 0.0289154052734375, 0.03153228759765625, 0.034149169921875, 0.03676605224609375, 0.0393829345703125, 0.04199981689453125, 0.04461669921875, 0.04723358154296875, 0.0498504638671875, 0.05246734619140625, 0.055084228515625, 0.05770111083984375, 0.0603179931640625, 0.06293487548828125, 0.0655517578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 14.0, 22.0, 40.0, 102.0, 151.0, 212.0, 200.0, 119.0, 63.0, 26.0, 21.0, 7.0, 10.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0143203735351562, -1.917041540145874, -1.8197627067565918, -1.7224838733673096, -1.625205159187317, -1.5279263257980347, -1.4306474924087524, -1.3333687782287598, -1.2360899448394775, -1.1388111114501953, -1.041532278060913, -0.9442535042762756, -0.8469747304916382, -0.749695897102356, -0.6524170637130737, -0.5551382899284363, -0.4578593969345093, -0.36058059334754944, -0.2633017897605896, -0.16602295637130737, -0.06874415278434753, 0.028534650802612305, 0.12581348419189453, 0.22309225797653198, 0.3203710913658142, 0.41764989495277405, 0.5149286985397339, 0.6122075319290161, 0.7094863653182983, 0.8067651391029358, 0.904043972492218, 1.0013227462768555, 1.0986015796661377, 1.19588041305542, 1.2931592464447021, 1.3904380798339844, 1.487716794013977, 1.5849956274032593, 1.6822744607925415, 1.7795531749725342, 1.8768320083618164, 1.9741108417510986, 2.071389675140381, 2.168668508529663, 2.2659473419189453, 2.3632259368896484, 2.4605050086975098, 2.557783603668213, 2.655062675476074, 2.7523415088653564, 2.8496203422546387, 2.946899175643921, 3.044178009033203, 3.1414566040039062, 3.2387356758117676, 3.3360142707824707, 3.433293104171753, 3.530571937561035, 3.6278507709503174, 3.7251296043395996, 3.822408437728882, 3.919687271118164, 4.016965866088867, 4.1142449378967285, 4.211523532867432]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 12.0, 17.0, 25.0, 20.0, 28.0, 35.0, 32.0, 41.0, 36.0, 36.0, 50.0, 48.0, 49.0, 40.0, 44.0, 52.0, 38.0, 28.0, 34.0, 29.0, 29.0, 31.0, 27.0, 21.0, 25.0, 24.0, 14.0, 15.0, 10.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4211187362670898, -1.374914526939392, -1.3287103176116943, -1.2825061082839966, -1.2363018989562988, -1.1900975704193115, -1.1438934803009033, -1.097689151763916, -1.0514849424362183, -1.0052807331085205, -0.9590765237808228, -0.912872314453125, -0.8666680455207825, -0.8204638361930847, -0.774259626865387, -0.7280553579330444, -0.6818512082099915, -0.6356469988822937, -0.589442789554596, -0.5432385206222534, -0.49703431129455566, -0.4508301019668579, -0.40462589263916016, -0.35842165350914, -0.31221744418144226, -0.2660132348537445, -0.21980899572372437, -0.1736047863960266, -0.12740056216716766, -0.08119633793830872, -0.03499212861061096, 0.01121211051940918, 0.057416319847106934, 0.10362054407596588, 0.14982476830482483, 0.19602897763252258, 0.24223320186138153, 0.2884374260902405, 0.33464163541793823, 0.3808458745479584, 0.42705008387565613, 0.4732542932033539, 0.519458532333374, 0.5656627416610718, 0.6118669509887695, 0.6580711603164673, 0.704275369644165, 0.7504796385765076, 0.7966838479042053, 0.8428880572319031, 0.8890922665596008, 0.9352965354919434, 0.9815007448196411, 1.0277049541473389, 1.0739091634750366, 1.1201133728027344, 1.1663175821304321, 1.2125217914581299, 1.2587260007858276, 1.3049302101135254, 1.3511344194412231, 1.397338628768921, 1.4435429573059082, 1.489747166633606, 1.5359513759613037]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 10.0, 14.0, 20.0, 16.0, 43.0, 41.0, 84.0, 107.0, 176.0, 269.0, 505.0, 832.0, 1548.0, 3307.0, 8509.0, 65841.0, 2569555.0, 1487336.0, 42401.0, 7347.0, 2958.0, 1426.0, 778.0, 410.0, 291.0, 152.0, 92.0, 72.0, 42.0, 26.0, 14.0, 20.0, 6.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8720703125, -1.8115234375, -1.7509765625, -1.6904296875, -1.6298828125, -1.5693359375, -1.5087890625, -1.4482421875, -1.3876953125, -1.3271484375, -1.2666015625, -1.2060546875, -1.1455078125, -1.0849609375, -1.0244140625, -0.9638671875, -0.9033203125, -0.8427734375, -0.7822265625, -0.7216796875, -0.6611328125, -0.6005859375, -0.5400390625, -0.4794921875, -0.4189453125, -0.3583984375, -0.2978515625, -0.2373046875, -0.1767578125, -0.1162109375, -0.0556640625, 0.0048828125, 0.0654296875, 0.1259765625, 0.1865234375, 0.2470703125, 0.3076171875, 0.3681640625, 0.4287109375, 0.4892578125, 0.5498046875, 0.6103515625, 0.6708984375, 0.7314453125, 0.7919921875, 0.8525390625, 0.9130859375, 0.9736328125, 1.0341796875, 1.0947265625, 1.1552734375, 1.2158203125, 1.2763671875, 1.3369140625, 1.3974609375, 1.4580078125, 1.5185546875, 1.5791015625, 1.6396484375, 1.7001953125, 1.7607421875, 1.8212890625, 1.8818359375, 1.9423828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 12.0, 8.0, 13.0, 26.0, 19.0, 19.0, 44.0, 29.0, 35.0, 39.0, 39.0, 74.0, 43.0, 48.0, 52.0, 57.0, 51.0, 44.0, 49.0, 38.0, 29.0, 32.0, 24.0, 22.0, 15.0, 13.0, 12.0, 9.0, 12.0, 8.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7042236328125, -0.683349609375, -0.6624755859375, -0.6416015625, -0.6207275390625, -0.599853515625, -0.5789794921875, -0.55810546875, -0.5372314453125, -0.516357421875, -0.4954833984375, -0.474609375, -0.4537353515625, -0.432861328125, -0.4119873046875, -0.39111328125, -0.3702392578125, -0.349365234375, -0.3284912109375, -0.3076171875, -0.2867431640625, -0.265869140625, -0.2449951171875, -0.22412109375, -0.2032470703125, -0.182373046875, -0.1614990234375, -0.140625, -0.1197509765625, -0.098876953125, -0.0780029296875, -0.05712890625, -0.0362548828125, -0.015380859375, 0.0054931640625, 0.0263671875, 0.0472412109375, 0.068115234375, 0.0889892578125, 0.10986328125, 0.1307373046875, 0.151611328125, 0.1724853515625, 0.193359375, 0.2142333984375, 0.235107421875, 0.2559814453125, 0.27685546875, 0.2977294921875, 0.318603515625, 0.3394775390625, 0.3603515625, 0.3812255859375, 0.402099609375, 0.4229736328125, 0.44384765625, 0.4647216796875, 0.485595703125, 0.5064697265625, 0.52734375, 0.5482177734375, 0.569091796875, 0.5899658203125, 0.61083984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 15.0, 34.0, 61.0, 113.0, 253.0, 679.0, 2177.0, 9724.0, 99850.0, 3986075.0, 83403.0, 8761.0, 1931.0, 603.0, 291.0, 109.0, 69.0, 34.0, 24.0, 16.0, 11.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7516632080078125, -1.680084228515625, -1.6085052490234375, -1.53692626953125, -1.4653472900390625, -1.393768310546875, -1.3221893310546875, -1.2506103515625, -1.1790313720703125, -1.107452392578125, -1.0358734130859375, -0.96429443359375, -0.8927154541015625, -0.821136474609375, -0.7495574951171875, -0.677978515625, -0.6063995361328125, -0.534820556640625, -0.4632415771484375, -0.39166259765625, -0.3200836181640625, -0.248504638671875, -0.1769256591796875, -0.1053466796875, -0.0337677001953125, 0.037811279296875, 0.1093902587890625, 0.18096923828125, 0.2525482177734375, 0.324127197265625, 0.3957061767578125, 0.46728515625, 0.5388641357421875, 0.610443115234375, 0.6820220947265625, 0.75360107421875, 0.8251800537109375, 0.896759033203125, 0.9683380126953125, 1.0399169921875, 1.1114959716796875, 1.183074951171875, 1.2546539306640625, 1.32623291015625, 1.3978118896484375, 1.469390869140625, 1.5409698486328125, 1.612548828125, 1.6841278076171875, 1.755706787109375, 1.8272857666015625, 1.89886474609375, 1.9704437255859375, 2.042022705078125, 2.1136016845703125, 2.1851806640625, 2.2567596435546875, 2.328338623046875, 2.3999176025390625, 2.47149658203125, 2.5430755615234375, 2.614654541015625, 2.6862335205078125, 2.7578125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 8.0, 6.0, 16.0, 15.0, 11.0, 24.0, 25.0, 23.0, 46.0, 56.0, 96.0, 146.0, 316.0, 605.0, 812.0, 762.0, 433.0, 247.0, 132.0, 79.0, 47.0, 32.0, 20.0, 20.0, 17.0, 15.0, 7.0, 10.0, 8.0, 8.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2747764587402344, -0.26488494873046875, -0.2549934387207031, -0.2451019287109375, -0.23521041870117188, -0.22531890869140625, -0.21542739868164062, -0.205535888671875, -0.19564437866210938, -0.18575286865234375, -0.17586135864257812, -0.1659698486328125, -0.15607833862304688, -0.14618682861328125, -0.13629531860351562, -0.12640380859375, -0.11651229858398438, -0.10662078857421875, -0.09672927856445312, -0.0868377685546875, -0.07694625854492188, -0.06705474853515625, -0.057163238525390625, -0.047271728515625, -0.037380218505859375, -0.02748870849609375, -0.017597198486328125, -0.0077056884765625, 0.002185821533203125, 0.01207733154296875, 0.021968841552734375, 0.0318603515625, 0.041751861572265625, 0.05164337158203125, 0.061534881591796875, 0.0714263916015625, 0.08131790161132812, 0.09120941162109375, 0.10110092163085938, 0.110992431640625, 0.12088394165039062, 0.13077545166015625, 0.14066696166992188, 0.1505584716796875, 0.16044998168945312, 0.17034149169921875, 0.18023300170898438, 0.19012451171875, 0.20001602172851562, 0.20990753173828125, 0.21979904174804688, 0.2296905517578125, 0.23958206176757812, 0.24947357177734375, 0.2593650817871094, 0.269256591796875, 0.2791481018066406, 0.28903961181640625, 0.2989311218261719, 0.3088226318359375, 0.3187141418457031, 0.32860565185546875, 0.3384971618652344, 0.348388671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 12.0, 10.0, 17.0, 29.0, 40.0, 55.0, 70.0, 79.0, 130.0, 115.0, 117.0, 89.0, 52.0, 58.0, 33.0, 17.0, 11.0, 14.0, 11.0, 6.0, 6.0, 2.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5149469375610352, -1.4754689931869507, -1.4359909296035767, -1.3965129852294922, -1.3570350408554077, -1.3175570964813232, -1.2780790328979492, -1.2386010885238647, -1.1991231441497803, -1.1596451997756958, -1.1201671361923218, -1.0806891918182373, -1.0412112474441528, -1.0017333030700684, -0.9622552394866943, -0.9227772951126099, -0.8832992315292358, -0.8438212275505066, -0.8043432831764221, -0.7648652791976929, -0.7253873348236084, -0.6859093308448792, -0.6464313268661499, -0.6069533824920654, -0.5674753785133362, -0.5279973745346069, -0.48851943016052246, -0.4490414261817932, -0.40956345200538635, -0.3700854778289795, -0.33060747385025024, -0.2911294996738434, -0.2516516447067261, -0.2121736705303192, -0.17269568145275116, -0.1332176923751831, -0.09373971819877625, -0.054261744022369385, -0.01478375494480133, 0.024694234132766724, 0.06417220830917358, 0.10365018993616104, 0.1431281715631485, 0.18260616064071655, 0.2220841348171234, 0.2615621089935303, 0.3010401129722595, 0.3405180871486664, 0.37999606132507324, 0.4194740355014801, 0.45895200967788696, 0.4984300136566162, 0.5379079580307007, 0.5773859620094299, 0.6168639659881592, 0.6563419103622437, 0.6958199143409729, 0.7352979183197021, 0.7747758626937866, 0.8142538666725159, 0.8537318706512451, 0.8932098150253296, 0.9326878190040588, 0.9721658229827881, 1.0116437673568726]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 11.0, 11.0, 8.0, 12.0, 12.0, 13.0, 22.0, 31.0, 29.0, 25.0, 34.0, 30.0, 30.0, 33.0, 33.0, 31.0, 52.0, 52.0, 38.0, 31.0, 38.0, 40.0, 37.0, 33.0, 30.0, 38.0, 20.0, 27.0, 28.0, 21.0, 20.0, 22.0, 14.0, 10.0, 15.0, 11.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.6883559226989746, -0.668379008769989, -0.6484020948410034, -0.628425121307373, -0.6084482073783875, -0.5884712934494019, -0.5684943795204163, -0.5485174655914307, -0.5285404920578003, -0.5085635781288147, -0.4885866343975067, -0.4686097204685211, -0.44863277673721313, -0.42865586280822754, -0.40867894887924194, -0.38870200514793396, -0.36872509121894836, -0.34874817728996277, -0.3287712335586548, -0.3087943196296692, -0.2888173758983612, -0.2688404619693756, -0.24886353313922882, -0.22888660430908203, -0.20890967547893524, -0.18893274664878845, -0.16895581781864166, -0.14897888898849487, -0.12900197505950928, -0.10902503877878189, -0.0890481173992157, -0.06907118856906891, -0.04909425973892212, -0.02911733277142048, -0.009140405803918839, 0.010836519300937653, 0.030813448131084442, 0.05079037696123123, 0.07076729834079742, 0.09074422717094421, 0.110721156001091, 0.1306980848312378, 0.15067501366138458, 0.17065194249153137, 0.19062885642051697, 0.21060580015182495, 0.23058271408081055, 0.25055962800979614, 0.2705365717411041, 0.2905134856700897, 0.3104904294013977, 0.3304673433303833, 0.3504442870616913, 0.3704212009906769, 0.39039814472198486, 0.41037505865097046, 0.43035197257995605, 0.45032888650894165, 0.47030583024024963, 0.49028274416923523, 0.5102596879005432, 0.5302366018295288, 0.5502135157585144, 0.5701904296875, 0.5901674032211304]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 18.0, 28.0, 42.0, 56.0, 71.0, 137.0, 160.0, 234.0, 359.0, 465.0, 666.0, 1043.0, 1496.0, 2331.0, 3532.0, 5937.0, 11323.0, 24439.0, 74964.0, 492179.0, 327085.0, 56592.0, 20477.0, 9710.0, 5555.0, 3192.0, 2041.0, 1346.0, 945.0, 607.0, 432.0, 317.0, 232.0, 153.0, 102.0, 86.0, 57.0, 27.0, 22.0, 25.0, 14.0, 10.0, 6.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3249320983886719, -0.31441497802734375, -0.3038978576660156, -0.2933807373046875, -0.2828636169433594, -0.27234649658203125, -0.2618293762207031, -0.251312255859375, -0.24079513549804688, -0.23027801513671875, -0.21976089477539062, -0.2092437744140625, -0.19872665405273438, -0.18820953369140625, -0.17769241333007812, -0.16717529296875, -0.15665817260742188, -0.14614105224609375, -0.13562393188476562, -0.1251068115234375, -0.11458969116210938, -0.10407257080078125, -0.09355545043945312, -0.083038330078125, -0.07252120971679688, -0.06200408935546875, -0.051486968994140625, -0.0409698486328125, -0.030452728271484375, -0.01993560791015625, -0.009418487548828125, 0.0010986328125, 0.011615753173828125, 0.02213287353515625, 0.032649993896484375, 0.0431671142578125, 0.053684234619140625, 0.06420135498046875, 0.07471847534179688, 0.085235595703125, 0.09575271606445312, 0.10626983642578125, 0.11678695678710938, 0.1273040771484375, 0.13782119750976562, 0.14833831787109375, 0.15885543823242188, 0.16937255859375, 0.17988967895507812, 0.19040679931640625, 0.20092391967773438, 0.2114410400390625, 0.22195816040039062, 0.23247528076171875, 0.24299240112304688, 0.253509521484375, 0.2640266418457031, 0.27454376220703125, 0.2850608825683594, 0.2955780029296875, 0.3060951232910156, 0.31661224365234375, 0.3271293640136719, 0.337646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 10.0, 12.0, 14.0, 15.0, 19.0, 21.0, 30.0, 26.0, 28.0, 30.0, 34.0, 33.0, 36.0, 55.0, 53.0, 46.0, 52.0, 35.0, 48.0, 38.0, 43.0, 34.0, 39.0, 25.0, 24.0, 22.0, 22.0, 19.0, 18.0, 14.0, 11.0, 16.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0], "bins": [-0.4453125, -0.4327545166015625, -0.420196533203125, -0.4076385498046875, -0.39508056640625, -0.3825225830078125, -0.369964599609375, -0.3574066162109375, -0.3448486328125, -0.3322906494140625, -0.319732666015625, -0.3071746826171875, -0.29461669921875, -0.2820587158203125, -0.269500732421875, -0.2569427490234375, -0.244384765625, -0.2318267822265625, -0.219268798828125, -0.2067108154296875, -0.19415283203125, -0.1815948486328125, -0.169036865234375, -0.1564788818359375, -0.1439208984375, -0.1313629150390625, -0.118804931640625, -0.1062469482421875, -0.09368896484375, -0.0811309814453125, -0.068572998046875, -0.0560150146484375, -0.04345703125, -0.0308990478515625, -0.018341064453125, -0.0057830810546875, 0.00677490234375, 0.0193328857421875, 0.031890869140625, 0.0444488525390625, 0.0570068359375, 0.0695648193359375, 0.082122802734375, 0.0946807861328125, 0.10723876953125, 0.1197967529296875, 0.132354736328125, 0.1449127197265625, 0.157470703125, 0.1700286865234375, 0.182586669921875, 0.1951446533203125, 0.20770263671875, 0.2202606201171875, 0.232818603515625, 0.2453765869140625, 0.2579345703125, 0.2704925537109375, 0.283050537109375, 0.2956085205078125, 0.30816650390625, 0.3207244873046875, 0.333282470703125, 0.3458404541015625, 0.3583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 10.0, 25.0, 41.0, 50.0, 75.0, 112.0, 158.0, 266.0, 406.0, 605.0, 988.0, 1705.0, 2829.0, 5359.0, 10956.0, 26807.0, 80269.0, 318594.0, 424137.0, 112183.0, 34563.0, 13669.0, 6372.0, 3363.0, 1893.0, 1072.0, 692.0, 459.0, 320.0, 172.0, 115.0, 87.0, 56.0, 37.0, 35.0, 25.0, 14.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18313026428222656, -0.17705154418945312, -0.1709728240966797, -0.16489410400390625, -0.1588153839111328, -0.15273666381835938, -0.14665794372558594, -0.1405792236328125, -0.13450050354003906, -0.12842178344726562, -0.12234306335449219, -0.11626434326171875, -0.11018562316894531, -0.10410690307617188, -0.09802818298339844, -0.091949462890625, -0.08587074279785156, -0.07979202270507812, -0.07371330261230469, -0.06763458251953125, -0.06155586242675781, -0.055477142333984375, -0.04939842224121094, -0.0433197021484375, -0.03724098205566406, -0.031162261962890625, -0.025083541870117188, -0.01900482177734375, -0.012926101684570312, -0.006847381591796875, -0.0007686614990234375, 0.00531005859375, 0.011388778686523438, 0.017467498779296875, 0.023546218872070312, 0.02962493896484375, 0.03570365905761719, 0.041782379150390625, 0.04786109924316406, 0.0539398193359375, 0.06001853942871094, 0.06609725952148438, 0.07217597961425781, 0.07825469970703125, 0.08433341979980469, 0.09041213989257812, 0.09649085998535156, 0.102569580078125, 0.10864830017089844, 0.11472702026367188, 0.12080574035644531, 0.12688446044921875, 0.1329631805419922, 0.13904190063476562, 0.14512062072753906, 0.1511993408203125, 0.15727806091308594, 0.16335678100585938, 0.1694355010986328, 0.17551422119140625, 0.1815929412841797, 0.18767166137695312, 0.19375038146972656, 0.1998291015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 10.0, 3.0, 15.0, 13.0, 14.0, 13.0, 17.0, 17.0, 32.0, 29.0, 25.0, 31.0, 32.0, 49.0, 56.0, 32.0, 50.0, 39.0, 47.0, 46.0, 39.0, 34.0, 40.0, 42.0, 33.0, 27.0, 27.0, 34.0, 18.0, 24.0, 12.0, 17.0, 8.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.6693344116210938, -0.6477508544921875, -0.6261672973632812, -0.604583740234375, -0.5830001831054688, -0.5614166259765625, -0.5398330688476562, -0.51824951171875, -0.49666595458984375, -0.4750823974609375, -0.45349884033203125, -0.431915283203125, -0.41033172607421875, -0.3887481689453125, -0.36716461181640625, -0.3455810546875, -0.32399749755859375, -0.3024139404296875, -0.28083038330078125, -0.259246826171875, -0.23766326904296875, -0.2160797119140625, -0.19449615478515625, -0.17291259765625, -0.15132904052734375, -0.1297454833984375, -0.10816192626953125, -0.086578369140625, -0.06499481201171875, -0.0434112548828125, -0.02182769775390625, -0.000244140625, 0.02133941650390625, 0.0429229736328125, 0.06450653076171875, 0.086090087890625, 0.10767364501953125, 0.1292572021484375, 0.15084075927734375, 0.17242431640625, 0.19400787353515625, 0.2155914306640625, 0.23717498779296875, 0.258758544921875, 0.28034210205078125, 0.3019256591796875, 0.32350921630859375, 0.3450927734375, 0.36667633056640625, 0.3882598876953125, 0.40984344482421875, 0.431427001953125, 0.45301055908203125, 0.4745941162109375, 0.49617767333984375, 0.51776123046875, 0.5393447875976562, 0.5609283447265625, 0.5825119018554688, 0.604095458984375, 0.6256790161132812, 0.6472625732421875, 0.6688461303710938, 0.6904296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 42.0, 54.0, 85.0, 132.0, 225.0, 357.0, 611.0, 1193.0, 2235.0, 4614.0, 10980.0, 28990.0, 92764.0, 350725.0, 392717.0, 107487.0, 32894.0, 12104.0, 5141.0, 2388.0, 1163.0, 645.0, 356.0, 234.0, 129.0, 88.0, 44.0, 24.0, 22.0, 16.0, 10.0, 10.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0421142578125, -0.04084014892578125, -0.0395660400390625, -0.03829193115234375, -0.037017822265625, -0.03574371337890625, -0.0344696044921875, -0.03319549560546875, -0.03192138671875, -0.03064727783203125, -0.0293731689453125, -0.02809906005859375, -0.026824951171875, -0.02555084228515625, -0.0242767333984375, -0.02300262451171875, -0.021728515625, -0.02045440673828125, -0.0191802978515625, -0.01790618896484375, -0.016632080078125, -0.01535797119140625, -0.0140838623046875, -0.01280975341796875, -0.01153564453125, -0.01026153564453125, -0.0089874267578125, -0.00771331787109375, -0.006439208984375, -0.00516510009765625, -0.0038909912109375, -0.00261688232421875, -0.0013427734375, -6.866455078125e-05, 0.0012054443359375, 0.00247955322265625, 0.003753662109375, 0.00502777099609375, 0.0063018798828125, 0.00757598876953125, 0.00885009765625, 0.01012420654296875, 0.0113983154296875, 0.01267242431640625, 0.013946533203125, 0.01522064208984375, 0.0164947509765625, 0.01776885986328125, 0.01904296875, 0.02031707763671875, 0.0215911865234375, 0.02286529541015625, 0.024139404296875, 0.02541351318359375, 0.0266876220703125, 0.02796173095703125, 0.02923583984375, 0.03050994873046875, 0.0317840576171875, 0.03305816650390625, 0.034332275390625, 0.03560638427734375, 0.0368804931640625, 0.03815460205078125, 0.0394287109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 17.0, 15.0, 30.0, 45.0, 58.0, 85.0, 133.0, 141.0, 130.0, 102.0, 83.0, 42.0, 34.0, 23.0, 10.0, 17.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.964399755001068e-05, -2.85319983959198e-05, -2.741999924182892e-05, -2.6308000087738037e-05, -2.5196000933647156e-05, -2.4084001779556274e-05, -2.2972002625465393e-05, -2.1860003471374512e-05, -2.074800431728363e-05, -1.963600516319275e-05, -1.8524006009101868e-05, -1.7412006855010986e-05, -1.6300007700920105e-05, -1.5188008546829224e-05, -1.4076009392738342e-05, -1.2964010238647461e-05, -1.185201108455658e-05, -1.0740011930465698e-05, -9.628012776374817e-06, -8.516013622283936e-06, -7.404014468193054e-06, -6.292015314102173e-06, -5.1800161600112915e-06, -4.06801700592041e-06, -2.956017851829529e-06, -1.8440186977386475e-06, -7.320195436477661e-07, 3.7997961044311523e-07, 1.4919787645339966e-06, 2.603977918624878e-06, 3.7159770727157593e-06, 4.827976226806641e-06, 5.939975380897522e-06, 7.051974534988403e-06, 8.163973689079285e-06, 9.275972843170166e-06, 1.0387971997261047e-05, 1.1499971151351929e-05, 1.261197030544281e-05, 1.3723969459533691e-05, 1.4835968613624573e-05, 1.5947967767715454e-05, 1.7059966921806335e-05, 1.8171966075897217e-05, 1.9283965229988098e-05, 2.039596438407898e-05, 2.150796353816986e-05, 2.2619962692260742e-05, 2.3731961846351624e-05, 2.4843961000442505e-05, 2.5955960154533386e-05, 2.7067959308624268e-05, 2.817995846271515e-05, 2.929195761680603e-05, 3.040395677089691e-05, 3.151595592498779e-05, 3.2627955079078674e-05, 3.3739954233169556e-05, 3.485195338726044e-05, 3.596395254135132e-05, 3.70759516954422e-05, 3.818795084953308e-05, 3.929995000362396e-05, 4.0411949157714844e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 49.0, 72.0, 149.0, 340.0, 801.0, 2560.0, 10482.0, 57410.0, 487737.0, 425676.0, 50122.0, 9385.0, 2370.0, 718.0, 298.0, 133.0, 72.0, 32.0, 27.0, 9.0, 20.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08709716796875, -0.0845327377319336, -0.08196830749511719, -0.07940387725830078, -0.07683944702148438, -0.07427501678466797, -0.07171058654785156, -0.06914615631103516, -0.06658172607421875, -0.06401729583740234, -0.06145286560058594, -0.05888843536376953, -0.056324005126953125, -0.05375957489013672, -0.05119514465332031, -0.048630714416503906, -0.0460662841796875, -0.043501853942871094, -0.04093742370605469, -0.03837299346923828, -0.035808563232421875, -0.03324413299560547, -0.030679702758789062, -0.028115272521972656, -0.02555084228515625, -0.022986412048339844, -0.020421981811523438, -0.01785755157470703, -0.015293121337890625, -0.012728691101074219, -0.010164260864257812, -0.007599830627441406, -0.005035400390625, -0.0024709701538085938, 9.34600830078125e-05, 0.0026578903198242188, 0.005222320556640625, 0.007786750793457031, 0.010351181030273438, 0.012915611267089844, 0.01548004150390625, 0.018044471740722656, 0.020608901977539062, 0.02317333221435547, 0.025737762451171875, 0.02830219268798828, 0.030866622924804688, 0.033431053161621094, 0.0359954833984375, 0.038559913635253906, 0.04112434387207031, 0.04368877410888672, 0.046253204345703125, 0.04881763458251953, 0.05138206481933594, 0.053946495056152344, 0.05651092529296875, 0.059075355529785156, 0.06163978576660156, 0.06420421600341797, 0.06676864624023438, 0.06933307647705078, 0.07189750671386719, 0.0744619369506836, 0.0770263671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 8.0, 12.0, 17.0, 13.0, 18.0, 14.0, 27.0, 31.0, 33.0, 53.0, 67.0, 61.0, 72.0, 64.0, 63.0, 73.0, 57.0, 47.0, 47.0, 32.0, 31.0, 34.0, 20.0, 22.0, 13.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0129241943359375, -0.012572526931762695, -0.01222085952758789, -0.011869192123413086, -0.011517524719238281, -0.011165857315063477, -0.010814189910888672, -0.010462522506713867, -0.010110855102539062, -0.009759187698364258, -0.009407520294189453, -0.009055852890014648, -0.008704185485839844, -0.008352518081665039, -0.008000850677490234, -0.00764918327331543, -0.007297515869140625, -0.00694584846496582, -0.006594181060791016, -0.006242513656616211, -0.005890846252441406, -0.0055391788482666016, -0.005187511444091797, -0.004835844039916992, -0.0044841766357421875, -0.004132509231567383, -0.003780841827392578, -0.0034291744232177734, -0.0030775070190429688, -0.002725839614868164, -0.0023741722106933594, -0.0020225048065185547, -0.00167083740234375, -0.0013191699981689453, -0.0009675025939941406, -0.0006158351898193359, -0.00026416778564453125, 8.749961853027344e-05, 0.0004391670227050781, 0.0007908344268798828, 0.0011425018310546875, 0.0014941692352294922, 0.0018458366394042969, 0.0021975040435791016, 0.0025491714477539062, 0.002900838851928711, 0.0032525062561035156, 0.0036041736602783203, 0.003955841064453125, 0.00430750846862793, 0.004659175872802734, 0.005010843276977539, 0.005362510681152344, 0.0057141780853271484, 0.006065845489501953, 0.006417512893676758, 0.0067691802978515625, 0.007120847702026367, 0.007472515106201172, 0.007824182510375977, 0.008175849914550781, 0.008527517318725586, 0.00887918472290039, 0.009230852127075195, 0.00958251953125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 7.0, 11.0, 26.0, 25.0, 42.0, 43.0, 66.0, 89.0, 115.0, 114.0, 108.0, 92.0, 47.0, 48.0, 36.0, 31.0, 19.0, 8.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.8256650567054749, -0.8052636981010437, -0.7848622798919678, -0.7644609212875366, -0.7440595626831055, -0.7236582040786743, -0.7032567858695984, -0.6828554272651672, -0.6624540090560913, -0.6420526504516602, -0.6216512322425842, -0.6012498736381531, -0.5808485150337219, -0.560447096824646, -0.5400457382202148, -0.5196443796157837, -0.49924302101135254, -0.478841632604599, -0.45844027400016785, -0.4380388855934143, -0.41763752698898315, -0.3972361385822296, -0.3768347501754761, -0.3564333915710449, -0.3360320031642914, -0.31563061475753784, -0.2952292561531067, -0.27482786774635315, -0.2544264793395996, -0.23402512073516846, -0.21362373232841492, -0.19322235882282257, -0.17282095551490784, -0.1524195820093155, -0.13201820850372314, -0.1116168200969696, -0.09121544659137726, -0.07081407308578491, -0.05041269212961197, -0.030011311173439026, -0.00960993766784668, 0.010791439563035965, 0.03119281679391861, 0.051594194024801254, 0.0719955712556839, 0.09239694476127625, 0.11279832571744919, 0.13319970667362213, 0.15360108017921448, 0.17400245368480682, 0.19440382719039917, 0.2148052155971527, 0.23520658910274506, 0.2556079626083374, 0.27600935101509094, 0.2964107394218445, 0.31681209802627563, 0.3372134864330292, 0.3576148450374603, 0.37801623344421387, 0.398417592048645, 0.41881898045539856, 0.4392203688621521, 0.45962172746658325, 0.4800231158733368]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 12.0, 9.0, 12.0, 20.0, 17.0, 26.0, 36.0, 24.0, 25.0, 32.0, 28.0, 42.0, 32.0, 51.0, 49.0, 52.0, 45.0, 41.0, 29.0, 40.0, 37.0, 27.0, 48.0, 29.0, 24.0, 26.0, 33.0, 17.0, 15.0, 17.0, 12.0, 15.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 4.0, 4.0], "bins": [-0.43707090616226196, -0.4251249432563782, -0.4131790101528168, -0.40123307704925537, -0.3892871141433716, -0.3773411512374878, -0.3653952181339264, -0.353449285030365, -0.3415033221244812, -0.3295573592185974, -0.317611426115036, -0.3056654930114746, -0.2937195301055908, -0.28177356719970703, -0.26982763409614563, -0.25788170099258423, -0.24593573808670044, -0.23398979008197784, -0.22204384207725525, -0.21009789407253265, -0.19815194606781006, -0.18620599806308746, -0.17426005005836487, -0.16231410205364227, -0.15036815404891968, -0.13842220604419708, -0.1264762580394745, -0.11453031003475189, -0.1025843620300293, -0.0906384140253067, -0.0786924660205841, -0.06674651801586151, -0.054800570011138916, -0.04285462200641632, -0.030908674001693726, -0.01896272599697113, -0.007016777992248535, 0.00492917001247406, 0.016875118017196655, 0.02882106602191925, 0.040767014026641846, 0.05271296203136444, 0.06465891003608704, 0.07660485804080963, 0.08855080604553223, 0.10049675405025482, 0.11244270205497742, 0.12438865005970001, 0.1363345980644226, 0.1482805460691452, 0.1602264940738678, 0.1721724420785904, 0.184118390083313, 0.19606433808803558, 0.20801028609275818, 0.21995623409748077, 0.23190218210220337, 0.24384813010692596, 0.25579407811164856, 0.26774001121520996, 0.27968597412109375, 0.29163193702697754, 0.30357787013053894, 0.31552380323410034, 0.32746976613998413]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 8.0, 10.0, 14.0, 18.0, 38.0, 56.0, 77.0, 97.0, 123.0, 206.0, 342.0, 471.0, 734.0, 1180.0, 1848.0, 3102.0, 5420.0, 10728.0, 32728.0, 269941.0, 625557.0, 63409.0, 15432.0, 7000.0, 3819.0, 2255.0, 1367.0, 885.0, 551.0, 397.0, 240.0, 151.0, 90.0, 70.0, 58.0, 43.0, 29.0, 24.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.484619140625, -0.4700202941894531, -0.45542144775390625, -0.4408226013183594, -0.4262237548828125, -0.4116249084472656, -0.39702606201171875, -0.3824272155761719, -0.367828369140625, -0.3532295227050781, -0.33863067626953125, -0.3240318298339844, -0.3094329833984375, -0.2948341369628906, -0.28023529052734375, -0.2656364440917969, -0.25103759765625, -0.23643875122070312, -0.22183990478515625, -0.20724105834960938, -0.1926422119140625, -0.17804336547851562, -0.16344451904296875, -0.14884567260742188, -0.134246826171875, -0.11964797973632812, -0.10504913330078125, -0.09045028686523438, -0.0758514404296875, -0.061252593994140625, -0.04665374755859375, -0.032054901123046875, -0.0174560546875, -0.002857208251953125, 0.01174163818359375, 0.026340484619140625, 0.0409393310546875, 0.055538177490234375, 0.07013702392578125, 0.08473587036132812, 0.099334716796875, 0.11393356323242188, 0.12853240966796875, 0.14313125610351562, 0.1577301025390625, 0.17232894897460938, 0.18692779541015625, 0.20152664184570312, 0.21612548828125, 0.23072433471679688, 0.24532318115234375, 0.2599220275878906, 0.2745208740234375, 0.2891197204589844, 0.30371856689453125, 0.3183174133300781, 0.332916259765625, 0.3475151062011719, 0.36211395263671875, 0.3767127990722656, 0.3913116455078125, 0.4059104919433594, 0.42050933837890625, 0.4351081848144531, 0.44970703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 7.0, 9.0, 9.0, 14.0, 17.0, 27.0, 17.0, 25.0, 26.0, 33.0, 22.0, 38.0, 44.0, 47.0, 50.0, 47.0, 59.0, 52.0, 47.0, 30.0, 40.0, 47.0, 32.0, 28.0, 25.0, 33.0, 27.0, 19.0, 16.0, 19.0, 17.0, 9.0, 7.0, 11.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.00390625, -0.9770126342773438, -0.9501190185546875, -0.9232254028320312, -0.896331787109375, -0.8694381713867188, -0.8425445556640625, -0.8156509399414062, -0.78875732421875, -0.7618637084960938, -0.7349700927734375, -0.7080764770507812, -0.681182861328125, -0.6542892456054688, -0.6273956298828125, -0.6005020141601562, -0.5736083984375, -0.5467147827148438, -0.5198211669921875, -0.49292755126953125, -0.466033935546875, -0.43914031982421875, -0.4122467041015625, -0.38535308837890625, -0.35845947265625, -0.33156585693359375, -0.3046722412109375, -0.27777862548828125, -0.250885009765625, -0.22399139404296875, -0.1970977783203125, -0.17020416259765625, -0.143310546875, -0.11641693115234375, -0.0895233154296875, -0.06262969970703125, -0.035736083984375, -0.00884246826171875, 0.0180511474609375, 0.04494476318359375, 0.07183837890625, 0.09873199462890625, 0.1256256103515625, 0.15251922607421875, 0.179412841796875, 0.20630645751953125, 0.2332000732421875, 0.26009368896484375, 0.2869873046875, 0.31388092041015625, 0.3407745361328125, 0.36766815185546875, 0.394561767578125, 0.42145538330078125, 0.4483489990234375, 0.47524261474609375, 0.50213623046875, 0.5290298461914062, 0.5559234619140625, 0.5828170776367188, 0.609710693359375, 0.6366043090820312, 0.6634979248046875, 0.6903915405273438, 0.71728515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 3.0, 4.0, 7.0, 2.0, 5.0, 6.0, 12.0, 14.0, 5.0, 23.0, 17.0, 23.0, 17.0, 14.0, 28.0, 28.0, 39.0, 35.0, 45.0, 64.0, 136.0, 700.0, 38981.0, 1005200.0, 2556.0, 184.0, 63.0, 56.0, 36.0, 29.0, 33.0, 24.0, 22.0, 21.0, 17.0, 19.0, 8.0, 7.0, 13.0, 5.0, 9.0, 13.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.337921142578125, -2.25787353515625, -2.177825927734375, -2.0977783203125, -2.017730712890625, -1.93768310546875, -1.857635498046875, -1.777587890625, -1.697540283203125, -1.61749267578125, -1.537445068359375, -1.4573974609375, -1.377349853515625, -1.29730224609375, -1.217254638671875, -1.13720703125, -1.057159423828125, -0.97711181640625, -0.897064208984375, -0.8170166015625, -0.736968994140625, -0.65692138671875, -0.576873779296875, -0.496826171875, -0.416778564453125, -0.33673095703125, -0.256683349609375, -0.1766357421875, -0.096588134765625, -0.01654052734375, 0.063507080078125, 0.1435546875, 0.223602294921875, 0.30364990234375, 0.383697509765625, 0.4637451171875, 0.543792724609375, 0.62384033203125, 0.703887939453125, 0.783935546875, 0.863983154296875, 0.94403076171875, 1.024078369140625, 1.1041259765625, 1.184173583984375, 1.26422119140625, 1.344268798828125, 1.42431640625, 1.504364013671875, 1.58441162109375, 1.664459228515625, 1.7445068359375, 1.824554443359375, 1.90460205078125, 1.984649658203125, 2.064697265625, 2.144744873046875, 2.22479248046875, 2.304840087890625, 2.3848876953125, 2.464935302734375, 2.54498291015625, 2.625030517578125, 2.705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 20.0, 21.0, 16.0, 21.0, 21.0, 26.0, 33.0, 36.0, 47.0, 35.0, 59.0, 51.0, 42.0, 45.0, 35.0, 64.0, 38.0, 38.0, 31.0, 40.0, 34.0, 23.0, 19.0, 23.0, 24.0, 13.0, 13.0, 14.0, 9.0, 6.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.72705078125, -0.70263671875, -0.67822265625, -0.65380859375, -0.62939453125, -0.60498046875, -0.58056640625, -0.55615234375, -0.53173828125, -0.50732421875, -0.48291015625, -0.45849609375, -0.43408203125, -0.40966796875, -0.38525390625, -0.36083984375, -0.33642578125, -0.31201171875, -0.28759765625, -0.26318359375, -0.23876953125, -0.21435546875, -0.18994140625, -0.16552734375, -0.14111328125, -0.11669921875, -0.09228515625, -0.06787109375, -0.04345703125, -0.01904296875, 0.00537109375, 0.02978515625, 0.05419921875, 0.07861328125, 0.10302734375, 0.12744140625, 0.15185546875, 0.17626953125, 0.20068359375, 0.22509765625, 0.24951171875, 0.27392578125, 0.29833984375, 0.32275390625, 0.34716796875, 0.37158203125, 0.39599609375, 0.42041015625, 0.44482421875, 0.46923828125, 0.49365234375, 0.51806640625, 0.54248046875, 0.56689453125, 0.59130859375, 0.61572265625, 0.64013671875, 0.66455078125, 0.68896484375, 0.71337890625, 0.73779296875, 0.76220703125, 0.78662109375, 0.81103515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 11.0, 13.0, 27.0, 37.0, 59.0, 109.0, 152.0, 295.0, 584.0, 1136.0, 2481.0, 6147.0, 22850.0, 635212.0, 350621.0, 18586.0, 5442.0, 2293.0, 1138.0, 595.0, 340.0, 171.0, 93.0, 61.0, 26.0, 25.0, 12.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271728515625, -0.26416778564453125, -0.2566070556640625, -0.24904632568359375, -0.241485595703125, -0.23392486572265625, -0.2263641357421875, -0.21880340576171875, -0.21124267578125, -0.20368194580078125, -0.1961212158203125, -0.18856048583984375, -0.180999755859375, -0.17343902587890625, -0.1658782958984375, -0.15831756591796875, -0.1507568359375, -0.14319610595703125, -0.1356353759765625, -0.12807464599609375, -0.120513916015625, -0.11295318603515625, -0.1053924560546875, -0.09783172607421875, -0.09027099609375, -0.08271026611328125, -0.0751495361328125, -0.06758880615234375, -0.060028076171875, -0.05246734619140625, -0.0449066162109375, -0.03734588623046875, -0.02978515625, -0.02222442626953125, -0.0146636962890625, -0.00710296630859375, 0.000457763671875, 0.00801849365234375, 0.0155792236328125, 0.02313995361328125, 0.03070068359375, 0.03826141357421875, 0.0458221435546875, 0.05338287353515625, 0.060943603515625, 0.06850433349609375, 0.0760650634765625, 0.08362579345703125, 0.0911865234375, 0.09874725341796875, 0.1063079833984375, 0.11386871337890625, 0.121429443359375, 0.12899017333984375, 0.1365509033203125, 0.14411163330078125, 0.15167236328125, 0.15923309326171875, 0.1667938232421875, 0.17435455322265625, 0.181915283203125, 0.18947601318359375, 0.1970367431640625, 0.20459747314453125, 0.212158203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 2.0, 8.0, 8.0, 23.0, 44.0, 154.0, 408.0, 210.0, 60.0, 31.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.277510404586792e-05, -3.091990947723389e-05, -2.9064714908599854e-05, -2.720952033996582e-05, -2.5354325771331787e-05, -2.3499131202697754e-05, -2.164393663406372e-05, -1.9788742065429688e-05, -1.7933547496795654e-05, -1.607835292816162e-05, -1.4223158359527588e-05, -1.2367963790893555e-05, -1.0512769222259521e-05, -8.657574653625488e-06, -6.802380084991455e-06, -4.947185516357422e-06, -3.0919909477233887e-06, -1.2367963790893555e-06, 6.183981895446777e-07, 2.473592758178711e-06, 4.328787326812744e-06, 6.183981895446777e-06, 8.03917646408081e-06, 9.894371032714844e-06, 1.1749565601348877e-05, 1.360476016998291e-05, 1.5459954738616943e-05, 1.7315149307250977e-05, 1.917034387588501e-05, 2.1025538444519043e-05, 2.2880733013153076e-05, 2.473592758178711e-05, 2.6591122150421143e-05, 2.8446316719055176e-05, 3.030151128768921e-05, 3.215670585632324e-05, 3.4011900424957275e-05, 3.586709499359131e-05, 3.772228956222534e-05, 3.9577484130859375e-05, 4.143267869949341e-05, 4.328787326812744e-05, 4.5143067836761475e-05, 4.699826240539551e-05, 4.885345697402954e-05, 5.0708651542663574e-05, 5.256384611129761e-05, 5.441904067993164e-05, 5.6274235248565674e-05, 5.812942981719971e-05, 5.998462438583374e-05, 6.183981895446777e-05, 6.36950135231018e-05, 6.555020809173584e-05, 6.740540266036987e-05, 6.92605972290039e-05, 7.111579179763794e-05, 7.297098636627197e-05, 7.4826180934906e-05, 7.668137550354004e-05, 7.853657007217407e-05, 8.03917646408081e-05, 8.224695920944214e-05, 8.410215377807617e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 22.0, 23.0, 43.0, 49.0, 95.0, 119.0, 213.0, 329.0, 489.0, 849.0, 1368.0, 2337.0, 4480.0, 9882.0, 32141.0, 584514.0, 365636.0, 27049.0, 8954.0, 4193.0, 2292.0, 1265.0, 824.0, 459.0, 336.0, 177.0, 122.0, 86.0, 56.0, 35.0, 30.0, 13.0, 15.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2122802734375, -0.20563507080078125, -0.1989898681640625, -0.19234466552734375, -0.185699462890625, -0.17905426025390625, -0.1724090576171875, -0.16576385498046875, -0.15911865234375, -0.15247344970703125, -0.1458282470703125, -0.13918304443359375, -0.132537841796875, -0.12589263916015625, -0.1192474365234375, -0.11260223388671875, -0.10595703125, -0.09931182861328125, -0.0926666259765625, -0.08602142333984375, -0.079376220703125, -0.07273101806640625, -0.0660858154296875, -0.05944061279296875, -0.05279541015625, -0.04615020751953125, -0.0395050048828125, -0.03285980224609375, -0.026214599609375, -0.01956939697265625, -0.0129241943359375, -0.00627899169921875, 0.0003662109375, 0.00701141357421875, 0.0136566162109375, 0.02030181884765625, 0.026947021484375, 0.03359222412109375, 0.0402374267578125, 0.04688262939453125, 0.05352783203125, 0.06017303466796875, 0.0668182373046875, 0.07346343994140625, 0.080108642578125, 0.08675384521484375, 0.0933990478515625, 0.10004425048828125, 0.106689453125, 0.11333465576171875, 0.1199798583984375, 0.12662506103515625, 0.133270263671875, 0.13991546630859375, 0.1465606689453125, 0.15320587158203125, 0.15985107421875, 0.16649627685546875, 0.1731414794921875, 0.17978668212890625, 0.186431884765625, 0.19307708740234375, 0.1997222900390625, 0.20636749267578125, 0.2130126953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 14.0, 23.0, 31.0, 50.0, 102.0, 203.0, 248.0, 120.0, 58.0, 40.0, 17.0, 17.0, 13.0, 4.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10771656036376953, -0.10447120666503906, -0.1012258529663086, -0.09798049926757812, -0.09473514556884766, -0.09148979187011719, -0.08824443817138672, -0.08499908447265625, -0.08175373077392578, -0.07850837707519531, -0.07526302337646484, -0.07201766967773438, -0.0687723159790039, -0.06552696228027344, -0.06228160858154297, -0.0590362548828125, -0.05579090118408203, -0.05254554748535156, -0.049300193786621094, -0.046054840087890625, -0.042809486389160156, -0.03956413269042969, -0.03631877899169922, -0.03307342529296875, -0.02982807159423828, -0.026582717895507812, -0.023337364196777344, -0.020092010498046875, -0.016846656799316406, -0.013601303100585938, -0.010355949401855469, -0.007110595703125, -0.0038652420043945312, -0.0006198883056640625, 0.0026254653930664062, 0.005870819091796875, 0.009116172790527344, 0.012361526489257812, 0.015606880187988281, 0.01885223388671875, 0.02209758758544922, 0.025342941284179688, 0.028588294982910156, 0.031833648681640625, 0.035079002380371094, 0.03832435607910156, 0.04156970977783203, 0.0448150634765625, 0.04806041717529297, 0.05130577087402344, 0.054551124572753906, 0.057796478271484375, 0.061041831970214844, 0.06428718566894531, 0.06753253936767578, 0.07077789306640625, 0.07402324676513672, 0.07726860046386719, 0.08051395416259766, 0.08375930786132812, 0.0870046615600586, 0.09025001525878906, 0.09349536895751953, 0.09674072265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 15.0, 13.0, 19.0, 28.0, 49.0, 54.0, 91.0, 115.0, 136.0, 113.0, 115.0, 76.0, 44.0, 31.0, 27.0, 14.0, 14.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9558732509613037, -1.9066932201385498, -1.857513189315796, -1.808333158493042, -1.759153127670288, -1.7099730968475342, -1.6607930660247803, -1.6116130352020264, -1.5624330043792725, -1.5132529735565186, -1.4640729427337646, -1.4148929119110107, -1.3657128810882568, -1.316532850265503, -1.267352819442749, -1.2181727886199951, -1.1689927577972412, -1.1198127269744873, -1.0706326961517334, -1.0214526653289795, -0.9722726345062256, -0.9230926036834717, -0.8739125728607178, -0.8247325420379639, -0.77555251121521, -0.726372480392456, -0.6771924495697021, -0.6280124187469482, -0.5788323879241943, -0.5296523571014404, -0.4804723262786865, -0.4312922954559326, -0.38211214542388916, -0.33293211460113525, -0.28375208377838135, -0.23457205295562744, -0.18539202213287354, -0.13621199131011963, -0.08703196048736572, -0.037851929664611816, 0.01132810115814209, 0.060508131980895996, 0.1096881628036499, 0.1588681936264038, 0.20804822444915771, 0.2572282552719116, 0.3064082860946655, 0.35558831691741943, 0.40476834774017334, 0.45394837856292725, 0.5031284093856812, 0.5523084402084351, 0.601488471031189, 0.6506685018539429, 0.6998485326766968, 0.7490285634994507, 0.7982085943222046, 0.8473886251449585, 0.8965686559677124, 0.9457486867904663, 0.9949287176132202, 1.0441087484359741, 1.093288779258728, 1.142468810081482, 1.1916488409042358]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 13.0, 19.0, 18.0, 23.0, 30.0, 42.0, 29.0, 37.0, 46.0, 40.0, 40.0, 45.0, 51.0, 40.0, 45.0, 43.0, 42.0, 34.0, 40.0, 47.0, 35.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 16.0, 5.0, 6.0, 9.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3416337966918945, -1.2968405485153198, -1.2520473003387451, -1.2072540521621704, -1.1624608039855957, -1.1176674365997314, -1.0728741884231567, -1.028080940246582, -0.9832876920700073, -0.9384944438934326, -0.8937011957168579, -0.8489078879356384, -0.8041146397590637, -0.759321391582489, -0.7145280838012695, -0.6697348356246948, -0.6249415874481201, -0.5801483392715454, -0.5353550910949707, -0.4905617833137512, -0.4457685351371765, -0.4009752869606018, -0.3561820089817047, -0.3113887310028076, -0.2665954828262329, -0.221802219748497, -0.1770089566707611, -0.1322156935930252, -0.0874224305152893, -0.042629167437553406, 0.002164095640182495, 0.04695737361907959, 0.09175074100494385, 0.13654400408267975, 0.18133726716041565, 0.22613053023815155, 0.27092379331588745, 0.31571704149246216, 0.36051031947135925, 0.40530359745025635, 0.45009684562683105, 0.49489009380340576, 0.5396833419799805, 0.5844766497612, 0.6292698979377747, 0.6740631461143494, 0.7188564538955688, 0.7636497020721436, 0.8084429502487183, 0.853236198425293, 0.8980294466018677, 0.9428227543830872, 0.9876160025596619, 1.0324093103408813, 1.077202558517456, 1.1219958066940308, 1.1667890548706055, 1.2115823030471802, 1.2563755512237549, 1.3011687994003296, 1.3459620475769043, 1.3907554149627686, 1.4355486631393433, 1.480341911315918, 1.5251351594924927]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 14.0, 18.0, 24.0, 41.0, 55.0, 87.0, 180.0, 338.0, 839.0, 2499.0, 10447.0, 298524.0, 3814377.0, 57758.0, 6136.0, 1687.0, 615.0, 247.0, 144.0, 75.0, 42.0, 37.0, 30.0, 15.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24407958984375, -2.1619873046875, -2.07989501953125, -1.997802734375, -1.91571044921875, -1.8336181640625, -1.75152587890625, -1.66943359375, -1.58734130859375, -1.5052490234375, -1.42315673828125, -1.341064453125, -1.25897216796875, -1.1768798828125, -1.09478759765625, -1.0126953125, -0.93060302734375, -0.8485107421875, -0.76641845703125, -0.684326171875, -0.60223388671875, -0.5201416015625, -0.43804931640625, -0.35595703125, -0.27386474609375, -0.1917724609375, -0.10968017578125, -0.027587890625, 0.05450439453125, 0.1365966796875, 0.21868896484375, 0.30078125, 0.38287353515625, 0.4649658203125, 0.54705810546875, 0.629150390625, 0.71124267578125, 0.7933349609375, 0.87542724609375, 0.95751953125, 1.03961181640625, 1.1217041015625, 1.20379638671875, 1.285888671875, 1.36798095703125, 1.4500732421875, 1.53216552734375, 1.6142578125, 1.69635009765625, 1.7784423828125, 1.86053466796875, 1.942626953125, 2.02471923828125, 2.1068115234375, 2.18890380859375, 2.27099609375, 2.35308837890625, 2.4351806640625, 2.51727294921875, 2.599365234375, 2.68145751953125, 2.7635498046875, 2.84564208984375, 2.927734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 15.0, 14.0, 19.0, 22.0, 28.0, 39.0, 35.0, 38.0, 55.0, 50.0, 58.0, 59.0, 45.0, 62.0, 51.0, 56.0, 57.0, 39.0, 38.0, 38.0, 25.0, 27.0, 25.0, 23.0, 15.0, 12.0, 5.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6843109130859375, -0.663543701171875, -0.6427764892578125, -0.62200927734375, -0.6012420654296875, -0.580474853515625, -0.5597076416015625, -0.5389404296875, -0.5181732177734375, -0.497406005859375, -0.4766387939453125, -0.45587158203125, -0.4351043701171875, -0.414337158203125, -0.3935699462890625, -0.372802734375, -0.3520355224609375, -0.331268310546875, -0.3105010986328125, -0.28973388671875, -0.2689666748046875, -0.248199462890625, -0.2274322509765625, -0.2066650390625, -0.1858978271484375, -0.165130615234375, -0.1443634033203125, -0.12359619140625, -0.1028289794921875, -0.082061767578125, -0.0612945556640625, -0.04052734375, -0.0197601318359375, 0.001007080078125, 0.0217742919921875, 0.04254150390625, 0.0633087158203125, 0.084075927734375, 0.1048431396484375, 0.1256103515625, 0.1463775634765625, 0.167144775390625, 0.1879119873046875, 0.20867919921875, 0.2294464111328125, 0.250213623046875, 0.2709808349609375, 0.291748046875, 0.3125152587890625, 0.333282470703125, 0.3540496826171875, 0.37481689453125, 0.3955841064453125, 0.416351318359375, 0.4371185302734375, 0.4578857421875, 0.4786529541015625, 0.499420166015625, 0.5201873779296875, 0.54095458984375, 0.5617218017578125, 0.582489013671875, 0.6032562255859375, 0.6240234375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 11.0, 12.0, 15.0, 9.0, 21.0, 26.0, 50.0, 72.0, 84.0, 208.0, 467.0, 1029.0, 2839.0, 9934.0, 51272.0, 2088163.0, 1974104.0, 51169.0, 9881.0, 2929.0, 1033.0, 423.0, 190.0, 110.0, 68.0, 36.0, 31.0, 18.0, 16.0, 21.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.08050537109375, -1.0389404296875, -0.99737548828125, -0.955810546875, -0.91424560546875, -0.8726806640625, -0.83111572265625, -0.78955078125, -0.74798583984375, -0.7064208984375, -0.66485595703125, -0.623291015625, -0.58172607421875, -0.5401611328125, -0.49859619140625, -0.45703125, -0.41546630859375, -0.3739013671875, -0.33233642578125, -0.290771484375, -0.24920654296875, -0.2076416015625, -0.16607666015625, -0.12451171875, -0.08294677734375, -0.0413818359375, 0.00018310546875, 0.041748046875, 0.08331298828125, 0.1248779296875, 0.16644287109375, 0.2080078125, 0.24957275390625, 0.2911376953125, 0.33270263671875, 0.374267578125, 0.41583251953125, 0.4573974609375, 0.49896240234375, 0.54052734375, 0.58209228515625, 0.6236572265625, 0.66522216796875, 0.706787109375, 0.74835205078125, 0.7899169921875, 0.83148193359375, 0.873046875, 0.91461181640625, 0.9561767578125, 0.99774169921875, 1.039306640625, 1.08087158203125, 1.1224365234375, 1.16400146484375, 1.20556640625, 1.24713134765625, 1.2886962890625, 1.33026123046875, 1.371826171875, 1.41339111328125, 1.4549560546875, 1.49652099609375, 1.5380859375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 17.0, 16.0, 23.0, 29.0, 39.0, 65.0, 99.0, 114.0, 250.0, 461.0, 723.0, 820.0, 536.0, 315.0, 182.0, 94.0, 56.0, 45.0, 31.0, 23.0, 26.0, 19.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28076171875, -0.272308349609375, -0.26385498046875, -0.255401611328125, -0.2469482421875, -0.238494873046875, -0.23004150390625, -0.221588134765625, -0.213134765625, -0.204681396484375, -0.19622802734375, -0.187774658203125, -0.1793212890625, -0.170867919921875, -0.16241455078125, -0.153961181640625, -0.1455078125, -0.137054443359375, -0.12860107421875, -0.120147705078125, -0.1116943359375, -0.103240966796875, -0.09478759765625, -0.086334228515625, -0.077880859375, -0.069427490234375, -0.06097412109375, -0.052520751953125, -0.0440673828125, -0.035614013671875, -0.02716064453125, -0.018707275390625, -0.01025390625, -0.001800537109375, 0.00665283203125, 0.015106201171875, 0.0235595703125, 0.032012939453125, 0.04046630859375, 0.048919677734375, 0.057373046875, 0.065826416015625, 0.07427978515625, 0.082733154296875, 0.0911865234375, 0.099639892578125, 0.10809326171875, 0.116546630859375, 0.125, 0.133453369140625, 0.14190673828125, 0.150360107421875, 0.1588134765625, 0.167266845703125, 0.17572021484375, 0.184173583984375, 0.192626953125, 0.201080322265625, 0.20953369140625, 0.217987060546875, 0.2264404296875, 0.234893798828125, 0.24334716796875, 0.251800537109375, 0.26025390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 12.0, 19.0, 17.0, 28.0, 33.0, 56.0, 70.0, 133.0, 164.0, 129.0, 89.0, 58.0, 56.0, 39.0, 30.0, 19.0, 7.0, 6.0, 9.0, 6.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6198253631591797, -1.5801854133605957, -1.5405454635620117, -1.5009055137634277, -1.4612655639648438, -1.4216256141662598, -1.3819856643676758, -1.3423457145690918, -1.3027057647705078, -1.2630658149719238, -1.2234258651733398, -1.1837859153747559, -1.1441459655761719, -1.104506015777588, -1.064866065979004, -1.02522611618042, -0.9855862259864807, -0.9459462761878967, -0.9063063263893127, -0.8666663765907288, -0.8270264267921448, -0.7873864769935608, -0.7477465867996216, -0.7081066370010376, -0.6684666872024536, -0.6288267374038696, -0.5891867876052856, -0.5495468378067017, -0.5099068880081177, -0.4702669382095337, -0.4306270182132721, -0.3909870684146881, -0.35134708881378174, -0.31170713901519775, -0.27206718921661377, -0.23242725431919098, -0.192787304520607, -0.153147354722023, -0.11350741982460022, -0.07386747002601624, -0.03422752022743225, 0.005412425845861435, 0.04505237191915512, 0.08469231426715851, 0.12433226406574249, 0.16397221386432648, 0.20361214876174927, 0.24325209856033325, 0.28289204835891724, 0.3225319981575012, 0.3621719479560852, 0.4018118977546692, 0.4414518475532532, 0.48109179735183716, 0.5207316875457764, 0.5603716373443604, 0.6000115871429443, 0.6396515369415283, 0.6792914867401123, 0.7189314365386963, 0.7585713863372803, 0.7982113361358643, 0.8378512859344482, 0.8774912357330322, 0.9171311855316162]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 4.0, 8.0, 12.0, 12.0, 13.0, 20.0, 19.0, 16.0, 34.0, 33.0, 43.0, 40.0, 47.0, 38.0, 45.0, 48.0, 44.0, 46.0, 43.0, 48.0, 44.0, 44.0, 49.0, 36.0, 24.0, 30.0, 31.0, 21.0, 22.0, 12.0, 17.0, 13.0, 5.0, 10.0, 9.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6572402715682983, -0.6374079585075378, -0.6175755858421326, -0.5977432727813721, -0.5779109001159668, -0.5580785870552063, -0.5382462739944458, -0.5184139013290405, -0.49858158826828003, -0.47874924540519714, -0.45891690254211426, -0.43908458948135376, -0.4192522466182709, -0.399419903755188, -0.3795875608921051, -0.3597552180290222, -0.33992287516593933, -0.32009053230285645, -0.30025818943977356, -0.2804258465766907, -0.2605935335159302, -0.2407611906528473, -0.2209288477897644, -0.2010965198278427, -0.18126417696475983, -0.16143183410167694, -0.14159950613975525, -0.12176716327667236, -0.10193482786417007, -0.08210249245166779, -0.0622701495885849, -0.04243782162666321, -0.022605478763580322, -0.002773141488432884, 0.017059195786714554, 0.03689153492450714, 0.05672387033700943, 0.07655620574951172, 0.0963885486125946, 0.1162208765745163, 0.13605321943759918, 0.15588556230068207, 0.17571789026260376, 0.19555023312568665, 0.21538257598876953, 0.23521490395069122, 0.2550472617149353, 0.2748795747756958, 0.2947119176387787, 0.3145442605018616, 0.33437660336494446, 0.35420894622802734, 0.37404125928878784, 0.3938736021518707, 0.4137059450149536, 0.4335382580757141, 0.4533706307411194, 0.47320297360420227, 0.49303531646728516, 0.5128676295280457, 0.5327000021934509, 0.5525323152542114, 0.5723646879196167, 0.5921970009803772, 0.6120293140411377]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 0.0, 4.0, 8.0, 9.0, 12.0, 22.0, 30.0, 41.0, 53.0, 114.0, 179.0, 301.0, 676.0, 1314.0, 2955.0, 7102.0, 19750.0, 65950.0, 294994.0, 489817.0, 115624.0, 30930.0, 10728.0, 4176.0, 1820.0, 888.0, 425.0, 256.0, 134.0, 75.0, 41.0, 32.0, 28.0, 15.0, 14.0, 13.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.1900634765625, -0.18521499633789062, -0.18036651611328125, -0.17551803588867188, -0.1706695556640625, -0.16582107543945312, -0.16097259521484375, -0.15612411499023438, -0.151275634765625, -0.14642715454101562, -0.14157867431640625, -0.13673019409179688, -0.1318817138671875, -0.12703323364257812, -0.12218475341796875, -0.11733627319335938, -0.11248779296875, -0.10763931274414062, -0.10279083251953125, -0.09794235229492188, -0.0930938720703125, -0.08824539184570312, -0.08339691162109375, -0.07854843139648438, -0.073699951171875, -0.06885147094726562, -0.06400299072265625, -0.059154510498046875, -0.0543060302734375, -0.049457550048828125, -0.04460906982421875, -0.039760589599609375, -0.034912109375, -0.030063629150390625, -0.02521514892578125, -0.020366668701171875, -0.0155181884765625, -0.010669708251953125, -0.00582122802734375, -0.000972747802734375, 0.003875732421875, 0.008724212646484375, 0.01357269287109375, 0.018421173095703125, 0.0232696533203125, 0.028118133544921875, 0.03296661376953125, 0.037815093994140625, 0.04266357421875, 0.047512054443359375, 0.05236053466796875, 0.057209014892578125, 0.0620574951171875, 0.06690597534179688, 0.07175445556640625, 0.07660293579101562, 0.081451416015625, 0.08629989624023438, 0.09114837646484375, 0.09599685668945312, 0.1008453369140625, 0.10569381713867188, 0.11054229736328125, 0.11539077758789062, 0.1202392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 15.0, 18.0, 18.0, 18.0, 34.0, 42.0, 42.0, 50.0, 52.0, 52.0, 58.0, 57.0, 54.0, 62.0, 50.0, 45.0, 55.0, 43.0, 29.0, 31.0, 26.0, 24.0, 17.0, 14.0, 18.0, 7.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489013671875, -0.4742240905761719, -0.45943450927734375, -0.4446449279785156, -0.4298553466796875, -0.4150657653808594, -0.40027618408203125, -0.3854866027832031, -0.370697021484375, -0.3559074401855469, -0.34111785888671875, -0.3263282775878906, -0.3115386962890625, -0.2967491149902344, -0.28195953369140625, -0.2671699523925781, -0.25238037109375, -0.23759078979492188, -0.22280120849609375, -0.20801162719726562, -0.1932220458984375, -0.17843246459960938, -0.16364288330078125, -0.14885330200195312, -0.134063720703125, -0.11927413940429688, -0.10448455810546875, -0.08969497680664062, -0.0749053955078125, -0.060115814208984375, -0.04532623291015625, -0.030536651611328125, -0.0157470703125, -0.000957489013671875, 0.01383209228515625, 0.028621673583984375, 0.0434112548828125, 0.058200836181640625, 0.07299041748046875, 0.08777999877929688, 0.102569580078125, 0.11735916137695312, 0.13214874267578125, 0.14693832397460938, 0.1617279052734375, 0.17651748657226562, 0.19130706787109375, 0.20609664916992188, 0.22088623046875, 0.23567581176757812, 0.25046539306640625, 0.2652549743652344, 0.2800445556640625, 0.2948341369628906, 0.30962371826171875, 0.3244132995605469, 0.339202880859375, 0.3539924621582031, 0.36878204345703125, 0.3835716247558594, 0.3983612060546875, 0.4131507873535156, 0.42794036865234375, 0.4427299499511719, 0.45751953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 35.0, 29.0, 66.0, 104.0, 200.0, 323.0, 560.0, 1117.0, 2437.0, 5608.0, 15156.0, 46892.0, 171207.0, 476806.0, 234098.0, 61370.0, 19434.0, 7058.0, 2940.0, 1473.0, 696.0, 368.0, 212.0, 103.0, 75.0, 47.0, 36.0, 11.0, 9.0, 10.0, 4.0, 7.0, 2.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.12017822265625, -0.11637687683105469, -0.11257553100585938, -0.10877418518066406, -0.10497283935546875, -0.10117149353027344, -0.09737014770507812, -0.09356880187988281, -0.0897674560546875, -0.08596611022949219, -0.08216476440429688, -0.07836341857910156, -0.07456207275390625, -0.07076072692871094, -0.06695938110351562, -0.06315803527832031, -0.059356689453125, -0.05555534362792969, -0.051753997802734375, -0.04795265197753906, -0.04415130615234375, -0.04034996032714844, -0.036548614501953125, -0.03274726867675781, -0.0289459228515625, -0.025144577026367188, -0.021343231201171875, -0.017541885375976562, -0.01374053955078125, -0.009939193725585938, -0.006137847900390625, -0.0023365020751953125, 0.00146484375, 0.0052661895751953125, 0.009067535400390625, 0.012868881225585938, 0.01667022705078125, 0.020471572875976562, 0.024272918701171875, 0.028074264526367188, 0.0318756103515625, 0.03567695617675781, 0.039478302001953125, 0.04327964782714844, 0.04708099365234375, 0.05088233947753906, 0.054683685302734375, 0.05848503112792969, 0.062286376953125, 0.06608772277832031, 0.06988906860351562, 0.07369041442871094, 0.07749176025390625, 0.08129310607910156, 0.08509445190429688, 0.08889579772949219, 0.0926971435546875, 0.09649848937988281, 0.10029983520507812, 0.10410118103027344, 0.10790252685546875, 0.11170387268066406, 0.11550521850585938, 0.11930656433105469, 0.12310791015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 11.0, 14.0, 13.0, 17.0, 22.0, 27.0, 25.0, 37.0, 35.0, 34.0, 48.0, 50.0, 54.0, 35.0, 43.0, 52.0, 55.0, 48.0, 30.0, 44.0, 40.0, 42.0, 35.0, 37.0, 23.0, 19.0, 21.0, 14.0, 11.0, 8.0, 10.0, 5.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7099609375, -0.6864700317382812, -0.6629791259765625, -0.6394882202148438, -0.615997314453125, -0.5925064086914062, -0.5690155029296875, -0.5455245971679688, -0.52203369140625, -0.49854278564453125, -0.4750518798828125, -0.45156097412109375, -0.428070068359375, -0.40457916259765625, -0.3810882568359375, -0.35759735107421875, -0.3341064453125, -0.31061553955078125, -0.2871246337890625, -0.26363372802734375, -0.240142822265625, -0.21665191650390625, -0.1931610107421875, -0.16967010498046875, -0.14617919921875, -0.12268829345703125, -0.0991973876953125, -0.07570648193359375, -0.052215576171875, -0.02872467041015625, -0.0052337646484375, 0.01825714111328125, 0.041748046875, 0.06523895263671875, 0.0887298583984375, 0.11222076416015625, 0.135711669921875, 0.15920257568359375, 0.1826934814453125, 0.20618438720703125, 0.22967529296875, 0.25316619873046875, 0.2766571044921875, 0.30014801025390625, 0.323638916015625, 0.34712982177734375, 0.3706207275390625, 0.39411163330078125, 0.4176025390625, 0.44109344482421875, 0.4645843505859375, 0.48807525634765625, 0.511566162109375, 0.5350570678710938, 0.5585479736328125, 0.5820388793945312, 0.60552978515625, 0.6290206909179688, 0.6525115966796875, 0.6760025024414062, 0.699493408203125, 0.7229843139648438, 0.7464752197265625, 0.7699661254882812, 0.79345703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 10.0, 33.0, 37.0, 61.0, 143.0, 213.0, 378.0, 922.0, 2184.0, 6491.0, 23357.0, 118118.0, 594906.0, 244463.0, 41226.0, 10345.0, 3246.0, 1199.0, 579.0, 271.0, 145.0, 71.0, 46.0, 26.0, 18.0, 8.0, 5.0, 9.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.05021333694458008, -0.048577308654785156, -0.046941280364990234, -0.04530525207519531, -0.04366922378540039, -0.04203319549560547, -0.04039716720581055, -0.038761138916015625, -0.0371251106262207, -0.03548908233642578, -0.03385305404663086, -0.03221702575683594, -0.030580997467041016, -0.028944969177246094, -0.027308940887451172, -0.02567291259765625, -0.024036884307861328, -0.022400856018066406, -0.020764827728271484, -0.019128799438476562, -0.01749277114868164, -0.01585674285888672, -0.014220714569091797, -0.012584686279296875, -0.010948657989501953, -0.009312629699707031, -0.007676601409912109, -0.0060405731201171875, -0.004404544830322266, -0.0027685165405273438, -0.0011324882507324219, 0.0005035400390625, 0.002139568328857422, 0.0037755966186523438, 0.005411624908447266, 0.0070476531982421875, 0.00868368148803711, 0.010319709777832031, 0.011955738067626953, 0.013591766357421875, 0.015227794647216797, 0.01686382293701172, 0.01849985122680664, 0.020135879516601562, 0.021771907806396484, 0.023407936096191406, 0.025043964385986328, 0.02667999267578125, 0.028316020965576172, 0.029952049255371094, 0.031588077545166016, 0.03322410583496094, 0.03486013412475586, 0.03649616241455078, 0.0381321907043457, 0.039768218994140625, 0.04140424728393555, 0.04304027557373047, 0.04467630386352539, 0.04631233215332031, 0.047948360443115234, 0.049584388732910156, 0.05122041702270508, 0.0528564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 12.0, 13.0, 9.0, 17.0, 17.0, 39.0, 42.0, 68.0, 117.0, 126.0, 101.0, 127.0, 89.0, 60.0, 47.0, 31.0, 26.0, 16.0, 6.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.552436828613281e-05, -3.464706242084503e-05, -3.376975655555725e-05, -3.289245069026947e-05, -3.201514482498169e-05, -3.113783895969391e-05, -3.0260533094406128e-05, -2.9383227229118347e-05, -2.8505921363830566e-05, -2.7628615498542786e-05, -2.6751309633255005e-05, -2.5874003767967224e-05, -2.4996697902679443e-05, -2.4119392037391663e-05, -2.3242086172103882e-05, -2.23647803068161e-05, -2.148747444152832e-05, -2.061016857624054e-05, -1.973286271095276e-05, -1.8855556845664978e-05, -1.7978250980377197e-05, -1.7100945115089417e-05, -1.6223639249801636e-05, -1.5346333384513855e-05, -1.4469027519226074e-05, -1.3591721653938293e-05, -1.2714415788650513e-05, -1.1837109923362732e-05, -1.0959804058074951e-05, -1.008249819278717e-05, -9.20519232749939e-06, -8.327886462211609e-06, -7.450580596923828e-06, -6.573274731636047e-06, -5.695968866348267e-06, -4.818663001060486e-06, -3.941357135772705e-06, -3.0640512704849243e-06, -2.1867454051971436e-06, -1.3094395399093628e-06, -4.3213367462158203e-07, 4.4517219066619873e-07, 1.3224780559539795e-06, 2.1997839212417603e-06, 3.077089786529541e-06, 3.954395651817322e-06, 4.8317015171051025e-06, 5.709007382392883e-06, 6.586313247680664e-06, 7.463619112968445e-06, 8.340924978256226e-06, 9.218230843544006e-06, 1.0095536708831787e-05, 1.0972842574119568e-05, 1.1850148439407349e-05, 1.272745430469513e-05, 1.360476016998291e-05, 1.4482066035270691e-05, 1.535937190055847e-05, 1.6236677765846252e-05, 1.7113983631134033e-05, 1.7991289496421814e-05, 1.8868595361709595e-05, 1.9745901226997375e-05, 2.0623207092285156e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 8.0, 21.0, 42.0, 46.0, 69.0, 124.0, 207.0, 363.0, 564.0, 935.0, 1759.0, 3390.0, 6780.0, 15876.0, 41380.0, 127518.0, 392454.0, 307847.0, 93239.0, 31555.0, 12299.0, 5637.0, 2779.0, 1524.0, 848.0, 485.0, 279.0, 201.0, 118.0, 62.0, 45.0, 34.0, 14.0, 16.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.037506103515625, -0.03643035888671875, -0.0353546142578125, -0.03427886962890625, -0.033203125, -0.03212738037109375, -0.0310516357421875, -0.02997589111328125, -0.028900146484375, -0.02782440185546875, -0.0267486572265625, -0.02567291259765625, -0.02459716796875, -0.02352142333984375, -0.0224456787109375, -0.02136993408203125, -0.020294189453125, -0.01921844482421875, -0.0181427001953125, -0.01706695556640625, -0.0159912109375, -0.01491546630859375, -0.0138397216796875, -0.01276397705078125, -0.011688232421875, -0.01061248779296875, -0.0095367431640625, -0.00846099853515625, -0.00738525390625, -0.00630950927734375, -0.0052337646484375, -0.00415802001953125, -0.003082275390625, -0.00200653076171875, -0.0009307861328125, 0.00014495849609375, 0.001220703125, 0.00229644775390625, 0.0033721923828125, 0.00444793701171875, 0.005523681640625, 0.00659942626953125, 0.0076751708984375, 0.00875091552734375, 0.00982666015625, 0.01090240478515625, 0.0119781494140625, 0.01305389404296875, 0.014129638671875, 0.01520538330078125, 0.0162811279296875, 0.01735687255859375, 0.0184326171875, 0.01950836181640625, 0.0205841064453125, 0.02165985107421875, 0.022735595703125, 0.02381134033203125, 0.0248870849609375, 0.02596282958984375, 0.02703857421875, 0.02811431884765625, 0.0291900634765625, 0.03026580810546875, 0.031341552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 21.0, 31.0, 25.0, 34.0, 70.0, 72.0, 65.0, 97.0, 75.0, 82.0, 78.0, 58.0, 63.0, 47.0, 37.0, 26.0, 16.0, 19.0, 11.0, 12.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.011307954788208008, -0.010950565338134766, -0.010593175888061523, -0.010235786437988281, -0.009878396987915039, -0.009521007537841797, -0.009163618087768555, -0.008806228637695312, -0.00844883918762207, -0.008091449737548828, -0.007734060287475586, -0.007376670837402344, -0.0070192813873291016, -0.006661891937255859, -0.006304502487182617, -0.005947113037109375, -0.005589723587036133, -0.005232334136962891, -0.0048749446868896484, -0.004517555236816406, -0.004160165786743164, -0.003802776336669922, -0.0034453868865966797, -0.0030879974365234375, -0.0027306079864501953, -0.002373218536376953, -0.002015829086303711, -0.0016584396362304688, -0.0013010501861572266, -0.0009436607360839844, -0.0005862712860107422, -0.0002288818359375, 0.0001285076141357422, 0.0004858970642089844, 0.0008432865142822266, 0.0012006759643554688, 0.001558065414428711, 0.0019154548645019531, 0.0022728443145751953, 0.0026302337646484375, 0.0029876232147216797, 0.003345012664794922, 0.003702402114868164, 0.004059791564941406, 0.0044171810150146484, 0.004774570465087891, 0.005131959915161133, 0.005489349365234375, 0.005846738815307617, 0.006204128265380859, 0.0065615177154541016, 0.006918907165527344, 0.007276296615600586, 0.007633686065673828, 0.00799107551574707, 0.008348464965820312, 0.008705854415893555, 0.009063243865966797, 0.009420633316040039, 0.009778022766113281, 0.010135412216186523, 0.010492801666259766, 0.010850191116333008, 0.01120758056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 19.0, 22.0, 26.0, 53.0, 74.0, 164.0, 195.0, 167.0, 83.0, 76.0, 46.0, 21.0, 9.0, 14.0, 10.0, 3.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4605964422225952, -1.4278874397277832, -1.3951785564422607, -1.3624695539474487, -1.3297605514526367, -1.2970515489578247, -1.2643426656723022, -1.2316336631774902, -1.1989246606826782, -1.1662156581878662, -1.1335067749023438, -1.1007977724075317, -1.0680887699127197, -1.0353797674179077, -1.0026708841323853, -0.9699618816375732, -0.937252938747406, -0.9045439958572388, -0.8718349933624268, -0.8391260504722595, -0.8064170479774475, -0.7737081050872803, -0.7409991025924683, -0.708290159702301, -0.6755812168121338, -0.6428722739219666, -0.6101632714271545, -0.5774543285369873, -0.5447453260421753, -0.5120363831520081, -0.47932741045951843, -0.4466184377670288, -0.4139094948768616, -0.38120052218437195, -0.3484915494918823, -0.3157826066017151, -0.2830736041069031, -0.25036466121673584, -0.21765568852424622, -0.1849467158317566, -0.15223774313926697, -0.11952877044677734, -0.08681980520486832, -0.05411083996295929, -0.021401867270469666, 0.011307105422019958, 0.04401606321334839, 0.07672503590583801, 0.10943400859832764, 0.14214298129081726, 0.17485195398330688, 0.20756091177463531, 0.24026988446712494, 0.27297884225845337, 0.305687814950943, 0.3383967876434326, 0.37110576033592224, 0.40381473302841187, 0.4365237057209015, 0.4692326784133911, 0.5019416213035583, 0.5346506237983704, 0.5673595666885376, 0.6000685691833496, 0.6327775120735168]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 4.0, 6.0, 11.0, 21.0, 17.0, 20.0, 26.0, 25.0, 39.0, 45.0, 50.0, 52.0, 46.0, 52.0, 53.0, 43.0, 55.0, 57.0, 46.0, 53.0, 51.0, 28.0, 30.0, 31.0, 28.0, 20.0, 13.0, 20.0, 11.0, 3.0, 8.0, 8.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44822201132774353, -0.4344092905521393, -0.42059656977653503, -0.4067838490009308, -0.39297112822532654, -0.3791584074497223, -0.36534565687179565, -0.3515329360961914, -0.33772021532058716, -0.3239074945449829, -0.31009477376937866, -0.2962820529937744, -0.28246933221817017, -0.2686566114425659, -0.25484389066696167, -0.24103115499019623, -0.22721844911575317, -0.21340572834014893, -0.19959300756454468, -0.18578028678894043, -0.17196756601333618, -0.15815484523773193, -0.1443421095609665, -0.13052938878536224, -0.116716668009758, -0.10290394723415375, -0.0890912264585495, -0.07527849823236465, -0.061465777456760406, -0.04765305668115616, -0.033840328454971313, -0.020027607679367065, -0.006214916706085205, 0.007597805932164192, 0.02141052857041359, 0.035223253071308136, 0.049035973846912384, 0.06284869462251663, 0.07666142284870148, 0.09047414362430573, 0.10428686439990997, 0.11809958517551422, 0.13191230595111847, 0.1457250416278839, 0.15953776240348816, 0.1733504831790924, 0.18716320395469666, 0.2009759247303009, 0.21478864550590515, 0.2286013662815094, 0.24241408705711365, 0.2562268078327179, 0.27003952860832214, 0.2838522493839264, 0.297664999961853, 0.3114777207374573, 0.3252904415130615, 0.33910316228866577, 0.35291588306427, 0.36672860383987427, 0.3805413246154785, 0.39435404539108276, 0.408166766166687, 0.42197948694229126, 0.4357922077178955]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 13.0, 16.0, 23.0, 36.0, 39.0, 60.0, 64.0, 106.0, 118.0, 182.0, 254.0, 359.0, 513.0, 822.0, 1274.0, 2238.0, 4476.0, 10097.0, 35030.0, 373309.0, 551628.0, 44532.0, 11797.0, 4875.0, 2498.0, 1413.0, 840.0, 554.0, 355.0, 282.0, 198.0, 126.0, 97.0, 74.0, 56.0, 47.0, 32.0, 28.0, 20.0, 20.0, 11.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.53271484375, -0.5161056518554688, -0.4994964599609375, -0.48288726806640625, -0.466278076171875, -0.44966888427734375, -0.4330596923828125, -0.41645050048828125, -0.39984130859375, -0.38323211669921875, -0.3666229248046875, -0.35001373291015625, -0.333404541015625, -0.31679534912109375, -0.3001861572265625, -0.28357696533203125, -0.2669677734375, -0.25035858154296875, -0.2337493896484375, -0.21714019775390625, -0.200531005859375, -0.18392181396484375, -0.1673126220703125, -0.15070343017578125, -0.13409423828125, -0.11748504638671875, -0.1008758544921875, -0.08426666259765625, -0.067657470703125, -0.05104827880859375, -0.0344390869140625, -0.01782989501953125, -0.001220703125, 0.01538848876953125, 0.0319976806640625, 0.04860687255859375, 0.065216064453125, 0.08182525634765625, 0.0984344482421875, 0.11504364013671875, 0.13165283203125, 0.14826202392578125, 0.1648712158203125, 0.18148040771484375, 0.198089599609375, 0.21469879150390625, 0.2313079833984375, 0.24791717529296875, 0.2645263671875, 0.28113555908203125, 0.2977447509765625, 0.31435394287109375, 0.330963134765625, 0.34757232666015625, 0.3641815185546875, 0.38079071044921875, 0.39739990234375, 0.41400909423828125, 0.4306182861328125, 0.44722747802734375, 0.463836669921875, 0.48044586181640625, 0.4970550537109375, 0.5136642456054688, 0.5302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 2.0, 6.0, 17.0, 15.0, 17.0, 26.0, 24.0, 52.0, 45.0, 58.0, 57.0, 54.0, 57.0, 63.0, 65.0, 63.0, 53.0, 56.0, 64.0, 33.0, 16.0, 28.0, 30.0, 19.0, 17.0, 11.0, 9.0, 6.0, 2.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9509658813476562, -0.9199981689453125, -0.8890304565429688, -0.858062744140625, -0.8270950317382812, -0.7961273193359375, -0.7651596069335938, -0.73419189453125, -0.7032241821289062, -0.6722564697265625, -0.6412887573242188, -0.610321044921875, -0.5793533325195312, -0.5483856201171875, -0.5174179077148438, -0.4864501953125, -0.45548248291015625, -0.4245147705078125, -0.39354705810546875, -0.362579345703125, -0.33161163330078125, -0.3006439208984375, -0.26967620849609375, -0.23870849609375, -0.20774078369140625, -0.1767730712890625, -0.14580535888671875, -0.114837646484375, -0.08386993408203125, -0.0529022216796875, -0.02193450927734375, 0.009033203125, 0.04000091552734375, 0.0709686279296875, 0.10193634033203125, 0.132904052734375, 0.16387176513671875, 0.1948394775390625, 0.22580718994140625, 0.25677490234375, 0.28774261474609375, 0.3187103271484375, 0.34967803955078125, 0.380645751953125, 0.41161346435546875, 0.4425811767578125, 0.47354888916015625, 0.5045166015625, 0.5354843139648438, 0.5664520263671875, 0.5974197387695312, 0.628387451171875, 0.6593551635742188, 0.6903228759765625, 0.7212905883789062, 0.75225830078125, 0.7832260131835938, 0.8141937255859375, 0.8451614379882812, 0.876129150390625, 0.9070968627929688, 0.9380645751953125, 0.9690322875976562, 1.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 7.0, 12.0, 15.0, 24.0, 40.0, 42.0, 73.0, 101.0, 136.0, 227.0, 404.0, 894.0, 2694.0, 21337.0, 990297.0, 27104.0, 2999.0, 970.0, 476.0, 232.0, 121.0, 96.0, 53.0, 45.0, 30.0, 18.0, 19.0, 14.0, 10.0, 13.0, 15.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0628662109375, -1.021240234375, -0.9796142578125, -0.93798828125, -0.8963623046875, -0.854736328125, -0.8131103515625, -0.771484375, -0.7298583984375, -0.688232421875, -0.6466064453125, -0.60498046875, -0.5633544921875, -0.521728515625, -0.4801025390625, -0.4384765625, -0.3968505859375, -0.355224609375, -0.3135986328125, -0.27197265625, -0.2303466796875, -0.188720703125, -0.1470947265625, -0.10546875, -0.0638427734375, -0.022216796875, 0.0194091796875, 0.06103515625, 0.1026611328125, 0.144287109375, 0.1859130859375, 0.2275390625, 0.2691650390625, 0.310791015625, 0.3524169921875, 0.39404296875, 0.4356689453125, 0.477294921875, 0.5189208984375, 0.560546875, 0.6021728515625, 0.643798828125, 0.6854248046875, 0.72705078125, 0.7686767578125, 0.810302734375, 0.8519287109375, 0.8935546875, 0.9351806640625, 0.976806640625, 1.0184326171875, 1.06005859375, 1.1016845703125, 1.143310546875, 1.1849365234375, 1.2265625, 1.2681884765625, 1.309814453125, 1.3514404296875, 1.39306640625, 1.4346923828125, 1.476318359375, 1.5179443359375, 1.5595703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 3.0, 5.0, 3.0, 8.0, 15.0, 9.0, 15.0, 18.0, 17.0, 17.0, 29.0, 24.0, 23.0, 32.0, 28.0, 36.0, 32.0, 31.0, 44.0, 43.0, 34.0, 45.0, 44.0, 25.0, 38.0, 36.0, 44.0, 42.0, 22.0, 33.0, 22.0, 21.0, 23.0, 25.0, 16.0, 11.0, 10.0, 12.0, 8.0, 6.0, 14.0, 12.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.63330078125, -0.6142730712890625, -0.595245361328125, -0.5762176513671875, -0.55718994140625, -0.5381622314453125, -0.519134521484375, -0.5001068115234375, -0.4810791015625, -0.4620513916015625, -0.443023681640625, -0.4239959716796875, -0.40496826171875, -0.3859405517578125, -0.366912841796875, -0.3478851318359375, -0.328857421875, -0.3098297119140625, -0.290802001953125, -0.2717742919921875, -0.25274658203125, -0.2337188720703125, -0.214691162109375, -0.1956634521484375, -0.1766357421875, -0.1576080322265625, -0.138580322265625, -0.1195526123046875, -0.10052490234375, -0.0814971923828125, -0.062469482421875, -0.0434417724609375, -0.0244140625, -0.0053863525390625, 0.013641357421875, 0.0326690673828125, 0.05169677734375, 0.0707244873046875, 0.089752197265625, 0.1087799072265625, 0.1278076171875, 0.1468353271484375, 0.165863037109375, 0.1848907470703125, 0.20391845703125, 0.2229461669921875, 0.241973876953125, 0.2610015869140625, 0.280029296875, 0.2990570068359375, 0.318084716796875, 0.3371124267578125, 0.35614013671875, 0.3751678466796875, 0.394195556640625, 0.4132232666015625, 0.4322509765625, 0.4512786865234375, 0.470306396484375, 0.4893341064453125, 0.50836181640625, 0.5273895263671875, 0.546417236328125, 0.5654449462890625, 0.58447265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 12.0, 19.0, 41.0, 74.0, 113.0, 257.0, 605.0, 1952.0, 8795.0, 75833.0, 849914.0, 97045.0, 10433.0, 2185.0, 676.0, 273.0, 121.0, 53.0, 45.0, 28.0, 10.0, 6.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19780349731445312, -0.19223785400390625, -0.18667221069335938, -0.1811065673828125, -0.17554092407226562, -0.16997528076171875, -0.16440963745117188, -0.158843994140625, -0.15327835083007812, -0.14771270751953125, -0.14214706420898438, -0.1365814208984375, -0.13101577758789062, -0.12545013427734375, -0.11988449096679688, -0.11431884765625, -0.10875320434570312, -0.10318756103515625, -0.09762191772460938, -0.0920562744140625, -0.08649063110351562, -0.08092498779296875, -0.07535934448242188, -0.069793701171875, -0.06422805786132812, -0.05866241455078125, -0.053096771240234375, -0.0475311279296875, -0.041965484619140625, -0.03639984130859375, -0.030834197998046875, -0.0252685546875, -0.019702911376953125, -0.01413726806640625, -0.008571624755859375, -0.0030059814453125, 0.002559661865234375, 0.00812530517578125, 0.013690948486328125, 0.019256591796875, 0.024822235107421875, 0.03038787841796875, 0.035953521728515625, 0.0415191650390625, 0.047084808349609375, 0.05265045166015625, 0.058216094970703125, 0.06378173828125, 0.06934738159179688, 0.07491302490234375, 0.08047866821289062, 0.0860443115234375, 0.09160995483398438, 0.09717559814453125, 0.10274124145507812, 0.108306884765625, 0.11387252807617188, 0.11943817138671875, 0.12500381469726562, 0.1305694580078125, 0.13613510131835938, 0.14170074462890625, 0.14726638793945312, 0.15283203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 8.0, 13.0, 22.0, 22.0, 34.0, 46.0, 63.0, 80.0, 134.0, 119.0, 113.0, 129.0, 52.0, 41.0, 27.0, 24.0, 10.0, 10.0, 8.0, 4.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5106983482837677e-05, -1.459755003452301e-05, -1.4088116586208344e-05, -1.3578683137893677e-05, -1.306924968957901e-05, -1.2559816241264343e-05, -1.2050382792949677e-05, -1.154094934463501e-05, -1.1031515896320343e-05, -1.0522082448005676e-05, -1.001264899969101e-05, -9.503215551376343e-06, -8.993782103061676e-06, -8.48434865474701e-06, -7.974915206432343e-06, -7.465481758117676e-06, -6.956048309803009e-06, -6.446614861488342e-06, -5.9371814131736755e-06, -5.427747964859009e-06, -4.918314516544342e-06, -4.408881068229675e-06, -3.8994476199150085e-06, -3.390014171600342e-06, -2.880580723285675e-06, -2.3711472749710083e-06, -1.8617138266563416e-06, -1.3522803783416748e-06, -8.428469300270081e-07, -3.334134817123413e-07, 1.7601996660232544e-07, 6.854534149169922e-07, 1.194886863231659e-06, 1.7043203115463257e-06, 2.2137537598609924e-06, 2.723187208175659e-06, 3.232620656490326e-06, 3.7420541048049927e-06, 4.2514875531196594e-06, 4.760921001434326e-06, 5.270354449748993e-06, 5.77978789806366e-06, 6.289221346378326e-06, 6.798654794692993e-06, 7.30808824300766e-06, 7.817521691322327e-06, 8.326955139636993e-06, 8.83638858795166e-06, 9.345822036266327e-06, 9.855255484580994e-06, 1.036468893289566e-05, 1.0874122381210327e-05, 1.1383555829524994e-05, 1.189298927783966e-05, 1.2402422726154327e-05, 1.2911856174468994e-05, 1.3421289622783661e-05, 1.3930723071098328e-05, 1.4440156519412994e-05, 1.4949589967727661e-05, 1.5459023416042328e-05, 1.5968456864356995e-05, 1.647789031267166e-05, 1.6987323760986328e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 20.0, 21.0, 35.0, 70.0, 106.0, 160.0, 276.0, 465.0, 838.0, 1585.0, 3513.0, 9430.0, 41734.0, 594093.0, 352506.0, 29839.0, 7579.0, 2980.0, 1411.0, 738.0, 442.0, 254.0, 171.0, 107.0, 63.0, 35.0, 24.0, 14.0, 9.0, 6.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2088623046875, -0.2036285400390625, -0.198394775390625, -0.1931610107421875, -0.18792724609375, -0.1826934814453125, -0.177459716796875, -0.1722259521484375, -0.1669921875, -0.1617584228515625, -0.156524658203125, -0.1512908935546875, -0.14605712890625, -0.1408233642578125, -0.135589599609375, -0.1303558349609375, -0.1251220703125, -0.1198883056640625, -0.114654541015625, -0.1094207763671875, -0.10418701171875, -0.0989532470703125, -0.093719482421875, -0.0884857177734375, -0.083251953125, -0.0780181884765625, -0.072784423828125, -0.0675506591796875, -0.06231689453125, -0.0570831298828125, -0.051849365234375, -0.0466156005859375, -0.0413818359375, -0.0361480712890625, -0.030914306640625, -0.0256805419921875, -0.02044677734375, -0.0152130126953125, -0.009979248046875, -0.0047454833984375, 0.00048828125, 0.0057220458984375, 0.010955810546875, 0.0161895751953125, 0.02142333984375, 0.0266571044921875, 0.031890869140625, 0.0371246337890625, 0.0423583984375, 0.0475921630859375, 0.052825927734375, 0.0580596923828125, 0.06329345703125, 0.0685272216796875, 0.073760986328125, 0.0789947509765625, 0.084228515625, 0.0894622802734375, 0.094696044921875, 0.0999298095703125, 0.10516357421875, 0.1103973388671875, 0.115631103515625, 0.1208648681640625, 0.1260986328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 3.0, 12.0, 15.0, 26.0, 21.0, 40.0, 61.0, 102.0, 101.0, 150.0, 158.0, 82.0, 85.0, 42.0, 22.0, 20.0, 7.0, 10.0, 6.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0626220703125, -0.06041908264160156, -0.058216094970703125, -0.05601310729980469, -0.05381011962890625, -0.05160713195800781, -0.049404144287109375, -0.04720115661621094, -0.0449981689453125, -0.04279518127441406, -0.040592193603515625, -0.03838920593261719, -0.03618621826171875, -0.03398323059082031, -0.031780242919921875, -0.029577255249023438, -0.027374267578125, -0.025171279907226562, -0.022968292236328125, -0.020765304565429688, -0.01856231689453125, -0.016359329223632812, -0.014156341552734375, -0.011953353881835938, -0.0097503662109375, -0.0075473785400390625, -0.005344390869140625, -0.0031414031982421875, -0.00093841552734375, 0.0012645721435546875, 0.003467559814453125, 0.0056705474853515625, 0.00787353515625, 0.010076522827148438, 0.012279510498046875, 0.014482498168945312, 0.01668548583984375, 0.018888473510742188, 0.021091461181640625, 0.023294448852539062, 0.0254974365234375, 0.027700424194335938, 0.029903411865234375, 0.03210639953613281, 0.03430938720703125, 0.03651237487792969, 0.038715362548828125, 0.04091835021972656, 0.043121337890625, 0.04532432556152344, 0.047527313232421875, 0.04973030090332031, 0.05193328857421875, 0.05413627624511719, 0.056339263916015625, 0.05854225158691406, 0.0607452392578125, 0.06294822692871094, 0.06515121459960938, 0.06735420227050781, 0.06955718994140625, 0.07176017761230469, 0.07396316528320312, 0.07616615295410156, 0.078369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 0.0, 8.0, 10.0, 16.0, 17.0, 38.0, 54.0, 125.0, 190.0, 200.0, 136.0, 77.0, 57.0, 32.0, 14.0, 12.0, 9.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.283629894256592, -3.2141385078430176, -3.1446471214294434, -3.07515549659729, -3.005664110183716, -2.9361727237701416, -2.8666810989379883, -2.797189712524414, -2.72769832611084, -2.6582069396972656, -2.5887155532836914, -2.519223928451538, -2.449732542037964, -2.3802411556243896, -2.3107495307922363, -2.241258144378662, -2.171766757965088, -2.1022753715515137, -2.0327839851379395, -1.9632923603057861, -1.893800973892212, -1.8243095874786377, -1.754818081855774, -1.6853265762329102, -1.615835189819336, -1.5463438034057617, -1.476852297782898, -1.4073607921600342, -1.33786940574646, -1.2683780193328857, -1.198886513710022, -1.1293950080871582, -1.0599033832550049, -0.9904119372367859, -0.9209204912185669, -0.8514290452003479, -0.7819375991821289, -0.7124461531639099, -0.6429547071456909, -0.5734632611274719, -0.5039718151092529, -0.43448036909103394, -0.36498892307281494, -0.29549747705459595, -0.22600603103637695, -0.15651458501815796, -0.08702313899993896, -0.01753169298171997, 0.05195975303649902, 0.12145119905471802, 0.190942645072937, 0.260434091091156, 0.329925537109375, 0.399416983127594, 0.468908429145813, 0.538399875164032, 0.607891321182251, 0.67738276720047, 0.746874213218689, 0.816365659236908, 0.885857105255127, 0.955348551273346, 1.024839997291565, 1.0943315029144287, 1.163822889328003]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 7.0, 11.0, 13.0, 13.0, 20.0, 17.0, 22.0, 36.0, 38.0, 32.0, 29.0, 51.0, 47.0, 46.0, 40.0, 47.0, 38.0, 50.0, 44.0, 53.0, 30.0, 35.0, 44.0, 39.0, 27.0, 28.0, 16.0, 29.0, 20.0, 14.0, 11.0, 2.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3882209062576294, -1.3489383459091187, -1.3096556663513184, -1.2703731060028076, -1.2310905456542969, -1.1918078660964966, -1.1525253057479858, -1.1132426261901855, -1.0739600658416748, -1.034677505493164, -0.9953948259353638, -0.956112265586853, -0.9168296456336975, -0.877547025680542, -0.8382644653320312, -0.7989818453788757, -0.7596992254257202, -0.7204166054725647, -0.6811339855194092, -0.6418514251708984, -0.6025688052177429, -0.5632861852645874, -0.5240036249160767, -0.48472100496292114, -0.4454383850097656, -0.4061557650566101, -0.366873174905777, -0.32759058475494385, -0.28830796480178833, -0.249025359749794, -0.20974275469779968, -0.17046016454696655, -0.13117754459381104, -0.09189493954181671, -0.05261233448982239, -0.013329729437828064, 0.02595287561416626, 0.06523548066616058, 0.10451808571815491, 0.14380067586898804, 0.18308329582214355, 0.22236590087413788, 0.2616485059261322, 0.30093109607696533, 0.34021371603012085, 0.37949633598327637, 0.4187789261341095, 0.4580615162849426, 0.49734413623809814, 0.5366267561912537, 0.5759093761444092, 0.6151919364929199, 0.6544745564460754, 0.693757176399231, 0.7330397367477417, 0.7723223567008972, 0.8116049766540527, 0.8508875966072083, 0.8901702165603638, 0.9294527769088745, 0.96873539686203, 1.0080180168151855, 1.0473005771636963, 1.086583137512207, 1.1258658170700073]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 25.0, 35.0, 45.0, 63.0, 92.0, 152.0, 230.0, 442.0, 959.0, 2669.0, 11402.0, 520328.0, 3621067.0, 29429.0, 4399.0, 1432.0, 581.0, 323.0, 203.0, 104.0, 69.0, 67.0, 50.0, 27.0, 17.0, 14.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9501953125, -1.8785247802734375, -1.806854248046875, -1.7351837158203125, -1.66351318359375, -1.5918426513671875, -1.520172119140625, -1.4485015869140625, -1.3768310546875, -1.3051605224609375, -1.233489990234375, -1.1618194580078125, -1.09014892578125, -1.0184783935546875, -0.946807861328125, -0.8751373291015625, -0.803466796875, -0.7317962646484375, -0.660125732421875, -0.5884552001953125, -0.51678466796875, -0.4451141357421875, -0.373443603515625, -0.3017730712890625, -0.2301025390625, -0.1584320068359375, -0.086761474609375, -0.0150909423828125, 0.05657958984375, 0.1282501220703125, 0.199920654296875, 0.2715911865234375, 0.34326171875, 0.4149322509765625, 0.486602783203125, 0.5582733154296875, 0.62994384765625, 0.7016143798828125, 0.773284912109375, 0.8449554443359375, 0.9166259765625, 0.9882965087890625, 1.059967041015625, 1.1316375732421875, 1.20330810546875, 1.2749786376953125, 1.346649169921875, 1.4183197021484375, 1.489990234375, 1.5616607666015625, 1.633331298828125, 1.7050018310546875, 1.77667236328125, 1.8483428955078125, 1.920013427734375, 1.9916839599609375, 2.0633544921875, 2.1350250244140625, 2.206695556640625, 2.2783660888671875, 2.35003662109375, 2.4217071533203125, 2.493377685546875, 2.5650482177734375, 2.63671875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 5.0, 10.0, 13.0, 13.0, 11.0, 21.0, 17.0, 26.0, 30.0, 44.0, 40.0, 49.0, 57.0, 67.0, 56.0, 57.0, 55.0, 74.0, 62.0, 45.0, 53.0, 39.0, 32.0, 27.0, 17.0, 18.0, 13.0, 11.0, 4.0, 11.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5053939819335938, -0.4863739013671875, -0.46735382080078125, -0.448333740234375, -0.42931365966796875, -0.4102935791015625, -0.39127349853515625, -0.37225341796875, -0.35323333740234375, -0.3342132568359375, -0.31519317626953125, -0.296173095703125, -0.27715301513671875, -0.2581329345703125, -0.23911285400390625, -0.2200927734375, -0.20107269287109375, -0.1820526123046875, -0.16303253173828125, -0.144012451171875, -0.12499237060546875, -0.1059722900390625, -0.08695220947265625, -0.06793212890625, -0.04891204833984375, -0.0298919677734375, -0.01087188720703125, 0.008148193359375, 0.02716827392578125, 0.0461883544921875, 0.06520843505859375, 0.084228515625, 0.10324859619140625, 0.1222686767578125, 0.14128875732421875, 0.160308837890625, 0.17932891845703125, 0.1983489990234375, 0.21736907958984375, 0.23638916015625, 0.25540924072265625, 0.2744293212890625, 0.29344940185546875, 0.312469482421875, 0.33148956298828125, 0.3505096435546875, 0.36952972412109375, 0.3885498046875, 0.40756988525390625, 0.4265899658203125, 0.44561004638671875, 0.464630126953125, 0.48365020751953125, 0.5026702880859375, 0.5216903686523438, 0.54071044921875, 0.5597305297851562, 0.5787506103515625, 0.5977706909179688, 0.616790771484375, 0.6358108520507812, 0.6548309326171875, 0.6738510131835938, 0.69287109375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 10.0, 3.0, 8.0, 16.0, 20.0, 40.0, 43.0, 78.0, 121.0, 187.0, 325.0, 636.0, 1334.0, 3130.0, 8630.0, 34577.0, 472973.0, 3553691.0, 93208.0, 16378.0, 5064.0, 1854.0, 861.0, 447.0, 247.0, 121.0, 88.0, 58.0, 45.0, 30.0, 13.0, 10.0, 5.0, 5.0, 8.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9052734375, -0.87322998046875, -0.8411865234375, -0.80914306640625, -0.777099609375, -0.74505615234375, -0.7130126953125, -0.68096923828125, -0.64892578125, -0.61688232421875, -0.5848388671875, -0.55279541015625, -0.520751953125, -0.48870849609375, -0.4566650390625, -0.42462158203125, -0.392578125, -0.36053466796875, -0.3284912109375, -0.29644775390625, -0.264404296875, -0.23236083984375, -0.2003173828125, -0.16827392578125, -0.13623046875, -0.10418701171875, -0.0721435546875, -0.04010009765625, -0.008056640625, 0.02398681640625, 0.0560302734375, 0.08807373046875, 0.1201171875, 0.15216064453125, 0.1842041015625, 0.21624755859375, 0.248291015625, 0.28033447265625, 0.3123779296875, 0.34442138671875, 0.37646484375, 0.40850830078125, 0.4405517578125, 0.47259521484375, 0.504638671875, 0.53668212890625, 0.5687255859375, 0.60076904296875, 0.6328125, 0.66485595703125, 0.6968994140625, 0.72894287109375, 0.760986328125, 0.79302978515625, 0.8250732421875, 0.85711669921875, 0.88916015625, 0.92120361328125, 0.9532470703125, 0.98529052734375, 1.017333984375, 1.04937744140625, 1.0814208984375, 1.11346435546875, 1.1455078125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 11.0, 16.0, 18.0, 28.0, 45.0, 62.0, 123.0, 277.0, 651.0, 1252.0, 824.0, 352.0, 162.0, 86.0, 56.0, 27.0, 22.0, 10.0, 12.0, 11.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2750701904296875, -0.264739990234375, -0.2544097900390625, -0.24407958984375, -0.2337493896484375, -0.223419189453125, -0.2130889892578125, -0.2027587890625, -0.1924285888671875, -0.182098388671875, -0.1717681884765625, -0.16143798828125, -0.1511077880859375, -0.140777587890625, -0.1304473876953125, -0.1201171875, -0.1097869873046875, -0.099456787109375, -0.0891265869140625, -0.07879638671875, -0.0684661865234375, -0.058135986328125, -0.0478057861328125, -0.0374755859375, -0.0271453857421875, -0.016815185546875, -0.0064849853515625, 0.00384521484375, 0.0141754150390625, 0.024505615234375, 0.0348358154296875, 0.045166015625, 0.0554962158203125, 0.065826416015625, 0.0761566162109375, 0.08648681640625, 0.0968170166015625, 0.107147216796875, 0.1174774169921875, 0.1278076171875, 0.1381378173828125, 0.148468017578125, 0.1587982177734375, 0.16912841796875, 0.1794586181640625, 0.189788818359375, 0.2001190185546875, 0.21044921875, 0.2207794189453125, 0.231109619140625, 0.2414398193359375, 0.25177001953125, 0.2621002197265625, 0.272430419921875, 0.2827606201171875, 0.2930908203125, 0.3034210205078125, 0.313751220703125, 0.3240814208984375, 0.33441162109375, 0.3447418212890625, 0.355072021484375, 0.3654022216796875, 0.375732421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 13.0, 21.0, 32.0, 44.0, 51.0, 70.0, 98.0, 116.0, 114.0, 113.0, 84.0, 45.0, 38.0, 32.0, 24.0, 23.0, 12.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154934048652649, -1.1261039972305298, -1.097273826599121, -1.068443775177002, -1.0396137237548828, -1.0107836723327637, -0.981953501701355, -0.9531234502792358, -0.9242933988571167, -0.8954632878303528, -0.8666332364082336, -0.8378031253814697, -0.8089730739593506, -0.7801429629325867, -0.7513128519058228, -0.7224828004837036, -0.6936526894569397, -0.6648225784301758, -0.6359925270080566, -0.6071624159812927, -0.5783323645591736, -0.5495022535324097, -0.5206722021102905, -0.4918420910835266, -0.4630120098590851, -0.43418192863464355, -0.405351847410202, -0.3765217661857605, -0.3476916551589966, -0.31886160373687744, -0.2900314927101135, -0.261201411485672, -0.23237133026123047, -0.20354124903678894, -0.1747111678123474, -0.1458810716867447, -0.11705099046230316, -0.08822090923786163, -0.05939081311225891, -0.030560731887817383, -0.0017306506633758545, 0.027099434286355972, 0.0559295192360878, 0.08475960791110992, 0.11358968913555145, 0.14241977035999298, 0.1712498664855957, 0.20007994771003723, 0.22891002893447876, 0.2577401101589203, 0.2865701913833618, 0.31540030241012573, 0.3442303538322449, 0.3730604648590088, 0.4018905460834503, 0.43072062730789185, 0.4595507085323334, 0.4883807897567749, 0.5172109007835388, 0.546040952205658, 0.5748710632324219, 0.603701114654541, 0.6325312256813049, 0.6613613367080688, 0.690191388130188]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 21.0, 17.0, 23.0, 28.0, 38.0, 41.0, 47.0, 42.0, 50.0, 52.0, 44.0, 54.0, 59.0, 59.0, 64.0, 63.0, 44.0, 37.0, 36.0, 40.0, 24.0, 21.0, 17.0, 10.0, 14.0, 7.0, 10.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6195239424705505, -0.5981258153915405, -0.5767276287078857, -0.5553295016288757, -0.5339313745498657, -0.5125331878662109, -0.4911350607872009, -0.46973690390586853, -0.44833874702453613, -0.42694059014320374, -0.40554243326187134, -0.38414430618286133, -0.36274614930152893, -0.34134799242019653, -0.3199498653411865, -0.2985517084598541, -0.27715355157852173, -0.25575539469718933, -0.23435725271701813, -0.21295911073684692, -0.19156095385551453, -0.17016279697418213, -0.14876465499401093, -0.12736651301383972, -0.10596835613250732, -0.08457020670175552, -0.06317205727100372, -0.04177390784025192, -0.020375758409500122, 0.0010223910212516785, 0.02242054045200348, 0.04381868243217468, 0.0652167797088623, 0.0866149291396141, 0.1080130785703659, 0.1294112205505371, 0.1508093774318695, 0.1722075343132019, 0.1936056762933731, 0.2150038182735443, 0.2364019751548767, 0.2578001320362091, 0.2791982889175415, 0.3005964159965515, 0.3219945728778839, 0.3433927297592163, 0.3647908568382263, 0.3861890137195587, 0.4075871706008911, 0.4289853274822235, 0.4503834843635559, 0.4717816114425659, 0.4931797683238983, 0.5145779252052307, 0.5359760522842407, 0.5573742389678955, 0.5787723660469055, 0.6001704931259155, 0.6215686798095703, 0.6429668068885803, 0.6643649339675903, 0.6857631206512451, 0.7071612477302551, 0.7285593748092651, 0.7499575614929199]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 5.0, 16.0, 38.0, 30.0, 77.0, 140.0, 276.0, 564.0, 1108.0, 2955.0, 11651.0, 108605.0, 829282.0, 79221.0, 9899.0, 2617.0, 1046.0, 454.0, 235.0, 132.0, 82.0, 47.0, 30.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28537750244140625, -0.2753448486328125, -0.26531219482421875, -0.255279541015625, -0.24524688720703125, -0.2352142333984375, -0.22518157958984375, -0.21514892578125, -0.20511627197265625, -0.1950836181640625, -0.18505096435546875, -0.175018310546875, -0.16498565673828125, -0.1549530029296875, -0.14492034912109375, -0.1348876953125, -0.12485504150390625, -0.1148223876953125, -0.10478973388671875, -0.094757080078125, -0.08472442626953125, -0.0746917724609375, -0.06465911865234375, -0.05462646484375, -0.04459381103515625, -0.0345611572265625, -0.02452850341796875, -0.014495849609375, -0.00446319580078125, 0.0055694580078125, 0.01560211181640625, 0.025634765625, 0.03566741943359375, 0.0457000732421875, 0.05573272705078125, 0.065765380859375, 0.07579803466796875, 0.0858306884765625, 0.09586334228515625, 0.10589599609375, 0.11592864990234375, 0.1259613037109375, 0.13599395751953125, 0.146026611328125, 0.15605926513671875, 0.1660919189453125, 0.17612457275390625, 0.1861572265625, 0.19618988037109375, 0.2062225341796875, 0.21625518798828125, 0.226287841796875, 0.23632049560546875, 0.2463531494140625, 0.25638580322265625, 0.26641845703125, 0.27645111083984375, 0.2864837646484375, 0.29651641845703125, 0.306549072265625, 0.31658172607421875, 0.3266143798828125, 0.33664703369140625, 0.3466796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 18.0, 18.0, 34.0, 36.0, 51.0, 39.0, 48.0, 66.0, 41.0, 50.0, 70.0, 59.0, 59.0, 61.0, 63.0, 42.0, 41.0, 18.0, 36.0, 25.0, 15.0, 14.0, 15.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33837890625, -0.32334136962890625, -0.3083038330078125, -0.29326629638671875, -0.278228759765625, -0.26319122314453125, -0.2481536865234375, -0.23311614990234375, -0.21807861328125, -0.20304107666015625, -0.1880035400390625, -0.17296600341796875, -0.157928466796875, -0.14289093017578125, -0.1278533935546875, -0.11281585693359375, -0.0977783203125, -0.08274078369140625, -0.0677032470703125, -0.05266571044921875, -0.037628173828125, -0.02259063720703125, -0.0075531005859375, 0.00748443603515625, 0.02252197265625, 0.03755950927734375, 0.0525970458984375, 0.06763458251953125, 0.082672119140625, 0.09770965576171875, 0.1127471923828125, 0.12778472900390625, 0.142822265625, 0.15785980224609375, 0.1728973388671875, 0.18793487548828125, 0.202972412109375, 0.21800994873046875, 0.2330474853515625, 0.24808502197265625, 0.26312255859375, 0.27816009521484375, 0.2931976318359375, 0.30823516845703125, 0.323272705078125, 0.33831024169921875, 0.3533477783203125, 0.36838531494140625, 0.3834228515625, 0.39846038818359375, 0.4134979248046875, 0.42853546142578125, 0.443572998046875, 0.45861053466796875, 0.4736480712890625, 0.48868560791015625, 0.50372314453125, 0.5187606811523438, 0.5337982177734375, 0.5488357543945312, 0.563873291015625, 0.5789108276367188, 0.5939483642578125, 0.6089859008789062, 0.6240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 14.0, 7.0, 20.0, 34.0, 31.0, 52.0, 69.0, 114.0, 165.0, 223.0, 330.0, 543.0, 857.0, 1602.0, 2995.0, 6646.0, 15998.0, 46093.0, 180777.0, 517453.0, 194433.0, 49235.0, 16777.0, 6739.0, 3115.0, 1638.0, 894.0, 533.0, 344.0, 241.0, 135.0, 121.0, 83.0, 65.0, 35.0, 28.0, 25.0, 22.0, 13.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1170654296875, -0.11322975158691406, -0.10939407348632812, -0.10555839538574219, -0.10172271728515625, -0.09788703918457031, -0.09405136108398438, -0.09021568298339844, -0.0863800048828125, -0.08254432678222656, -0.07870864868164062, -0.07487297058105469, -0.07103729248046875, -0.06720161437988281, -0.06336593627929688, -0.05953025817871094, -0.055694580078125, -0.05185890197753906, -0.048023223876953125, -0.04418754577636719, -0.04035186767578125, -0.03651618957519531, -0.032680511474609375, -0.028844833374023438, -0.0250091552734375, -0.021173477172851562, -0.017337799072265625, -0.013502120971679688, -0.00966644287109375, -0.0058307647705078125, -0.001995086669921875, 0.0018405914306640625, 0.00567626953125, 0.009511947631835938, 0.013347625732421875, 0.017183303833007812, 0.02101898193359375, 0.024854660034179688, 0.028690338134765625, 0.03252601623535156, 0.0363616943359375, 0.04019737243652344, 0.044033050537109375, 0.04786872863769531, 0.05170440673828125, 0.05554008483886719, 0.059375762939453125, 0.06321144104003906, 0.067047119140625, 0.07088279724121094, 0.07471847534179688, 0.07855415344238281, 0.08238983154296875, 0.08622550964355469, 0.09006118774414062, 0.09389686584472656, 0.0977325439453125, 0.10156822204589844, 0.10540390014648438, 0.10923957824707031, 0.11307525634765625, 0.11691093444824219, 0.12074661254882812, 0.12458229064941406, 0.12841796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 2.0, 4.0, 4.0, 10.0, 3.0, 12.0, 11.0, 6.0, 15.0, 24.0, 8.0, 19.0, 28.0, 21.0, 30.0, 34.0, 35.0, 34.0, 42.0, 38.0, 52.0, 48.0, 42.0, 48.0, 55.0, 50.0, 39.0, 32.0, 36.0, 43.0, 17.0, 26.0, 20.0, 10.0, 23.0, 13.0, 14.0, 3.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61767578125, -0.5970077514648438, -0.5763397216796875, -0.5556716918945312, -0.535003662109375, -0.5143356323242188, -0.4936676025390625, -0.47299957275390625, -0.45233154296875, -0.43166351318359375, -0.4109954833984375, -0.39032745361328125, -0.369659423828125, -0.34899139404296875, -0.3283233642578125, -0.30765533447265625, -0.2869873046875, -0.26631927490234375, -0.2456512451171875, -0.22498321533203125, -0.204315185546875, -0.18364715576171875, -0.1629791259765625, -0.14231109619140625, -0.12164306640625, -0.10097503662109375, -0.0803070068359375, -0.05963897705078125, -0.038970947265625, -0.01830291748046875, 0.0023651123046875, 0.02303314208984375, 0.043701171875, 0.06436920166015625, 0.0850372314453125, 0.10570526123046875, 0.126373291015625, 0.14704132080078125, 0.1677093505859375, 0.18837738037109375, 0.20904541015625, 0.22971343994140625, 0.2503814697265625, 0.27104949951171875, 0.291717529296875, 0.31238555908203125, 0.3330535888671875, 0.35372161865234375, 0.3743896484375, 0.39505767822265625, 0.4157257080078125, 0.43639373779296875, 0.457061767578125, 0.47772979736328125, 0.4983978271484375, 0.5190658569335938, 0.53973388671875, 0.5604019165039062, 0.5810699462890625, 0.6017379760742188, 0.622406005859375, 0.6430740356445312, 0.6637420654296875, 0.6844100952148438, 0.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 11.0, 9.0, 17.0, 39.0, 59.0, 106.0, 179.0, 277.0, 538.0, 1002.0, 1874.0, 4064.0, 9535.0, 27572.0, 107252.0, 521443.0, 287043.0, 57247.0, 17446.0, 6675.0, 2976.0, 1420.0, 738.0, 453.0, 195.0, 125.0, 92.0, 56.0, 30.0, 28.0, 10.0, 8.0, 8.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04376220703125, -0.04229307174682617, -0.040823936462402344, -0.039354801177978516, -0.03788566589355469, -0.03641653060913086, -0.03494739532470703, -0.0334782600402832, -0.032009124755859375, -0.030539989471435547, -0.02907085418701172, -0.02760171890258789, -0.026132583618164062, -0.024663448333740234, -0.023194313049316406, -0.021725177764892578, -0.02025604248046875, -0.018786907196044922, -0.017317771911621094, -0.015848636627197266, -0.014379501342773438, -0.01291036605834961, -0.011441230773925781, -0.009972095489501953, -0.008502960205078125, -0.007033824920654297, -0.005564689636230469, -0.004095554351806641, -0.0026264190673828125, -0.0011572837829589844, 0.00031185150146484375, 0.0017809867858886719, 0.0032501220703125, 0.004719257354736328, 0.006188392639160156, 0.007657527923583984, 0.009126663208007812, 0.01059579849243164, 0.012064933776855469, 0.013534069061279297, 0.015003204345703125, 0.016472339630126953, 0.01794147491455078, 0.01941061019897461, 0.020879745483398438, 0.022348880767822266, 0.023818016052246094, 0.025287151336669922, 0.02675628662109375, 0.028225421905517578, 0.029694557189941406, 0.031163692474365234, 0.03263282775878906, 0.03410196304321289, 0.03557109832763672, 0.03704023361206055, 0.038509368896484375, 0.0399785041809082, 0.04144763946533203, 0.04291677474975586, 0.04438591003417969, 0.045855045318603516, 0.047324180603027344, 0.04879331588745117, 0.050262451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 13.0, 18.0, 16.0, 19.0, 27.0, 48.0, 75.0, 99.0, 143.0, 152.0, 126.0, 78.0, 67.0, 33.0, 15.0, 10.0, 11.0, 17.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.707408905029297e-05, -3.601983189582825e-05, -3.4965574741363525e-05, -3.3911317586898804e-05, -3.285706043243408e-05, -3.180280327796936e-05, -3.074854612350464e-05, -2.9694288969039917e-05, -2.8640031814575195e-05, -2.7585774660110474e-05, -2.6531517505645752e-05, -2.547726035118103e-05, -2.442300319671631e-05, -2.3368746042251587e-05, -2.2314488887786865e-05, -2.1260231733322144e-05, -2.0205974578857422e-05, -1.91517174243927e-05, -1.809746026992798e-05, -1.7043203115463257e-05, -1.5988945960998535e-05, -1.4934688806533813e-05, -1.3880431652069092e-05, -1.282617449760437e-05, -1.1771917343139648e-05, -1.0717660188674927e-05, -9.663403034210205e-06, -8.609145879745483e-06, -7.554888725280762e-06, -6.50063157081604e-06, -5.446374416351318e-06, -4.392117261886597e-06, -3.337860107421875e-06, -2.2836029529571533e-06, -1.2293457984924316e-06, -1.7508864402770996e-07, 8.791685104370117e-07, 1.9334256649017334e-06, 2.987682819366455e-06, 4.041939973831177e-06, 5.0961971282958984e-06, 6.15045428276062e-06, 7.204711437225342e-06, 8.258968591690063e-06, 9.313225746154785e-06, 1.0367482900619507e-05, 1.1421740055084229e-05, 1.247599720954895e-05, 1.3530254364013672e-05, 1.4584511518478394e-05, 1.5638768672943115e-05, 1.6693025827407837e-05, 1.774728298187256e-05, 1.880154013633728e-05, 1.9855797290802002e-05, 2.0910054445266724e-05, 2.1964311599731445e-05, 2.3018568754196167e-05, 2.407282590866089e-05, 2.512708306312561e-05, 2.6181340217590332e-05, 2.7235597372055054e-05, 2.8289854526519775e-05, 2.9344111680984497e-05, 3.039836883544922e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 9.0, 12.0, 28.0, 30.0, 59.0, 93.0, 123.0, 249.0, 433.0, 760.0, 1374.0, 2689.0, 5246.0, 11301.0, 26458.0, 69848.0, 210543.0, 415106.0, 194319.0, 64238.0, 24427.0, 10600.0, 5002.0, 2455.0, 1350.0, 769.0, 386.0, 245.0, 141.0, 80.0, 58.0, 40.0, 22.0, 15.0, 14.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290985107421875, -0.02817368507385254, -0.027248859405517578, -0.026324033737182617, -0.025399208068847656, -0.024474382400512695, -0.023549556732177734, -0.022624731063842773, -0.021699905395507812, -0.02077507972717285, -0.01985025405883789, -0.01892542839050293, -0.01800060272216797, -0.017075777053833008, -0.016150951385498047, -0.015226125717163086, -0.014301300048828125, -0.013376474380493164, -0.012451648712158203, -0.011526823043823242, -0.010601997375488281, -0.00967717170715332, -0.00875234603881836, -0.007827520370483398, -0.0069026947021484375, -0.0059778690338134766, -0.005053043365478516, -0.004128217697143555, -0.0032033920288085938, -0.002278566360473633, -0.0013537406921386719, -0.00042891502380371094, 0.00049591064453125, 0.001420736312866211, 0.002345561981201172, 0.003270387649536133, 0.004195213317871094, 0.005120038986206055, 0.006044864654541016, 0.0069696903228759766, 0.007894515991210938, 0.008819341659545898, 0.00974416732788086, 0.01066899299621582, 0.011593818664550781, 0.012518644332885742, 0.013443470001220703, 0.014368295669555664, 0.015293121337890625, 0.016217947006225586, 0.017142772674560547, 0.018067598342895508, 0.01899242401123047, 0.01991724967956543, 0.02084207534790039, 0.02176690101623535, 0.022691726684570312, 0.023616552352905273, 0.024541378021240234, 0.025466203689575195, 0.026391029357910156, 0.027315855026245117, 0.028240680694580078, 0.02916550636291504, 0.03009033203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 10.0, 17.0, 9.0, 13.0, 13.0, 15.0, 21.0, 29.0, 24.0, 38.0, 56.0, 49.0, 53.0, 64.0, 57.0, 71.0, 60.0, 54.0, 59.0, 51.0, 47.0, 33.0, 35.0, 17.0, 21.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00872039794921875, -0.008465349674224854, -0.008210301399230957, -0.00795525312423706, -0.007700204849243164, -0.007445156574249268, -0.007190108299255371, -0.006935060024261475, -0.006680011749267578, -0.006424963474273682, -0.006169915199279785, -0.005914866924285889, -0.005659818649291992, -0.005404770374298096, -0.005149722099304199, -0.004894673824310303, -0.004639625549316406, -0.00438457727432251, -0.004129528999328613, -0.003874480724334717, -0.0036194324493408203, -0.003364384174346924, -0.0031093358993530273, -0.002854287624359131, -0.0025992393493652344, -0.002344191074371338, -0.0020891427993774414, -0.001834094524383545, -0.0015790462493896484, -0.001323997974395752, -0.0010689496994018555, -0.000813901424407959, -0.0005588531494140625, -0.000303804874420166, -4.875659942626953e-05, 0.00020629167556762695, 0.00046133995056152344, 0.0007163882255554199, 0.0009714365005493164, 0.0012264847755432129, 0.0014815330505371094, 0.0017365813255310059, 0.0019916296005249023, 0.002246677875518799, 0.0025017261505126953, 0.002756774425506592, 0.0030118227005004883, 0.0032668709754943848, 0.0035219192504882812, 0.0037769675254821777, 0.004032015800476074, 0.004287064075469971, 0.004542112350463867, 0.004797160625457764, 0.00505220890045166, 0.005307257175445557, 0.005562305450439453, 0.00581735372543335, 0.006072402000427246, 0.006327450275421143, 0.006582498550415039, 0.0068375468254089355, 0.007092595100402832, 0.0073476433753967285, 0.007602691650390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 20.0, 49.0, 109.0, 232.0, 313.0, 136.0, 61.0, 35.0, 12.0, 9.0, 11.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.4478647708892822, -2.401827335357666, -2.355790138244629, -2.3097527027130127, -2.2637152671813965, -2.2176780700683594, -2.171640634536743, -2.125603199005127, -2.07956600189209, -2.0335285663604736, -1.987491250038147, -1.9414539337158203, -1.895416498184204, -1.8493791818618774, -1.8033418655395508, -1.7573044300079346, -1.7112669944763184, -1.6652296781539917, -1.6191922426223755, -1.5731549263000488, -1.5271174907684326, -1.481080174446106, -1.4350428581237793, -1.389005422592163, -1.3429681062698364, -1.2969307899475098, -1.2508933544158936, -1.204856038093567, -1.1588187217712402, -1.112781286239624, -1.0667439699172974, -1.0207066535949707, -0.9746692180633545, -0.9286318421363831, -0.8825944662094116, -0.836557149887085, -0.7905197739601135, -0.7444823980331421, -0.6984450817108154, -0.652407705783844, -0.6063703298568726, -0.5603329539299011, -0.5142955780029297, -0.468258261680603, -0.4222208857536316, -0.37618350982666016, -0.3301461637020111, -0.28410881757736206, -0.238071471452713, -0.19203411042690277, -0.14599674940109253, -0.09995938837528229, -0.053922027349472046, -0.007884666323661804, 0.03815269470214844, 0.08419004082679749, 0.13022741675376892, 0.17626477777957916, 0.2223021388053894, 0.26833951473236084, 0.3143768608570099, 0.36041420698165894, 0.40645158290863037, 0.4524889290332794, 0.49852630496025085]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 6.0, 4.0, 13.0, 15.0, 21.0, 24.0, 29.0, 34.0, 44.0, 45.0, 53.0, 53.0, 51.0, 60.0, 56.0, 70.0, 78.0, 63.0, 55.0, 41.0, 43.0, 34.0, 25.0, 19.0, 20.0, 10.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42076849937438965, -0.4054759442806244, -0.39018338918685913, -0.37489083409309387, -0.3595982789993286, -0.34430569410324097, -0.3290131688117981, -0.31372058391571045, -0.2984280288219452, -0.28313547372817993, -0.2678429186344147, -0.2525503635406494, -0.23725779354572296, -0.2219652384519577, -0.20667268335819244, -0.191380113363266, -0.17608757317066193, -0.16079501807689667, -0.1455024629831314, -0.13020989298820496, -0.1149173378944397, -0.09962478280067444, -0.08433222770690918, -0.06903966516256332, -0.053747110068798065, -0.03845455124974251, -0.0231619942933321, -0.007869437336921692, 0.007423121482133865, 0.022715680301189423, 0.03800823539495468, 0.05330079793930054, 0.0685933530330658, 0.08388590812683105, 0.09917847067117691, 0.11447102576494217, 0.12976358830928802, 0.14505614340305328, 0.16034869849681854, 0.175641268491745, 0.19093382358551025, 0.2062263786792755, 0.22151893377304077, 0.23681148886680603, 0.2521040439605713, 0.26739662885665894, 0.2826891541481018, 0.29798173904418945, 0.3132742643356323, 0.3285668194293976, 0.34385937452316284, 0.3591519296169281, 0.37444448471069336, 0.389737069606781, 0.4050295948982239, 0.4203221797943115, 0.4356147348880768, 0.45090728998184204, 0.4661998450756073, 0.48149240016937256, 0.4967849552631378, 0.5120775103569031, 0.5273700952529907, 0.5426626205444336, 0.5579552054405212]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 11.0, 12.0, 20.0, 38.0, 71.0, 95.0, 188.0, 329.0, 586.0, 1222.0, 2534.0, 6624.0, 20019.0, 99461.0, 615374.0, 246921.0, 37295.0, 10243.0, 3977.0, 1683.0, 859.0, 397.0, 232.0, 120.0, 76.0, 44.0, 28.0, 24.0, 21.0, 12.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.3608131408691406, -0.34906768798828125, -0.3373222351074219, -0.3255767822265625, -0.3138313293457031, -0.30208587646484375, -0.2903404235839844, -0.278594970703125, -0.2668495178222656, -0.25510406494140625, -0.24335861206054688, -0.2316131591796875, -0.21986770629882812, -0.20812225341796875, -0.19637680053710938, -0.18463134765625, -0.17288589477539062, -0.16114044189453125, -0.14939498901367188, -0.1376495361328125, -0.12590408325195312, -0.11415863037109375, -0.10241317749023438, -0.090667724609375, -0.07892227172851562, -0.06717681884765625, -0.055431365966796875, -0.0436859130859375, -0.031940460205078125, -0.02019500732421875, -0.008449554443359375, 0.0032958984375, 0.015041351318359375, 0.02678680419921875, 0.038532257080078125, 0.0502777099609375, 0.062023162841796875, 0.07376861572265625, 0.08551406860351562, 0.097259521484375, 0.10900497436523438, 0.12075042724609375, 0.13249588012695312, 0.1442413330078125, 0.15598678588867188, 0.16773223876953125, 0.17947769165039062, 0.19122314453125, 0.20296859741210938, 0.21471405029296875, 0.22645950317382812, 0.2382049560546875, 0.24995040893554688, 0.26169586181640625, 0.2734413146972656, 0.285186767578125, 0.2969322204589844, 0.30867767333984375, 0.3204231262207031, 0.3321685791015625, 0.3439140319824219, 0.35565948486328125, 0.3674049377441406, 0.379150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 22.0, 30.0, 37.0, 40.0, 47.0, 60.0, 66.0, 69.0, 85.0, 80.0, 99.0, 85.0, 62.0, 49.0, 43.0, 36.0, 20.0, 15.0, 10.0, 11.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9449996948242188, -0.9041595458984375, -0.8633193969726562, -0.822479248046875, -0.7816390991210938, -0.7407989501953125, -0.6999588012695312, -0.65911865234375, -0.6182785034179688, -0.5774383544921875, -0.5365982055664062, -0.495758056640625, -0.45491790771484375, -0.4140777587890625, -0.37323760986328125, -0.3323974609375, -0.29155731201171875, -0.2507171630859375, -0.20987701416015625, -0.169036865234375, -0.12819671630859375, -0.0873565673828125, -0.04651641845703125, -0.00567626953125, 0.03516387939453125, 0.0760040283203125, 0.11684417724609375, 0.157684326171875, 0.19852447509765625, 0.2393646240234375, 0.28020477294921875, 0.321044921875, 0.36188507080078125, 0.4027252197265625, 0.44356536865234375, 0.484405517578125, 0.5252456665039062, 0.5660858154296875, 0.6069259643554688, 0.64776611328125, 0.6886062622070312, 0.7294464111328125, 0.7702865600585938, 0.811126708984375, 0.8519668579101562, 0.8928070068359375, 0.9336471557617188, 0.9744873046875, 1.0153274536132812, 1.0561676025390625, 1.0970077514648438, 1.137847900390625, 1.1786880493164062, 1.2195281982421875, 1.2603683471679688, 1.30120849609375, 1.3420486450195312, 1.3828887939453125, 1.4237289428710938, 1.464569091796875, 1.5054092407226562, 1.5462493896484375, 1.5870895385742188, 1.6279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 8.0, 13.0, 7.0, 18.0, 21.0, 27.0, 24.0, 40.0, 51.0, 70.0, 92.0, 111.0, 210.0, 450.0, 1397.0, 7774.0, 119225.0, 876392.0, 36915.0, 3872.0, 914.0, 314.0, 132.0, 94.0, 67.0, 60.0, 47.0, 43.0, 35.0, 25.0, 21.0, 17.0, 15.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6001434326171875, -0.579681396484375, -0.5592193603515625, -0.53875732421875, -0.5182952880859375, -0.497833251953125, -0.4773712158203125, -0.4569091796875, -0.4364471435546875, -0.415985107421875, -0.3955230712890625, -0.37506103515625, -0.3545989990234375, -0.334136962890625, -0.3136749267578125, -0.293212890625, -0.2727508544921875, -0.252288818359375, -0.2318267822265625, -0.21136474609375, -0.1909027099609375, -0.170440673828125, -0.1499786376953125, -0.1295166015625, -0.1090545654296875, -0.088592529296875, -0.0681304931640625, -0.04766845703125, -0.0272064208984375, -0.006744384765625, 0.0137176513671875, 0.0341796875, 0.0546417236328125, 0.075103759765625, 0.0955657958984375, 0.11602783203125, 0.1364898681640625, 0.156951904296875, 0.1774139404296875, 0.1978759765625, 0.2183380126953125, 0.238800048828125, 0.2592620849609375, 0.27972412109375, 0.3001861572265625, 0.320648193359375, 0.3411102294921875, 0.361572265625, 0.3820343017578125, 0.402496337890625, 0.4229583740234375, 0.44342041015625, 0.4638824462890625, 0.484344482421875, 0.5048065185546875, 0.5252685546875, 0.5457305908203125, 0.566192626953125, 0.5866546630859375, 0.60711669921875, 0.6275787353515625, 0.648040771484375, 0.6685028076171875, 0.68896484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 8.0, 9.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 25.0, 21.0, 35.0, 29.0, 44.0, 33.0, 44.0, 52.0, 44.0, 41.0, 40.0, 56.0, 51.0, 46.0, 30.0, 43.0, 28.0, 42.0, 33.0, 26.0, 32.0, 26.0, 17.0, 17.0, 10.0, 19.0, 10.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.7499008178710938, -0.7239227294921875, -0.6979446411132812, -0.671966552734375, -0.6459884643554688, -0.6200103759765625, -0.5940322875976562, -0.56805419921875, -0.5420761108398438, -0.5160980224609375, -0.49011993408203125, -0.464141845703125, -0.43816375732421875, -0.4121856689453125, -0.38620758056640625, -0.3602294921875, -0.33425140380859375, -0.3082733154296875, -0.28229522705078125, -0.256317138671875, -0.23033905029296875, -0.2043609619140625, -0.17838287353515625, -0.15240478515625, -0.12642669677734375, -0.1004486083984375, -0.07447052001953125, -0.048492431640625, -0.02251434326171875, 0.0034637451171875, 0.02944183349609375, 0.055419921875, 0.08139801025390625, 0.1073760986328125, 0.13335418701171875, 0.159332275390625, 0.18531036376953125, 0.2112884521484375, 0.23726654052734375, 0.26324462890625, 0.28922271728515625, 0.3152008056640625, 0.34117889404296875, 0.367156982421875, 0.39313507080078125, 0.4191131591796875, 0.44509124755859375, 0.4710693359375, 0.49704742431640625, 0.5230255126953125, 0.5490036010742188, 0.574981689453125, 0.6009597778320312, 0.6269378662109375, 0.6529159545898438, 0.67889404296875, 0.7048721313476562, 0.7308502197265625, 0.7568283081054688, 0.782806396484375, 0.8087844848632812, 0.8347625732421875, 0.8607406616210938, 0.88671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 14.0, 25.0, 48.0, 122.0, 254.0, 668.0, 2547.0, 15920.0, 552025.0, 458691.0, 14703.0, 2317.0, 653.0, 268.0, 106.0, 60.0, 33.0, 20.0, 8.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19370460510253906, -0.18562698364257812, -0.1775493621826172, -0.16947174072265625, -0.1613941192626953, -0.15331649780273438, -0.14523887634277344, -0.1371612548828125, -0.12908363342285156, -0.12100601196289062, -0.11292839050292969, -0.10485076904296875, -0.09677314758300781, -0.08869552612304688, -0.08061790466308594, -0.072540283203125, -0.06446266174316406, -0.056385040283203125, -0.04830741882324219, -0.04022979736328125, -0.03215217590332031, -0.024074554443359375, -0.015996932983398438, -0.0079193115234375, 0.0001583099365234375, 0.008235931396484375, 0.016313552856445312, 0.02439117431640625, 0.03246879577636719, 0.040546417236328125, 0.04862403869628906, 0.05670166015625, 0.06477928161621094, 0.07285690307617188, 0.08093452453613281, 0.08901214599609375, 0.09708976745605469, 0.10516738891601562, 0.11324501037597656, 0.1213226318359375, 0.12940025329589844, 0.13747787475585938, 0.1455554962158203, 0.15363311767578125, 0.1617107391357422, 0.16978836059570312, 0.17786598205566406, 0.185943603515625, 0.19402122497558594, 0.20209884643554688, 0.2101764678955078, 0.21825408935546875, 0.2263317108154297, 0.23440933227539062, 0.24248695373535156, 0.2505645751953125, 0.25864219665527344, 0.2667198181152344, 0.2747974395751953, 0.28287506103515625, 0.2909526824951172, 0.2990303039550781, 0.30710792541503906, 0.315185546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 10.0, 10.0, 14.0, 22.0, 33.0, 45.0, 49.0, 81.0, 113.0, 150.0, 125.0, 118.0, 45.0, 54.0, 37.0, 19.0, 21.0, 5.0, 15.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6941299438476562e-05, -2.629496157169342e-05, -2.564862370491028e-05, -2.5002285838127136e-05, -2.4355947971343994e-05, -2.3709610104560852e-05, -2.306327223777771e-05, -2.2416934370994568e-05, -2.1770596504211426e-05, -2.1124258637428284e-05, -2.047792077064514e-05, -1.9831582903862e-05, -1.9185245037078857e-05, -1.8538907170295715e-05, -1.7892569303512573e-05, -1.724623143672943e-05, -1.659989356994629e-05, -1.5953555703163147e-05, -1.5307217836380005e-05, -1.4660879969596863e-05, -1.401454210281372e-05, -1.3368204236030579e-05, -1.2721866369247437e-05, -1.2075528502464294e-05, -1.1429190635681152e-05, -1.078285276889801e-05, -1.0136514902114868e-05, -9.490177035331726e-06, -8.843839168548584e-06, -8.197501301765442e-06, -7.5511634349823e-06, -6.904825568199158e-06, -6.258487701416016e-06, -5.6121498346328735e-06, -4.9658119678497314e-06, -4.319474101066589e-06, -3.6731362342834473e-06, -3.026798367500305e-06, -2.380460500717163e-06, -1.734122633934021e-06, -1.087784767150879e-06, -4.414469003677368e-07, 2.0489096641540527e-07, 8.512288331985474e-07, 1.4975666999816895e-06, 2.1439045667648315e-06, 2.7902424335479736e-06, 3.4365803003311157e-06, 4.082918167114258e-06, 4.7292560338974e-06, 5.375593900680542e-06, 6.021931767463684e-06, 6.668269634246826e-06, 7.314607501029968e-06, 7.96094536781311e-06, 8.607283234596252e-06, 9.253621101379395e-06, 9.899958968162537e-06, 1.0546296834945679e-05, 1.119263470172882e-05, 1.1838972568511963e-05, 1.2485310435295105e-05, 1.3131648302078247e-05, 1.377798616886139e-05, 1.4424324035644531e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 13.0, 17.0, 23.0, 24.0, 69.0, 67.0, 108.0, 192.0, 309.0, 597.0, 1224.0, 3398.0, 13280.0, 102916.0, 828731.0, 80614.0, 11268.0, 3184.0, 1208.0, 520.0, 278.0, 177.0, 109.0, 72.0, 47.0, 33.0, 23.0, 18.0, 6.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.241455078125, -0.23500823974609375, -0.2285614013671875, -0.22211456298828125, -0.215667724609375, -0.20922088623046875, -0.2027740478515625, -0.19632720947265625, -0.18988037109375, -0.18343353271484375, -0.1769866943359375, -0.17053985595703125, -0.164093017578125, -0.15764617919921875, -0.1511993408203125, -0.14475250244140625, -0.1383056640625, -0.13185882568359375, -0.1254119873046875, -0.11896514892578125, -0.112518310546875, -0.10607147216796875, -0.0996246337890625, -0.09317779541015625, -0.08673095703125, -0.08028411865234375, -0.0738372802734375, -0.06739044189453125, -0.060943603515625, -0.05449676513671875, -0.0480499267578125, -0.04160308837890625, -0.03515625, -0.02870941162109375, -0.0222625732421875, -0.01581573486328125, -0.009368896484375, -0.00292205810546875, 0.0035247802734375, 0.00997161865234375, 0.01641845703125, 0.02286529541015625, 0.0293121337890625, 0.03575897216796875, 0.042205810546875, 0.04865264892578125, 0.0550994873046875, 0.06154632568359375, 0.0679931640625, 0.07444000244140625, 0.0808868408203125, 0.08733367919921875, 0.093780517578125, 0.10022735595703125, 0.1066741943359375, 0.11312103271484375, 0.11956787109375, 0.12601470947265625, 0.1324615478515625, 0.13890838623046875, 0.145355224609375, 0.15180206298828125, 0.1582489013671875, 0.16469573974609375, 0.171142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 10.0, 11.0, 17.0, 23.0, 16.0, 59.0, 52.0, 100.0, 150.0, 157.0, 113.0, 102.0, 51.0, 42.0, 29.0, 23.0, 14.0, 4.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533336639404297, -0.06285667419433594, -0.060379981994628906, -0.057903289794921875, -0.055426597595214844, -0.05294990539550781, -0.05047321319580078, -0.04799652099609375, -0.04551982879638672, -0.04304313659667969, -0.040566444396972656, -0.038089752197265625, -0.035613059997558594, -0.03313636779785156, -0.03065967559814453, -0.0281829833984375, -0.02570629119873047, -0.023229598999023438, -0.020752906799316406, -0.018276214599609375, -0.015799522399902344, -0.013322830200195312, -0.010846138000488281, -0.00836944580078125, -0.005892753601074219, -0.0034160614013671875, -0.0009393692016601562, 0.001537322998046875, 0.004014015197753906, 0.0064907073974609375, 0.008967399597167969, 0.011444091796875, 0.013920783996582031, 0.016397476196289062, 0.018874168395996094, 0.021350860595703125, 0.023827552795410156, 0.026304244995117188, 0.02878093719482422, 0.03125762939453125, 0.03373432159423828, 0.03621101379394531, 0.038687705993652344, 0.041164398193359375, 0.043641090393066406, 0.04611778259277344, 0.04859447479248047, 0.0510711669921875, 0.05354785919189453, 0.05602455139160156, 0.058501243591308594, 0.060977935791015625, 0.06345462799072266, 0.06593132019042969, 0.06840801239013672, 0.07088470458984375, 0.07336139678955078, 0.07583808898925781, 0.07831478118896484, 0.08079147338867188, 0.0832681655883789, 0.08574485778808594, 0.08822154998779297, 0.0906982421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 19.0, 40.0, 84.0, 125.0, 238.0, 241.0, 105.0, 54.0, 27.0, 16.0, 13.0, 7.0, 9.0, 5.0, 1.0, 1.0, 3.0], "bins": [-3.7459495067596436, -3.673616886138916, -3.6012845039367676, -3.52895188331604, -3.4566192626953125, -3.384286880493164, -3.3119542598724365, -3.239621639251709, -3.1672892570495605, -3.094956636428833, -3.0226242542266846, -2.950291633605957, -2.8779590129852295, -2.805626392364502, -2.7332940101623535, -2.660961389541626, -2.5886287689208984, -2.516296148300171, -2.4439637660980225, -2.371631145477295, -2.2992985248565674, -2.22696590423584, -2.1546335220336914, -2.082300901412964, -2.0099682807922363, -1.9376357793807983, -1.8653031587600708, -1.7929706573486328, -1.7206380367279053, -1.6483055353164673, -1.5759730339050293, -1.5036404132843018, -1.4313082695007324, -1.3589757680892944, -1.286643147468567, -1.214310646057129, -1.1419780254364014, -1.0696455240249634, -0.9973130226135254, -0.9249804615974426, -0.8526478409767151, -0.7803152799606323, -0.7079827785491943, -0.6356502175331116, -0.5633176565170288, -0.49098509550094604, -0.41865256428718567, -0.3463200330734253, -0.27398747205734253, -0.20165492594242096, -0.1293223798274994, -0.05698983371257782, 0.01534271240234375, 0.08767527341842651, 0.1600078046321869, 0.23234033584594727, 0.30467289686203003, 0.3770054578781128, 0.44933798909187317, 0.5216705203056335, 0.5940030813217163, 0.6663356423377991, 0.7386682033538818, 0.8110007047653198, 0.8833332657814026]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 14.0, 16.0, 12.0, 14.0, 27.0, 33.0, 33.0, 28.0, 40.0, 37.0, 37.0, 45.0, 40.0, 42.0, 35.0, 46.0, 41.0, 52.0, 34.0, 45.0, 41.0, 43.0, 20.0, 41.0, 29.0, 26.0, 16.0, 23.0, 11.0, 15.0, 8.0, 8.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3355566263198853, -1.291715383529663, -1.247874140739441, -1.2040328979492188, -1.1601916551589966, -1.1163504123687744, -1.0725090503692627, -1.0286678075790405, -0.9848265647888184, -0.9409853219985962, -0.897144079208374, -0.8533028364181519, -0.8094615340232849, -0.7656202912330627, -0.7217790484428406, -0.6779377460479736, -0.6340965628623962, -0.5902553200721741, -0.5464140772819519, -0.502572774887085, -0.4587315320968628, -0.4148902893066406, -0.37104904651641846, -0.3272077739238739, -0.28336653113365173, -0.23952527344226837, -0.195684015750885, -0.15184277296066284, -0.10800151526927948, -0.06416025757789612, -0.02031901478767395, 0.023522257804870605, 0.06736350059509277, 0.11120475828647614, 0.1550460159778595, 0.19888725876808167, 0.24272851645946503, 0.2865697741508484, 0.33041101694107056, 0.3742522895336151, 0.4180935323238373, 0.46193477511405945, 0.505776047706604, 0.5496172904968262, 0.5934585332870483, 0.6372997760772705, 0.6811410188674927, 0.7249823212623596, 0.7688235640525818, 0.812664806842804, 0.8565060496330261, 0.9003473520278931, 0.9441885948181152, 0.9880298376083374, 1.0318710803985596, 1.0757123231887817, 1.119553565979004, 1.163394808769226, 1.2072360515594482, 1.2510772943496704, 1.2949185371398926, 1.3387598991394043, 1.382601022720337, 1.4264423847198486, 1.4702836275100708]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 9.0, 10.0, 14.0, 25.0, 39.0, 64.0, 106.0, 166.0, 339.0, 646.0, 1240.0, 3008.0, 9173.0, 304686.0, 3819075.0, 46396.0, 5381.0, 1983.0, 903.0, 404.0, 259.0, 155.0, 81.0, 41.0, 24.0, 18.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.470733642578125, -1.41021728515625, -1.349700927734375, -1.2891845703125, -1.228668212890625, -1.16815185546875, -1.107635498046875, -1.047119140625, -0.986602783203125, -0.92608642578125, -0.865570068359375, -0.8050537109375, -0.744537353515625, -0.68402099609375, -0.623504638671875, -0.56298828125, -0.502471923828125, -0.44195556640625, -0.381439208984375, -0.3209228515625, -0.260406494140625, -0.19989013671875, -0.139373779296875, -0.078857421875, -0.018341064453125, 0.04217529296875, 0.102691650390625, 0.1632080078125, 0.223724365234375, 0.28424072265625, 0.344757080078125, 0.4052734375, 0.465789794921875, 0.52630615234375, 0.586822509765625, 0.6473388671875, 0.707855224609375, 0.76837158203125, 0.828887939453125, 0.889404296875, 0.949920654296875, 1.01043701171875, 1.070953369140625, 1.1314697265625, 1.191986083984375, 1.25250244140625, 1.313018798828125, 1.37353515625, 1.434051513671875, 1.49456787109375, 1.555084228515625, 1.6156005859375, 1.676116943359375, 1.73663330078125, 1.797149658203125, 1.857666015625, 1.918182373046875, 1.97869873046875, 2.039215087890625, 2.0997314453125, 2.160247802734375, 2.22076416015625, 2.281280517578125, 2.341796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 20.0, 19.0, 30.0, 29.0, 35.0, 35.0, 50.0, 52.0, 53.0, 61.0, 72.0, 70.0, 52.0, 78.0, 56.0, 64.0, 35.0, 23.0, 36.0, 30.0, 17.0, 17.0, 11.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5660552978515625, -0.546661376953125, -0.5272674560546875, -0.50787353515625, -0.4884796142578125, -0.469085693359375, -0.4496917724609375, -0.4302978515625, -0.4109039306640625, -0.391510009765625, -0.3721160888671875, -0.35272216796875, -0.3333282470703125, -0.313934326171875, -0.2945404052734375, -0.275146484375, -0.2557525634765625, -0.236358642578125, -0.2169647216796875, -0.19757080078125, -0.1781768798828125, -0.158782958984375, -0.1393890380859375, -0.1199951171875, -0.1006011962890625, -0.081207275390625, -0.0618133544921875, -0.04241943359375, -0.0230255126953125, -0.003631591796875, 0.0157623291015625, 0.03515625, 0.0545501708984375, 0.073944091796875, 0.0933380126953125, 0.11273193359375, 0.1321258544921875, 0.151519775390625, 0.1709136962890625, 0.1903076171875, 0.2097015380859375, 0.229095458984375, 0.2484893798828125, 0.26788330078125, 0.2872772216796875, 0.306671142578125, 0.3260650634765625, 0.345458984375, 0.3648529052734375, 0.384246826171875, 0.4036407470703125, 0.42303466796875, 0.4424285888671875, 0.461822509765625, 0.4812164306640625, 0.5006103515625, 0.5200042724609375, 0.539398193359375, 0.5587921142578125, 0.57818603515625, 0.5975799560546875, 0.616973876953125, 0.6363677978515625, 0.65576171875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 11.0, 18.0, 38.0, 35.0, 58.0, 110.0, 147.0, 243.0, 371.0, 604.0, 1046.0, 1914.0, 3423.0, 7207.0, 19611.0, 87656.0, 2487563.0, 1483216.0, 69777.0, 17077.0, 6655.0, 3228.0, 1663.0, 991.0, 596.0, 364.0, 199.0, 138.0, 96.0, 68.0, 34.0, 31.0, 20.0, 12.0, 8.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6888809204101562, -0.6673126220703125, -0.6457443237304688, -0.624176025390625, -0.6026077270507812, -0.5810394287109375, -0.5594711303710938, -0.53790283203125, -0.5163345336914062, -0.4947662353515625, -0.47319793701171875, -0.451629638671875, -0.43006134033203125, -0.4084930419921875, -0.38692474365234375, -0.3653564453125, -0.34378814697265625, -0.3222198486328125, -0.30065155029296875, -0.279083251953125, -0.25751495361328125, -0.2359466552734375, -0.21437835693359375, -0.19281005859375, -0.17124176025390625, -0.1496734619140625, -0.12810516357421875, -0.106536865234375, -0.08496856689453125, -0.0634002685546875, -0.04183197021484375, -0.020263671875, 0.00130462646484375, 0.0228729248046875, 0.04444122314453125, 0.066009521484375, 0.08757781982421875, 0.1091461181640625, 0.13071441650390625, 0.15228271484375, 0.17385101318359375, 0.1954193115234375, 0.21698760986328125, 0.238555908203125, 0.26012420654296875, 0.2816925048828125, 0.30326080322265625, 0.3248291015625, 0.34639739990234375, 0.3679656982421875, 0.38953399658203125, 0.411102294921875, 0.43267059326171875, 0.4542388916015625, 0.47580718994140625, 0.49737548828125, 0.5189437866210938, 0.5405120849609375, 0.5620803833007812, 0.583648681640625, 0.6052169799804688, 0.6267852783203125, 0.6483535766601562, 0.669921875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 9.0, 13.0, 28.0, 35.0, 57.0, 110.0, 197.0, 357.0, 690.0, 987.0, 694.0, 374.0, 183.0, 91.0, 67.0, 33.0, 23.0, 11.0, 12.0, 8.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2161865234375, -0.2088489532470703, -0.20151138305664062, -0.19417381286621094, -0.18683624267578125, -0.17949867248535156, -0.17216110229492188, -0.1648235321044922, -0.1574859619140625, -0.1501483917236328, -0.14281082153320312, -0.13547325134277344, -0.12813568115234375, -0.12079811096191406, -0.11346054077148438, -0.10612297058105469, -0.098785400390625, -0.09144783020019531, -0.08411026000976562, -0.07677268981933594, -0.06943511962890625, -0.06209754943847656, -0.054759979248046875, -0.04742240905761719, -0.0400848388671875, -0.03274726867675781, -0.025409698486328125, -0.018072128295898438, -0.01073455810546875, -0.0033969879150390625, 0.003940582275390625, 0.011278152465820312, 0.01861572265625, 0.025953292846679688, 0.033290863037109375, 0.04062843322753906, 0.04796600341796875, 0.05530357360839844, 0.06264114379882812, 0.06997871398925781, 0.0773162841796875, 0.08465385437011719, 0.09199142456054688, 0.09932899475097656, 0.10666656494140625, 0.11400413513183594, 0.12134170532226562, 0.1286792755126953, 0.136016845703125, 0.1433544158935547, 0.15069198608398438, 0.15802955627441406, 0.16536712646484375, 0.17270469665527344, 0.18004226684570312, 0.1873798370361328, 0.1947174072265625, 0.2020549774169922, 0.20939254760742188, 0.21673011779785156, 0.22406768798828125, 0.23140525817871094, 0.23874282836914062, 0.2460803985595703, 0.25341796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 9.0, 15.0, 25.0, 30.0, 45.0, 65.0, 104.0, 115.0, 153.0, 121.0, 73.0, 61.0, 48.0, 27.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.006345510482788, -0.9785889387130737, -0.9508323669433594, -0.923075795173645, -0.8953192234039307, -0.8675626516342163, -0.839806079864502, -0.8120495080947876, -0.7842929363250732, -0.7565363645553589, -0.7287797927856445, -0.7010232210159302, -0.6732666492462158, -0.6455100774765015, -0.6177535057067871, -0.5899969339370728, -0.5622404217720032, -0.5344838500022888, -0.5067272782325745, -0.4789707064628601, -0.45121413469314575, -0.4234575629234314, -0.39570102095603943, -0.3679444491863251, -0.3401878774166107, -0.31243130564689636, -0.284674733877182, -0.25691819190979004, -0.2291616052389145, -0.20140503346920013, -0.17364847660064697, -0.14589190483093262, -0.11813539266586304, -0.09037882089614868, -0.06262225657701492, -0.034865692257881165, -0.007109120488166809, 0.020647451281547546, 0.04840400815010071, 0.07616057991981506, 0.10391715168952942, 0.13167372345924377, 0.15943029522895813, 0.1871868520975113, 0.21494342386722565, 0.24269999563694, 0.27045655250549316, 0.2982131242752075, 0.3259696960449219, 0.35372626781463623, 0.3814828395843506, 0.40923941135406494, 0.4369959831237793, 0.46475255489349365, 0.4925090968608856, 0.5202656984329224, 0.5480222702026367, 0.5757788419723511, 0.6035354137420654, 0.6312919855117798, 0.6590485572814941, 0.6868051290512085, 0.7145617008209229, 0.7423182725906372, 0.7700747847557068]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 6.0, 17.0, 24.0, 26.0, 25.0, 31.0, 31.0, 41.0, 43.0, 45.0, 52.0, 45.0, 60.0, 58.0, 60.0, 62.0, 53.0, 52.0, 44.0, 39.0, 33.0, 25.0, 26.0, 23.0, 14.0, 21.0, 11.0, 11.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5457655191421509, -0.5264434814453125, -0.5071214437484741, -0.48779940605163574, -0.46847739815711975, -0.44915536046028137, -0.429833322763443, -0.410511314868927, -0.3911892771720886, -0.37186723947525024, -0.35254520177841187, -0.3332231640815735, -0.3139011561870575, -0.2945791184902191, -0.27525708079338074, -0.25593507289886475, -0.23661300539970398, -0.2172909677028656, -0.19796894490718842, -0.17864690721035004, -0.15932488441467285, -0.14000284671783447, -0.1206808090209961, -0.10135878622531891, -0.08203674852848053, -0.06271471828222275, -0.04339268431067467, -0.024070650339126587, -0.004748620092868805, 0.014573410153388977, 0.033895447850227356, 0.05321747064590454, 0.07253950834274292, 0.0918615385890007, 0.11118356883525848, 0.13050560653209686, 0.14982762932777405, 0.16914966702461243, 0.1884717047214508, 0.207793727517128, 0.22711576521396637, 0.24643780291080475, 0.26575982570648193, 0.2850818634033203, 0.3044039011001587, 0.32372593879699707, 0.34304797649383545, 0.36236998438835144, 0.3816920220851898, 0.4010140597820282, 0.4203360974788666, 0.43965810537338257, 0.45898014307022095, 0.4783021807670593, 0.4976242184638977, 0.5169462561607361, 0.5362682938575745, 0.5555903315544128, 0.5749123692512512, 0.5942344069480896, 0.613556444644928, 0.6328784227371216, 0.65220046043396, 0.6715224981307983, 0.6908445358276367]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 7.0, 12.0, 9.0, 19.0, 27.0, 32.0, 43.0, 58.0, 67.0, 116.0, 170.0, 254.0, 452.0, 746.0, 1424.0, 2700.0, 5500.0, 11426.0, 26122.0, 66329.0, 197824.0, 419762.0, 198922.0, 66516.0, 26680.0, 11607.0, 5531.0, 2711.0, 1411.0, 781.0, 432.0, 287.0, 176.0, 103.0, 89.0, 50.0, 40.0, 31.0, 20.0, 13.0, 11.0, 5.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0755615234375, -0.07316303253173828, -0.07076454162597656, -0.06836605072021484, -0.06596755981445312, -0.0635690689086914, -0.06117057800292969, -0.05877208709716797, -0.05637359619140625, -0.05397510528564453, -0.05157661437988281, -0.049178123474121094, -0.046779632568359375, -0.044381141662597656, -0.04198265075683594, -0.03958415985107422, -0.0371856689453125, -0.03478717803955078, -0.03238868713378906, -0.029990196228027344, -0.027591705322265625, -0.025193214416503906, -0.022794723510742188, -0.02039623260498047, -0.01799774169921875, -0.015599250793457031, -0.013200759887695312, -0.010802268981933594, -0.008403778076171875, -0.006005287170410156, -0.0036067962646484375, -0.0012083053588867188, 0.001190185546875, 0.0035886764526367188, 0.0059871673583984375, 0.008385658264160156, 0.010784149169921875, 0.013182640075683594, 0.015581130981445312, 0.01797962188720703, 0.02037811279296875, 0.02277660369873047, 0.025175094604492188, 0.027573585510253906, 0.029972076416015625, 0.032370567321777344, 0.03476905822753906, 0.03716754913330078, 0.0395660400390625, 0.04196453094482422, 0.04436302185058594, 0.046761512756347656, 0.049160003662109375, 0.051558494567871094, 0.05395698547363281, 0.05635547637939453, 0.05875396728515625, 0.06115245819091797, 0.06355094909667969, 0.0659494400024414, 0.06834793090820312, 0.07074642181396484, 0.07314491271972656, 0.07554340362548828, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 12.0, 15.0, 32.0, 28.0, 35.0, 51.0, 54.0, 65.0, 77.0, 93.0, 89.0, 92.0, 70.0, 64.0, 47.0, 35.0, 42.0, 21.0, 25.0, 16.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4050445556640625, -0.387725830078125, -0.3704071044921875, -0.35308837890625, -0.3357696533203125, -0.318450927734375, -0.3011322021484375, -0.2838134765625, -0.2664947509765625, -0.249176025390625, -0.2318572998046875, -0.21453857421875, -0.1972198486328125, -0.179901123046875, -0.1625823974609375, -0.145263671875, -0.1279449462890625, -0.110626220703125, -0.0933074951171875, -0.07598876953125, -0.0586700439453125, -0.041351318359375, -0.0240325927734375, -0.0067138671875, 0.0106048583984375, 0.027923583984375, 0.0452423095703125, 0.06256103515625, 0.0798797607421875, 0.097198486328125, 0.1145172119140625, 0.1318359375, 0.1491546630859375, 0.166473388671875, 0.1837921142578125, 0.20111083984375, 0.2184295654296875, 0.235748291015625, 0.2530670166015625, 0.2703857421875, 0.2877044677734375, 0.305023193359375, 0.3223419189453125, 0.33966064453125, 0.3569793701171875, 0.374298095703125, 0.3916168212890625, 0.408935546875, 0.4262542724609375, 0.443572998046875, 0.4608917236328125, 0.47821044921875, 0.4955291748046875, 0.512847900390625, 0.5301666259765625, 0.5474853515625, 0.5648040771484375, 0.582122802734375, 0.5994415283203125, 0.61676025390625, 0.6340789794921875, 0.651397705078125, 0.6687164306640625, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 19.0, 13.0, 18.0, 33.0, 46.0, 46.0, 105.0, 153.0, 248.0, 349.0, 634.0, 1089.0, 1856.0, 3389.0, 6196.0, 12906.0, 27814.0, 65877.0, 168063.0, 344421.0, 241246.0, 96810.0, 39893.0, 18068.0, 8680.0, 4504.0, 2505.0, 1403.0, 787.0, 493.0, 295.0, 178.0, 140.0, 77.0, 50.0, 47.0, 29.0, 26.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.0538783073425293, -0.052000999450683594, -0.05012369155883789, -0.04824638366699219, -0.046369075775146484, -0.04449176788330078, -0.04261445999145508, -0.040737152099609375, -0.03885984420776367, -0.03698253631591797, -0.035105228424072266, -0.03322792053222656, -0.03135061264038086, -0.029473304748535156, -0.027595996856689453, -0.02571868896484375, -0.023841381072998047, -0.021964073181152344, -0.02008676528930664, -0.018209457397460938, -0.016332149505615234, -0.014454841613769531, -0.012577533721923828, -0.010700225830078125, -0.008822917938232422, -0.006945610046386719, -0.005068302154541016, -0.0031909942626953125, -0.0013136863708496094, 0.0005636215209960938, 0.002440929412841797, 0.0043182373046875, 0.006195545196533203, 0.008072853088378906, 0.00995016098022461, 0.011827468872070312, 0.013704776763916016, 0.015582084655761719, 0.017459392547607422, 0.019336700439453125, 0.021214008331298828, 0.02309131622314453, 0.024968624114990234, 0.026845932006835938, 0.02872323989868164, 0.030600547790527344, 0.03247785568237305, 0.03435516357421875, 0.03623247146606445, 0.038109779357910156, 0.03998708724975586, 0.04186439514160156, 0.043741703033447266, 0.04561901092529297, 0.04749631881713867, 0.049373626708984375, 0.05125093460083008, 0.05312824249267578, 0.055005550384521484, 0.05688285827636719, 0.05876016616821289, 0.060637474060058594, 0.0625147819519043, 0.06439208984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 11.0, 7.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 31.0, 20.0, 30.0, 48.0, 38.0, 41.0, 46.0, 56.0, 43.0, 42.0, 47.0, 41.0, 44.0, 41.0, 36.0, 34.0, 29.0, 22.0, 22.0, 22.0, 24.0, 24.0, 14.0, 8.0, 14.0, 12.0, 9.0, 6.0, 11.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57763671875, -0.5601806640625, -0.542724609375, -0.5252685546875, -0.5078125, -0.4903564453125, -0.472900390625, -0.4554443359375, -0.43798828125, -0.4205322265625, -0.403076171875, -0.3856201171875, -0.3681640625, -0.3507080078125, -0.333251953125, -0.3157958984375, -0.29833984375, -0.2808837890625, -0.263427734375, -0.2459716796875, -0.228515625, -0.2110595703125, -0.193603515625, -0.1761474609375, -0.15869140625, -0.1412353515625, -0.123779296875, -0.1063232421875, -0.0888671875, -0.0714111328125, -0.053955078125, -0.0364990234375, -0.01904296875, -0.0015869140625, 0.015869140625, 0.0333251953125, 0.05078125, 0.0682373046875, 0.085693359375, 0.1031494140625, 0.12060546875, 0.1380615234375, 0.155517578125, 0.1729736328125, 0.1904296875, 0.2078857421875, 0.225341796875, 0.2427978515625, 0.26025390625, 0.2777099609375, 0.295166015625, 0.3126220703125, 0.330078125, 0.3475341796875, 0.364990234375, 0.3824462890625, 0.39990234375, 0.4173583984375, 0.434814453125, 0.4522705078125, 0.4697265625, 0.4871826171875, 0.504638671875, 0.5220947265625, 0.53955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 14.0, 19.0, 28.0, 38.0, 55.0, 124.0, 229.0, 448.0, 850.0, 2068.0, 5245.0, 16776.0, 72480.0, 459626.0, 403635.0, 63116.0, 15177.0, 4865.0, 1988.0, 886.0, 423.0, 181.0, 105.0, 73.0, 43.0, 18.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443115234375, -0.04314422607421875, -0.0419769287109375, -0.04080963134765625, -0.039642333984375, -0.03847503662109375, -0.0373077392578125, -0.03614044189453125, -0.03497314453125, -0.03380584716796875, -0.0326385498046875, -0.03147125244140625, -0.030303955078125, -0.02913665771484375, -0.0279693603515625, -0.02680206298828125, -0.025634765625, -0.02446746826171875, -0.0233001708984375, -0.02213287353515625, -0.020965576171875, -0.01979827880859375, -0.0186309814453125, -0.01746368408203125, -0.01629638671875, -0.01512908935546875, -0.0139617919921875, -0.01279449462890625, -0.011627197265625, -0.01045989990234375, -0.0092926025390625, -0.00812530517578125, -0.0069580078125, -0.00579071044921875, -0.0046234130859375, -0.00345611572265625, -0.002288818359375, -0.00112152099609375, 4.57763671875e-05, 0.00121307373046875, 0.00238037109375, 0.00354766845703125, 0.0047149658203125, 0.00588226318359375, 0.007049560546875, 0.00821685791015625, 0.0093841552734375, 0.01055145263671875, 0.01171875, 0.01288604736328125, 0.0140533447265625, 0.01522064208984375, 0.016387939453125, 0.01755523681640625, 0.0187225341796875, 0.01988983154296875, 0.02105712890625, 0.02222442626953125, 0.0233917236328125, 0.02455902099609375, 0.025726318359375, 0.02689361572265625, 0.0280609130859375, 0.02922821044921875, 0.0303955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 20.0, 20.0, 20.0, 41.0, 55.0, 96.0, 104.0, 129.0, 148.0, 92.0, 78.0, 50.0, 32.0, 26.0, 17.0, 14.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7583370208740234e-05, -1.690257340669632e-05, -1.6221776604652405e-05, -1.554097980260849e-05, -1.4860183000564575e-05, -1.417938619852066e-05, -1.3498589396476746e-05, -1.281779259443283e-05, -1.2136995792388916e-05, -1.1456198990345001e-05, -1.0775402188301086e-05, -1.0094605386257172e-05, -9.413808584213257e-06, -8.733011782169342e-06, -8.052214980125427e-06, -7.3714181780815125e-06, -6.690621376037598e-06, -6.009824573993683e-06, -5.329027771949768e-06, -4.648230969905853e-06, -3.9674341678619385e-06, -3.2866373658180237e-06, -2.605840563774109e-06, -1.925043761730194e-06, -1.2442469596862793e-06, -5.634501576423645e-07, 1.1734664440155029e-07, 7.981434464454651e-07, 1.4789402484893799e-06, 2.1597370505332947e-06, 2.8405338525772095e-06, 3.5213306546211243e-06, 4.202127456665039e-06, 4.882924258708954e-06, 5.563721060752869e-06, 6.2445178627967834e-06, 6.925314664840698e-06, 7.606111466884613e-06, 8.286908268928528e-06, 8.967705070972443e-06, 9.648501873016357e-06, 1.0329298675060272e-05, 1.1010095477104187e-05, 1.1690892279148102e-05, 1.2371689081192017e-05, 1.3052485883235931e-05, 1.3733282685279846e-05, 1.4414079487323761e-05, 1.5094876289367676e-05, 1.577567309141159e-05, 1.6456469893455505e-05, 1.713726669549942e-05, 1.7818063497543335e-05, 1.849886029958725e-05, 1.9179657101631165e-05, 1.986045390367508e-05, 2.0541250705718994e-05, 2.122204750776291e-05, 2.1902844309806824e-05, 2.258364111185074e-05, 2.3264437913894653e-05, 2.3945234715938568e-05, 2.4626031517982483e-05, 2.5306828320026398e-05, 2.5987625122070312e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 5.0, 10.0, 17.0, 16.0, 30.0, 37.0, 55.0, 88.0, 119.0, 221.0, 332.0, 605.0, 1058.0, 1968.0, 3654.0, 7472.0, 16687.0, 41348.0, 112174.0, 319239.0, 341410.0, 123158.0, 44183.0, 17858.0, 8037.0, 3926.0, 2087.0, 1114.0, 647.0, 401.0, 223.0, 119.0, 76.0, 53.0, 43.0, 19.0, 22.0, 11.0, 10.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0227508544921875, -0.022062301635742188, -0.021373748779296875, -0.020685195922851562, -0.01999664306640625, -0.019308090209960938, -0.018619537353515625, -0.017930984497070312, -0.017242431640625, -0.016553878784179688, -0.015865325927734375, -0.015176773071289062, -0.01448822021484375, -0.013799667358398438, -0.013111114501953125, -0.012422561645507812, -0.0117340087890625, -0.011045455932617188, -0.010356903076171875, -0.009668350219726562, -0.00897979736328125, -0.008291244506835938, -0.007602691650390625, -0.0069141387939453125, -0.0062255859375, -0.0055370330810546875, -0.004848480224609375, -0.0041599273681640625, -0.00347137451171875, -0.0027828216552734375, -0.002094268798828125, -0.0014057159423828125, -0.0007171630859375, -2.86102294921875e-05, 0.000659942626953125, 0.0013484954833984375, 0.00203704833984375, 0.0027256011962890625, 0.003414154052734375, 0.0041027069091796875, 0.004791259765625, 0.0054798126220703125, 0.006168365478515625, 0.0068569183349609375, 0.00754547119140625, 0.008234024047851562, 0.008922576904296875, 0.009611129760742188, 0.0102996826171875, 0.010988235473632812, 0.011676788330078125, 0.012365341186523438, 0.01305389404296875, 0.013742446899414062, 0.014430999755859375, 0.015119552612304688, 0.01580810546875, 0.016496658325195312, 0.017185211181640625, 0.017873764038085938, 0.01856231689453125, 0.019250869750976562, 0.019939422607421875, 0.020627975463867188, 0.0213165283203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 15.0, 6.0, 16.0, 21.0, 21.0, 28.0, 43.0, 46.0, 50.0, 53.0, 56.0, 85.0, 65.0, 60.0, 66.0, 70.0, 55.0, 48.0, 32.0, 30.0, 20.0, 24.0, 18.0, 17.0, 11.0, 4.0, 7.0, 2.0, 3.0, 7.0, 0.0, 5.0, 1.0, 1.0], "bins": [-0.010040283203125, -0.009804010391235352, -0.009567737579345703, -0.009331464767456055, -0.009095191955566406, -0.008858919143676758, -0.00862264633178711, -0.008386373519897461, -0.008150100708007812, -0.007913827896118164, -0.007677555084228516, -0.007441282272338867, -0.007205009460449219, -0.00696873664855957, -0.006732463836669922, -0.0064961910247802734, -0.006259918212890625, -0.0060236454010009766, -0.005787372589111328, -0.00555109977722168, -0.005314826965332031, -0.005078554153442383, -0.004842281341552734, -0.004606008529663086, -0.0043697357177734375, -0.004133462905883789, -0.0038971900939941406, -0.003660917282104492, -0.0034246444702148438, -0.0031883716583251953, -0.002952098846435547, -0.0027158260345458984, -0.00247955322265625, -0.0022432804107666016, -0.002007007598876953, -0.0017707347869873047, -0.0015344619750976562, -0.0012981891632080078, -0.0010619163513183594, -0.0008256435394287109, -0.0005893707275390625, -0.00035309791564941406, -0.00011682510375976562, 0.00011944770812988281, 0.00035572052001953125, 0.0005919933319091797, 0.0008282661437988281, 0.0010645389556884766, 0.001300811767578125, 0.0015370845794677734, 0.0017733573913574219, 0.0020096302032470703, 0.0022459030151367188, 0.002482175827026367, 0.0027184486389160156, 0.002954721450805664, 0.0031909942626953125, 0.003427267074584961, 0.0036635398864746094, 0.003899812698364258, 0.004136085510253906, 0.004372358322143555, 0.004608631134033203, 0.0048449039459228516, 0.0050811767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 12.0, 15.0, 43.0, 98.0, 275.0, 335.0, 137.0, 35.0, 23.0, 11.0, 13.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.4358296394348145, -2.389970541000366, -2.344111204147339, -2.2982521057128906, -2.2523930072784424, -2.206533670425415, -2.160674571990967, -2.1148154735565186, -2.0689563751220703, -2.023097276687622, -1.9772380590438843, -1.9313788414001465, -1.8855197429656982, -1.8396605253219604, -1.7938013076782227, -1.7479422092437744, -1.702082872390747, -1.6562236547470093, -1.610364556312561, -1.5645053386688232, -1.518646240234375, -1.4727870225906372, -1.4269278049468994, -1.3810687065124512, -1.3352094888687134, -1.2893502712249756, -1.2434911727905273, -1.1976319551467896, -1.1517727375030518, -1.1059136390686035, -1.0600544214248657, -1.014195203781128, -0.9683359861373901, -0.9224768280982971, -0.8766176700592041, -0.8307584524154663, -0.7848992943763733, -0.7390401363372803, -0.6931809186935425, -0.6473217606544495, -0.6014626026153564, -0.5556034445762634, -0.5097442865371704, -0.4638850688934326, -0.4180259108543396, -0.3721667528152466, -0.3263075649738312, -0.28044837713241577, -0.23458921909332275, -0.18873004615306854, -0.14287087321281433, -0.09701170027256012, -0.05115252733230591, -0.005293354392051697, 0.040565818548202515, 0.08642500638961792, 0.13228416442871094, 0.17814333736896515, 0.22400251030921936, 0.26986169815063477, 0.3157208561897278, 0.3615800142288208, 0.4074392020702362, 0.4532983899116516, 0.49915754795074463]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 14.0, 23.0, 23.0, 21.0, 37.0, 40.0, 37.0, 52.0, 52.0, 64.0, 66.0, 68.0, 69.0, 72.0, 57.0, 62.0, 42.0, 38.0, 36.0, 27.0, 17.0, 20.0, 16.0, 13.0, 6.0, 3.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3846094310283661, -0.37079745531082153, -0.35698550939559937, -0.3431735336780548, -0.32936158776283264, -0.3155496120452881, -0.3017376661300659, -0.28792569041252136, -0.2741137146949768, -0.26030173897743225, -0.24648979306221008, -0.23267781734466553, -0.21886587142944336, -0.2050538957118988, -0.19124193489551544, -0.17742997407913208, -0.1636180281639099, -0.14980606734752655, -0.1359941065311432, -0.12218213826417923, -0.10837017744779587, -0.0945582166314125, -0.08074624836444855, -0.06693428754806519, -0.053122326731681824, -0.03931036591529846, -0.0254984013736248, -0.011686436831951141, 0.0021255239844322205, 0.015937484800815582, 0.02974945306777954, 0.0435614138841629, 0.057373374700546265, 0.07118533551692963, 0.08499729633331299, 0.09880926460027695, 0.11262122541666031, 0.12643319368362427, 0.14024515450000763, 0.154057115316391, 0.16786907613277435, 0.18168103694915771, 0.19549299776554108, 0.20930495858192444, 0.223116934299469, 0.23692888021469116, 0.2507408559322357, 0.2645528316497803, 0.27836477756500244, 0.292176753282547, 0.30598869919776917, 0.3198006749153137, 0.3336126208305359, 0.34742459654808044, 0.361236572265625, 0.37504851818084717, 0.38886046409606934, 0.4026724398136139, 0.41648438572883606, 0.4302963614463806, 0.4441083073616028, 0.45792028307914734, 0.4717322587966919, 0.48554420471191406, 0.4993561804294586]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 7.0, 19.0, 23.0, 35.0, 48.0, 75.0, 126.0, 241.0, 375.0, 723.0, 1237.0, 2643.0, 6032.0, 16155.0, 59343.0, 378934.0, 477513.0, 73438.0, 18814.0, 6755.0, 2816.0, 1381.0, 715.0, 434.0, 236.0, 156.0, 89.0, 64.0, 26.0, 29.0, 18.0, 12.0, 12.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.26369476318359375, -0.2539520263671875, -0.24420928955078125, -0.234466552734375, -0.22472381591796875, -0.2149810791015625, -0.20523834228515625, -0.19549560546875, -0.18575286865234375, -0.1760101318359375, -0.16626739501953125, -0.156524658203125, -0.14678192138671875, -0.1370391845703125, -0.12729644775390625, -0.1175537109375, -0.10781097412109375, -0.0980682373046875, -0.08832550048828125, -0.078582763671875, -0.06884002685546875, -0.0590972900390625, -0.04935455322265625, -0.03961181640625, -0.02986907958984375, -0.0201263427734375, -0.01038360595703125, -0.000640869140625, 0.00910186767578125, 0.0188446044921875, 0.02858734130859375, 0.038330078125, 0.04807281494140625, 0.0578155517578125, 0.06755828857421875, 0.077301025390625, 0.08704376220703125, 0.0967864990234375, 0.10652923583984375, 0.11627197265625, 0.12601470947265625, 0.1357574462890625, 0.14550018310546875, 0.155242919921875, 0.16498565673828125, 0.1747283935546875, 0.18447113037109375, 0.1942138671875, 0.20395660400390625, 0.2136993408203125, 0.22344207763671875, 0.233184814453125, 0.24292755126953125, 0.2526702880859375, 0.26241302490234375, 0.27215576171875, 0.28189849853515625, 0.2916412353515625, 0.30138397216796875, 0.311126708984375, 0.32086944580078125, 0.3306121826171875, 0.34035491943359375, 0.35009765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 1.0, 5.0, 14.0, 15.0, 28.0, 21.0, 25.0, 41.0, 44.0, 42.0, 63.0, 74.0, 72.0, 67.0, 70.0, 84.0, 55.0, 61.0, 46.0, 38.0, 26.0, 19.0, 24.0, 16.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.836090087890625, -0.80596923828125, -0.775848388671875, -0.7457275390625, -0.715606689453125, -0.68548583984375, -0.655364990234375, -0.625244140625, -0.595123291015625, -0.56500244140625, -0.534881591796875, -0.5047607421875, -0.474639892578125, -0.44451904296875, -0.414398193359375, -0.38427734375, -0.354156494140625, -0.32403564453125, -0.293914794921875, -0.2637939453125, -0.233673095703125, -0.20355224609375, -0.173431396484375, -0.143310546875, -0.113189697265625, -0.08306884765625, -0.052947998046875, -0.0228271484375, 0.007293701171875, 0.03741455078125, 0.067535400390625, 0.09765625, 0.127777099609375, 0.15789794921875, 0.188018798828125, 0.2181396484375, 0.248260498046875, 0.27838134765625, 0.308502197265625, 0.338623046875, 0.368743896484375, 0.39886474609375, 0.428985595703125, 0.4591064453125, 0.489227294921875, 0.51934814453125, 0.549468994140625, 0.57958984375, 0.609710693359375, 0.63983154296875, 0.669952392578125, 0.7000732421875, 0.730194091796875, 0.76031494140625, 0.790435791015625, 0.820556640625, 0.850677490234375, 0.88079833984375, 0.910919189453125, 0.9410400390625, 0.971160888671875, 1.00128173828125, 1.031402587890625, 1.0615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 16.0, 20.0, 18.0, 30.0, 36.0, 65.0, 105.0, 159.0, 249.0, 562.0, 2199.0, 17864.0, 678809.0, 334272.0, 11391.0, 1598.0, 513.0, 228.0, 123.0, 82.0, 68.0, 41.0, 30.0, 19.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.673828125, -0.6545257568359375, -0.635223388671875, -0.6159210205078125, -0.59661865234375, -0.5773162841796875, -0.558013916015625, -0.5387115478515625, -0.5194091796875, -0.5001068115234375, -0.480804443359375, -0.4615020751953125, -0.44219970703125, -0.4228973388671875, -0.403594970703125, -0.3842926025390625, -0.364990234375, -0.3456878662109375, -0.326385498046875, -0.3070831298828125, -0.28778076171875, -0.2684783935546875, -0.249176025390625, -0.2298736572265625, -0.2105712890625, -0.1912689208984375, -0.171966552734375, -0.1526641845703125, -0.13336181640625, -0.1140594482421875, -0.094757080078125, -0.0754547119140625, -0.05615234375, -0.0368499755859375, -0.017547607421875, 0.0017547607421875, 0.02105712890625, 0.0403594970703125, 0.059661865234375, 0.0789642333984375, 0.0982666015625, 0.1175689697265625, 0.136871337890625, 0.1561737060546875, 0.17547607421875, 0.1947784423828125, 0.214080810546875, 0.2333831787109375, 0.252685546875, 0.2719879150390625, 0.291290283203125, 0.3105926513671875, 0.32989501953125, 0.3491973876953125, 0.368499755859375, 0.3878021240234375, 0.4071044921875, 0.4264068603515625, 0.445709228515625, 0.4650115966796875, 0.48431396484375, 0.5036163330078125, 0.522918701171875, 0.5422210693359375, 0.5615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 8.0, 8.0, 12.0, 20.0, 19.0, 20.0, 26.0, 29.0, 26.0, 29.0, 44.0, 40.0, 48.0, 38.0, 33.0, 44.0, 40.0, 60.0, 48.0, 52.0, 54.0, 35.0, 47.0, 25.0, 23.0, 16.0, 24.0, 15.0, 14.0, 16.0, 14.0, 7.0, 10.0, 5.0, 6.0, 10.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67431640625, -0.6527099609375, -0.631103515625, -0.6094970703125, -0.587890625, -0.5662841796875, -0.544677734375, -0.5230712890625, -0.50146484375, -0.4798583984375, -0.458251953125, -0.4366455078125, -0.4150390625, -0.3934326171875, -0.371826171875, -0.3502197265625, -0.32861328125, -0.3070068359375, -0.285400390625, -0.2637939453125, -0.2421875, -0.2205810546875, -0.198974609375, -0.1773681640625, -0.15576171875, -0.1341552734375, -0.112548828125, -0.0909423828125, -0.0693359375, -0.0477294921875, -0.026123046875, -0.0045166015625, 0.01708984375, 0.0386962890625, 0.060302734375, 0.0819091796875, 0.103515625, 0.1251220703125, 0.146728515625, 0.1683349609375, 0.18994140625, 0.2115478515625, 0.233154296875, 0.2547607421875, 0.2763671875, 0.2979736328125, 0.319580078125, 0.3411865234375, 0.36279296875, 0.3843994140625, 0.406005859375, 0.4276123046875, 0.44921875, 0.4708251953125, 0.492431640625, 0.5140380859375, 0.53564453125, 0.5572509765625, 0.578857421875, 0.6004638671875, 0.6220703125, 0.6436767578125, 0.665283203125, 0.6868896484375, 0.70849609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 10.0, 10.0, 16.0, 15.0, 26.0, 37.0, 82.0, 125.0, 251.0, 756.0, 2417.0, 12286.0, 192757.0, 803654.0, 29661.0, 4487.0, 1175.0, 403.0, 158.0, 95.0, 35.0, 23.0, 21.0, 10.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.239501953125, -0.2318267822265625, -0.224151611328125, -0.2164764404296875, -0.20880126953125, -0.2011260986328125, -0.193450927734375, -0.1857757568359375, -0.1781005859375, -0.1704254150390625, -0.162750244140625, -0.1550750732421875, -0.14739990234375, -0.1397247314453125, -0.132049560546875, -0.1243743896484375, -0.11669921875, -0.1090240478515625, -0.101348876953125, -0.0936737060546875, -0.08599853515625, -0.0783233642578125, -0.070648193359375, -0.0629730224609375, -0.0552978515625, -0.0476226806640625, -0.039947509765625, -0.0322723388671875, -0.02459716796875, -0.0169219970703125, -0.009246826171875, -0.0015716552734375, 0.006103515625, 0.0137786865234375, 0.021453857421875, 0.0291290283203125, 0.03680419921875, 0.0444793701171875, 0.052154541015625, 0.0598297119140625, 0.0675048828125, 0.0751800537109375, 0.082855224609375, 0.0905303955078125, 0.09820556640625, 0.1058807373046875, 0.113555908203125, 0.1212310791015625, 0.12890625, 0.1365814208984375, 0.144256591796875, 0.1519317626953125, 0.15960693359375, 0.1672821044921875, 0.174957275390625, 0.1826324462890625, 0.1903076171875, 0.1979827880859375, 0.205657958984375, 0.2133331298828125, 0.22100830078125, 0.2286834716796875, 0.236358642578125, 0.2440338134765625, 0.251708984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 18.0, 14.0, 29.0, 25.0, 40.0, 67.0, 89.0, 129.0, 136.0, 120.0, 96.0, 55.0, 43.0, 27.0, 17.0, 20.0, 12.0, 8.0, 8.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1683983504772186e-05, -2.1016225218772888e-05, -2.034846693277359e-05, -1.9680708646774292e-05, -1.9012950360774994e-05, -1.8345192074775696e-05, -1.7677433788776398e-05, -1.70096755027771e-05, -1.63419172167778e-05, -1.5674158930778503e-05, -1.5006400644779205e-05, -1.4338642358779907e-05, -1.3670884072780609e-05, -1.3003125786781311e-05, -1.2335367500782013e-05, -1.1667609214782715e-05, -1.0999850928783417e-05, -1.0332092642784119e-05, -9.66433435678482e-06, -8.996576070785522e-06, -8.328817784786224e-06, -7.661059498786926e-06, -6.993301212787628e-06, -6.32554292678833e-06, -5.657784640789032e-06, -4.990026354789734e-06, -4.322268068790436e-06, -3.6545097827911377e-06, -2.9867514967918396e-06, -2.3189932107925415e-06, -1.6512349247932434e-06, -9.834766387939453e-07, -3.157183527946472e-07, 3.520399332046509e-07, 1.019798219203949e-06, 1.687556505203247e-06, 2.355314791202545e-06, 3.0230730772018433e-06, 3.6908313632011414e-06, 4.3585896492004395e-06, 5.0263479351997375e-06, 5.694106221199036e-06, 6.361864507198334e-06, 7.029622793197632e-06, 7.69738107919693e-06, 8.365139365196228e-06, 9.032897651195526e-06, 9.700655937194824e-06, 1.0368414223194122e-05, 1.103617250919342e-05, 1.1703930795192719e-05, 1.2371689081192017e-05, 1.3039447367191315e-05, 1.3707205653190613e-05, 1.4374963939189911e-05, 1.5042722225189209e-05, 1.5710480511188507e-05, 1.6378238797187805e-05, 1.7045997083187103e-05, 1.77137553691864e-05, 1.83815136551857e-05, 1.9049271941184998e-05, 1.9717030227184296e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 10.0, 5.0, 11.0, 17.0, 23.0, 32.0, 50.0, 48.0, 99.0, 144.0, 201.0, 336.0, 601.0, 1318.0, 3053.0, 9340.0, 50008.0, 719223.0, 230976.0, 23065.0, 5612.0, 2136.0, 944.0, 521.0, 262.0, 166.0, 108.0, 84.0, 54.0, 34.0, 29.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.2319011688232422, -0.22576522827148438, -0.21962928771972656, -0.21349334716796875, -0.20735740661621094, -0.20122146606445312, -0.1950855255126953, -0.1889495849609375, -0.1828136444091797, -0.17667770385742188, -0.17054176330566406, -0.16440582275390625, -0.15826988220214844, -0.15213394165039062, -0.1459980010986328, -0.139862060546875, -0.1337261199951172, -0.12759017944335938, -0.12145423889160156, -0.11531829833984375, -0.10918235778808594, -0.10304641723632812, -0.09691047668457031, -0.0907745361328125, -0.08463859558105469, -0.07850265502929688, -0.07236671447753906, -0.06623077392578125, -0.06009483337402344, -0.053958892822265625, -0.04782295227050781, -0.04168701171875, -0.03555107116699219, -0.029415130615234375, -0.023279190063476562, -0.01714324951171875, -0.011007308959960938, -0.004871368408203125, 0.0012645721435546875, 0.0074005126953125, 0.013536453247070312, 0.019672393798828125, 0.025808334350585938, 0.03194427490234375, 0.03808021545410156, 0.044216156005859375, 0.05035209655761719, 0.056488037109375, 0.06262397766113281, 0.06875991821289062, 0.07489585876464844, 0.08103179931640625, 0.08716773986816406, 0.09330368041992188, 0.09943962097167969, 0.1055755615234375, 0.11171150207519531, 0.11784744262695312, 0.12398338317871094, 0.13011932373046875, 0.13625526428222656, 0.14239120483398438, 0.1485271453857422, 0.1546630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 11.0, 11.0, 20.0, 23.0, 29.0, 39.0, 65.0, 118.0, 154.0, 142.0, 121.0, 78.0, 54.0, 37.0, 25.0, 18.0, 8.0, 7.0, 5.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05908203125, -0.05674266815185547, -0.05440330505371094, -0.052063941955566406, -0.049724578857421875, -0.047385215759277344, -0.04504585266113281, -0.04270648956298828, -0.04036712646484375, -0.03802776336669922, -0.03568840026855469, -0.033349037170410156, -0.031009674072265625, -0.028670310974121094, -0.026330947875976562, -0.02399158477783203, -0.0216522216796875, -0.01931285858154297, -0.016973495483398438, -0.014634132385253906, -0.012294769287109375, -0.009955406188964844, -0.0076160430908203125, -0.005276679992675781, -0.00293731689453125, -0.0005979537963867188, 0.0017414093017578125, 0.004080772399902344, 0.006420135498046875, 0.008759498596191406, 0.011098861694335938, 0.013438224792480469, 0.015777587890625, 0.01811695098876953, 0.020456314086914062, 0.022795677185058594, 0.025135040283203125, 0.027474403381347656, 0.029813766479492188, 0.03215312957763672, 0.03449249267578125, 0.03683185577392578, 0.03917121887207031, 0.041510581970214844, 0.043849945068359375, 0.046189308166503906, 0.04852867126464844, 0.05086803436279297, 0.0532073974609375, 0.05554676055908203, 0.05788612365722656, 0.060225486755371094, 0.06256484985351562, 0.06490421295166016, 0.06724357604980469, 0.06958293914794922, 0.07192230224609375, 0.07426166534423828, 0.07660102844238281, 0.07894039154052734, 0.08127975463867188, 0.0836191177368164, 0.08595848083496094, 0.08829784393310547, 0.09063720703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 14.0, 22.0, 66.0, 169.0, 350.0, 210.0, 88.0, 35.0, 16.0, 10.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1026254892349243, -1.0155296325683594, -0.9284337162971497, -0.8413378000259399, -0.754241943359375, -0.6671460866928101, -0.5800501704216003, -0.4929542541503906, -0.4058583974838257, -0.31876251101493835, -0.23166662454605103, -0.1445707380771637, -0.05747485160827637, 0.029621034860610962, 0.11671692132949829, 0.203812837600708, 0.29090869426727295, 0.3780045807361603, 0.4651004672050476, 0.5521963834762573, 0.6392922401428223, 0.7263880968093872, 0.8134840130805969, 0.9005799293518066, 0.9876757860183716, 1.0747716426849365, 1.161867618560791, 1.248963475227356, 1.336059331893921, 1.4231551885604858, 1.5102510452270508, 1.5973470211029053, 1.6844429969787598, 1.7715388536453247, 1.8586347103118896, 1.9457306861877441, 2.0328264236450195, 2.119922399520874, 2.2070183753967285, 2.294114112854004, 2.3812100887298584, 2.468306064605713, 2.5554018020629883, 2.6424977779388428, 2.7295937538146973, 2.8166894912719727, 2.903785467147827, 2.9908814430236816, 3.077977180480957, 3.1650731563568115, 3.252168893814087, 3.3392648696899414, 3.426360607147217, 3.5134565830230713, 3.600552558898926, 3.687648296356201, 3.7747442722320557, 3.86184024810791, 3.9489359855651855, 4.036031723022461, 4.1231279373168945, 4.21022367477417, 4.297319412231445, 4.384415626525879, 4.471511363983154]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 9.0, 17.0, 12.0, 30.0, 14.0, 25.0, 17.0, 31.0, 31.0, 17.0, 39.0, 33.0, 43.0, 47.0, 41.0, 35.0, 41.0, 46.0, 46.0, 34.0, 31.0, 39.0, 35.0, 32.0, 29.0, 32.0, 15.0, 21.0, 15.0, 14.0, 21.0, 24.0, 12.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.1144568920135498, -1.0803848505020142, -1.046312928199768, -1.0122408866882324, -0.9781688451766968, -0.9440968632698059, -0.910024881362915, -0.8759528398513794, -0.8418807983398438, -0.8078088164329529, -0.7737367749214172, -0.7396647930145264, -0.7055927515029907, -0.6715207695960999, -0.637448787689209, -0.6033767461776733, -0.5693047642707825, -0.5352327823638916, -0.501160740852356, -0.4670887589454651, -0.43301671743392944, -0.3989447355270386, -0.3648727238178253, -0.33080071210861206, -0.2967287003993988, -0.26265668869018555, -0.2285846769809723, -0.19451268017292023, -0.16044066846370697, -0.1263686567544937, -0.09229665994644165, -0.058224648237228394, -0.024152636528015137, 0.009919371455907822, 0.04399137943983078, 0.07806338369846344, 0.1121353954076767, 0.14620740711688995, 0.18027940392494202, 0.21435141563415527, 0.24842342734336853, 0.2824954390525818, 0.31656745076179504, 0.3506394624710083, 0.38471144437789917, 0.4187834858894348, 0.4528554677963257, 0.48692747950553894, 0.5209994912147522, 0.5550714731216431, 0.5891435146331787, 0.6232154965400696, 0.6572875380516052, 0.6913595199584961, 0.7254315614700317, 0.7595035433769226, 0.7935755252838135, 0.8276475071907043, 0.86171954870224, 0.8957915306091309, 0.9298635721206665, 0.9639355540275574, 0.9980075359344482, 1.0320795774459839, 1.0661516189575195]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 12.0, 11.0, 17.0, 12.0, 18.0, 11.0, 27.0, 35.0, 49.0, 73.0, 108.0, 130.0, 188.0, 302.0, 399.0, 669.0, 984.0, 1971.0, 3945.0, 11594.0, 161677.0, 3706916.0, 278504.0, 16602.0, 4627.0, 2113.0, 1197.0, 659.0, 458.0, 268.0, 206.0, 138.0, 113.0, 74.0, 40.0, 35.0, 36.0, 20.0, 16.0, 5.0, 1.0, 6.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.27734375, -1.239288330078125, -1.20123291015625, -1.163177490234375, -1.1251220703125, -1.087066650390625, -1.04901123046875, -1.010955810546875, -0.972900390625, -0.934844970703125, -0.89678955078125, -0.858734130859375, -0.8206787109375, -0.782623291015625, -0.74456787109375, -0.706512451171875, -0.66845703125, -0.630401611328125, -0.59234619140625, -0.554290771484375, -0.5162353515625, -0.478179931640625, -0.44012451171875, -0.402069091796875, -0.364013671875, -0.325958251953125, -0.28790283203125, -0.249847412109375, -0.2117919921875, -0.173736572265625, -0.13568115234375, -0.097625732421875, -0.0595703125, -0.021514892578125, 0.01654052734375, 0.054595947265625, 0.0926513671875, 0.130706787109375, 0.16876220703125, 0.206817626953125, 0.244873046875, 0.282928466796875, 0.32098388671875, 0.359039306640625, 0.3970947265625, 0.435150146484375, 0.47320556640625, 0.511260986328125, 0.54931640625, 0.587371826171875, 0.62542724609375, 0.663482666015625, 0.7015380859375, 0.739593505859375, 0.77764892578125, 0.815704345703125, 0.853759765625, 0.891815185546875, 0.92987060546875, 0.967926025390625, 1.0059814453125, 1.044036865234375, 1.08209228515625, 1.120147705078125, 1.158203125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 2.0, 8.0, 11.0, 14.0, 20.0, 28.0, 25.0, 27.0, 36.0, 36.0, 46.0, 48.0, 43.0, 57.0, 63.0, 78.0, 66.0, 57.0, 63.0, 54.0, 43.0, 31.0, 28.0, 24.0, 18.0, 17.0, 6.0, 10.0, 15.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5202560424804688, -0.5058441162109375, -0.49143218994140625, -0.477020263671875, -0.46260833740234375, -0.4481964111328125, -0.43378448486328125, -0.41937255859375, -0.40496063232421875, -0.3905487060546875, -0.37613677978515625, -0.361724853515625, -0.34731292724609375, -0.3329010009765625, -0.31848907470703125, -0.3040771484375, -0.28966522216796875, -0.2752532958984375, -0.26084136962890625, -0.246429443359375, -0.23201751708984375, -0.2176055908203125, -0.20319366455078125, -0.18878173828125, -0.17436981201171875, -0.1599578857421875, -0.14554595947265625, -0.131134033203125, -0.11672210693359375, -0.1023101806640625, -0.08789825439453125, -0.073486328125, -0.05907440185546875, -0.0446624755859375, -0.03025054931640625, -0.015838623046875, -0.00142669677734375, 0.0129852294921875, 0.02739715576171875, 0.04180908203125, 0.05622100830078125, 0.0706329345703125, 0.08504486083984375, 0.099456787109375, 0.11386871337890625, 0.1282806396484375, 0.14269256591796875, 0.1571044921875, 0.17151641845703125, 0.1859283447265625, 0.20034027099609375, 0.214752197265625, 0.22916412353515625, 0.2435760498046875, 0.25798797607421875, 0.27239990234375, 0.28681182861328125, 0.3012237548828125, 0.31563568115234375, 0.330047607421875, 0.34445953369140625, 0.3588714599609375, 0.37328338623046875, 0.3876953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 10.0, 29.0, 24.0, 50.0, 77.0, 132.0, 196.0, 361.0, 685.0, 1281.0, 3132.0, 9888.0, 58161.0, 3548501.0, 535264.0, 25930.0, 6062.0, 2179.0, 1043.0, 512.0, 308.0, 180.0, 105.0, 62.0, 34.0, 27.0, 17.0, 3.0, 9.0, 3.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1892471313476562, -1.1577911376953125, -1.1263351440429688, -1.094879150390625, -1.0634231567382812, -1.0319671630859375, -1.0005111694335938, -0.96905517578125, -0.9375991821289062, -0.9061431884765625, -0.8746871948242188, -0.843231201171875, -0.8117752075195312, -0.7803192138671875, -0.7488632202148438, -0.7174072265625, -0.6859512329101562, -0.6544952392578125, -0.6230392456054688, -0.591583251953125, -0.5601272583007812, -0.5286712646484375, -0.49721527099609375, -0.46575927734375, -0.43430328369140625, -0.4028472900390625, -0.37139129638671875, -0.339935302734375, -0.30847930908203125, -0.2770233154296875, -0.24556732177734375, -0.214111328125, -0.18265533447265625, -0.1511993408203125, -0.11974334716796875, -0.088287353515625, -0.05683135986328125, -0.0253753662109375, 0.00608062744140625, 0.03753662109375, 0.06899261474609375, 0.1004486083984375, 0.13190460205078125, 0.163360595703125, 0.19481658935546875, 0.2262725830078125, 0.25772857666015625, 0.2891845703125, 0.32064056396484375, 0.3520965576171875, 0.38355255126953125, 0.415008544921875, 0.44646453857421875, 0.4779205322265625, 0.5093765258789062, 0.54083251953125, 0.5722885131835938, 0.6037445068359375, 0.6352005004882812, 0.666656494140625, 0.6981124877929688, 0.7295684814453125, 0.7610244750976562, 0.79248046875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 29.0, 39.0, 52.0, 107.0, 253.0, 544.0, 1075.0, 999.0, 469.0, 206.0, 86.0, 46.0, 50.0, 18.0, 17.0, 9.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2783203125, -0.2698707580566406, -0.26142120361328125, -0.2529716491699219, -0.2445220947265625, -0.23607254028320312, -0.22762298583984375, -0.21917343139648438, -0.210723876953125, -0.20227432250976562, -0.19382476806640625, -0.18537521362304688, -0.1769256591796875, -0.16847610473632812, -0.16002655029296875, -0.15157699584960938, -0.14312744140625, -0.13467788696289062, -0.12622833251953125, -0.11777877807617188, -0.1093292236328125, -0.10087966918945312, -0.09243011474609375, -0.08398056030273438, -0.075531005859375, -0.06708145141601562, -0.05863189697265625, -0.050182342529296875, -0.0417327880859375, -0.033283233642578125, -0.02483367919921875, -0.016384124755859375, -0.0079345703125, 0.000514984130859375, 0.00896453857421875, 0.017414093017578125, 0.0258636474609375, 0.034313201904296875, 0.04276275634765625, 0.051212310791015625, 0.059661865234375, 0.06811141967773438, 0.07656097412109375, 0.08501052856445312, 0.0934600830078125, 0.10190963745117188, 0.11035919189453125, 0.11880874633789062, 0.12725830078125, 0.13570785522460938, 0.14415740966796875, 0.15260696411132812, 0.1610565185546875, 0.16950607299804688, 0.17795562744140625, 0.18640518188476562, 0.194854736328125, 0.20330429077148438, 0.21175384521484375, 0.22020339965820312, 0.2286529541015625, 0.23710250854492188, 0.24555206298828125, 0.2540016174316406, 0.262451171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 20.0, 14.0, 34.0, 43.0, 65.0, 85.0, 133.0, 149.0, 125.0, 86.0, 59.0, 56.0, 35.0, 23.0, 13.0, 7.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908448696136475, -1.0625654458999634, -1.0342860221862793, -1.0060065984725952, -0.9777271151542664, -0.9494476914405823, -0.9211682677268982, -0.8928887844085693, -0.8646093606948853, -0.8363299369812012, -0.8080505132675171, -0.7797710299491882, -0.7514916062355042, -0.7232121825218201, -0.694932758808136, -0.6666532754898071, -0.638373851776123, -0.610094428062439, -0.5818150043487549, -0.553535521030426, -0.5252560973167419, -0.49697667360305786, -0.4686972498893738, -0.4404177963733673, -0.4121384024620056, -0.38385897874832153, -0.35557952523231506, -0.327300101518631, -0.2990206480026245, -0.27074122428894043, -0.24246178567409515, -0.21418234705924988, -0.1859028935432434, -0.15762345492839813, -0.12934401631355286, -0.10106458514928818, -0.0727851465344429, -0.04450571537017822, -0.016226276755332947, 0.012053161859512329, 0.040332600474357605, 0.06861203908920288, 0.09689147770404816, 0.12517091631889343, 0.15345034003257751, 0.1817297786474228, 0.21000921726226807, 0.23828865587711334, 0.2665680944919586, 0.2948475182056427, 0.32312697172164917, 0.35140639543533325, 0.3796858489513397, 0.4079652726650238, 0.4362447261810303, 0.46452414989471436, 0.49280357360839844, 0.5210829973220825, 0.5493624210357666, 0.5776419043540955, 0.6059213280677795, 0.6342007517814636, 0.6624801754951477, 0.6907596588134766, 0.7190390825271606]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 8.0, 5.0, 6.0, 22.0, 21.0, 21.0, 27.0, 43.0, 28.0, 42.0, 35.0, 43.0, 51.0, 54.0, 55.0, 56.0, 52.0, 48.0, 38.0, 43.0, 46.0, 41.0, 27.0, 38.0, 20.0, 23.0, 17.0, 13.0, 15.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.510971188545227, -0.49620920419692993, -0.4814472198486328, -0.4666852355003357, -0.4519232511520386, -0.43716126680374146, -0.42239928245544434, -0.4076372981071472, -0.3928753137588501, -0.378113329410553, -0.36335134506225586, -0.34858936071395874, -0.3338273763656616, -0.3190653920173645, -0.3043034076690674, -0.28954142332077026, -0.27477943897247314, -0.260017454624176, -0.2452554702758789, -0.2304934859275818, -0.21573150157928467, -0.20096951723098755, -0.18620753288269043, -0.1714455485343933, -0.1566835641860962, -0.14192157983779907, -0.12715959548950195, -0.11239761114120483, -0.09763562679290771, -0.0828736424446106, -0.06811165809631348, -0.05334967374801636, -0.03858768939971924, -0.02382570505142212, -0.009063720703125, 0.005698263645172119, 0.02046024799346924, 0.03522223234176636, 0.04998421669006348, 0.0647462010383606, 0.07950818538665771, 0.09427016973495483, 0.10903215408325195, 0.12379413843154907, 0.1385561227798462, 0.1533181071281433, 0.16808009147644043, 0.18284207582473755, 0.19760406017303467, 0.2123660445213318, 0.2271280288696289, 0.24189001321792603, 0.25665199756622314, 0.27141398191452026, 0.2861759662628174, 0.3009379506111145, 0.3156999349594116, 0.33046191930770874, 0.34522390365600586, 0.359985888004303, 0.3747478723526001, 0.3895098567008972, 0.40427184104919434, 0.41903382539749146, 0.4337958097457886]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 19.0, 28.0, 43.0, 57.0, 88.0, 119.0, 193.0, 299.0, 498.0, 850.0, 1458.0, 2708.0, 5178.0, 10694.0, 24983.0, 65598.0, 200869.0, 425952.0, 197335.0, 64584.0, 24813.0, 10737.0, 4995.0, 2709.0, 1434.0, 796.0, 528.0, 317.0, 208.0, 130.0, 83.0, 60.0, 42.0, 26.0, 27.0, 12.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.09173583984375, -0.08899688720703125, -0.0862579345703125, -0.08351898193359375, -0.080780029296875, -0.07804107666015625, -0.0753021240234375, -0.07256317138671875, -0.06982421875, -0.06708526611328125, -0.0643463134765625, -0.06160736083984375, -0.058868408203125, -0.05612945556640625, -0.0533905029296875, -0.05065155029296875, -0.04791259765625, -0.04517364501953125, -0.0424346923828125, -0.03969573974609375, -0.036956787109375, -0.03421783447265625, -0.0314788818359375, -0.02873992919921875, -0.0260009765625, -0.02326202392578125, -0.0205230712890625, -0.01778411865234375, -0.015045166015625, -0.01230621337890625, -0.0095672607421875, -0.00682830810546875, -0.00408935546875, -0.00135040283203125, 0.0013885498046875, 0.00412750244140625, 0.006866455078125, 0.00960540771484375, 0.0123443603515625, 0.01508331298828125, 0.017822265625, 0.02056121826171875, 0.0233001708984375, 0.02603912353515625, 0.028778076171875, 0.03151702880859375, 0.0342559814453125, 0.03699493408203125, 0.03973388671875, 0.04247283935546875, 0.0452117919921875, 0.04795074462890625, 0.050689697265625, 0.05342864990234375, 0.0561676025390625, 0.05890655517578125, 0.0616455078125, 0.06438446044921875, 0.0671234130859375, 0.06986236572265625, 0.072601318359375, 0.07534027099609375, 0.0780792236328125, 0.08081817626953125, 0.08355712890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 4.0, 7.0, 4.0, 11.0, 9.0, 23.0, 18.0, 22.0, 31.0, 32.0, 36.0, 42.0, 46.0, 50.0, 59.0, 51.0, 62.0, 65.0, 71.0, 36.0, 45.0, 51.0, 33.0, 29.0, 28.0, 21.0, 25.0, 16.0, 13.0, 15.0, 10.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.32952880859375, -0.3184814453125, -0.30743408203125, -0.29638671875, -0.28533935546875, -0.2742919921875, -0.26324462890625, -0.252197265625, -0.24114990234375, -0.2301025390625, -0.21905517578125, -0.2080078125, -0.19696044921875, -0.1859130859375, -0.17486572265625, -0.163818359375, -0.15277099609375, -0.1417236328125, -0.13067626953125, -0.11962890625, -0.10858154296875, -0.0975341796875, -0.08648681640625, -0.075439453125, -0.06439208984375, -0.0533447265625, -0.04229736328125, -0.03125, -0.02020263671875, -0.0091552734375, 0.00189208984375, 0.012939453125, 0.02398681640625, 0.0350341796875, 0.04608154296875, 0.05712890625, 0.06817626953125, 0.0792236328125, 0.09027099609375, 0.101318359375, 0.11236572265625, 0.1234130859375, 0.13446044921875, 0.1455078125, 0.15655517578125, 0.1676025390625, 0.17864990234375, 0.189697265625, 0.20074462890625, 0.2117919921875, 0.22283935546875, 0.23388671875, 0.24493408203125, 0.2559814453125, 0.26702880859375, 0.278076171875, 0.28912353515625, 0.3001708984375, 0.31121826171875, 0.322265625, 0.33331298828125, 0.3443603515625, 0.35540771484375, 0.366455078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 22.0, 28.0, 45.0, 35.0, 70.0, 93.0, 123.0, 193.0, 284.0, 460.0, 697.0, 1096.0, 1924.0, 3184.0, 5631.0, 10427.0, 19500.0, 39308.0, 83136.0, 188957.0, 322460.0, 197202.0, 86987.0, 40860.0, 20457.0, 10717.0, 5939.0, 3355.0, 1942.0, 1211.0, 724.0, 485.0, 307.0, 197.0, 150.0, 99.0, 78.0, 52.0, 30.0, 14.0, 15.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.05401611328125, -0.052186012268066406, -0.05035591125488281, -0.04852581024169922, -0.046695709228515625, -0.04486560821533203, -0.04303550720214844, -0.041205406188964844, -0.03937530517578125, -0.037545204162597656, -0.03571510314941406, -0.03388500213623047, -0.032054901123046875, -0.03022480010986328, -0.028394699096679688, -0.026564598083496094, -0.0247344970703125, -0.022904396057128906, -0.021074295043945312, -0.01924419403076172, -0.017414093017578125, -0.015583992004394531, -0.013753890991210938, -0.011923789978027344, -0.01009368896484375, -0.008263587951660156, -0.0064334869384765625, -0.004603385925292969, -0.002773284912109375, -0.0009431838989257812, 0.0008869171142578125, 0.0027170181274414062, 0.004547119140625, 0.006377220153808594, 0.008207321166992188, 0.010037422180175781, 0.011867523193359375, 0.013697624206542969, 0.015527725219726562, 0.017357826232910156, 0.01918792724609375, 0.021018028259277344, 0.022848129272460938, 0.02467823028564453, 0.026508331298828125, 0.02833843231201172, 0.030168533325195312, 0.031998634338378906, 0.0338287353515625, 0.035658836364746094, 0.03748893737792969, 0.03931903839111328, 0.041149139404296875, 0.04297924041748047, 0.04480934143066406, 0.046639442443847656, 0.04846954345703125, 0.050299644470214844, 0.05212974548339844, 0.05395984649658203, 0.055789947509765625, 0.05762004852294922, 0.05945014953613281, 0.061280250549316406, 0.0631103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 14.0, 6.0, 9.0, 13.0, 16.0, 13.0, 18.0, 22.0, 19.0, 17.0, 28.0, 23.0, 34.0, 39.0, 32.0, 32.0, 44.0, 45.0, 48.0, 50.0, 54.0, 40.0, 47.0, 33.0, 32.0, 34.0, 21.0, 36.0, 21.0, 21.0, 22.0, 20.0, 22.0, 14.0, 10.0, 4.0, 9.0, 6.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.523040771484375, -0.50604248046875, -0.489044189453125, -0.4720458984375, -0.455047607421875, -0.43804931640625, -0.421051025390625, -0.404052734375, -0.387054443359375, -0.37005615234375, -0.353057861328125, -0.3360595703125, -0.319061279296875, -0.30206298828125, -0.285064697265625, -0.26806640625, -0.251068115234375, -0.23406982421875, -0.217071533203125, -0.2000732421875, -0.183074951171875, -0.16607666015625, -0.149078369140625, -0.132080078125, -0.115081787109375, -0.09808349609375, -0.081085205078125, -0.0640869140625, -0.047088623046875, -0.03009033203125, -0.013092041015625, 0.00390625, 0.020904541015625, 0.03790283203125, 0.054901123046875, 0.0718994140625, 0.088897705078125, 0.10589599609375, 0.122894287109375, 0.139892578125, 0.156890869140625, 0.17388916015625, 0.190887451171875, 0.2078857421875, 0.224884033203125, 0.24188232421875, 0.258880615234375, 0.27587890625, 0.292877197265625, 0.30987548828125, 0.326873779296875, 0.3438720703125, 0.360870361328125, 0.37786865234375, 0.394866943359375, 0.411865234375, 0.428863525390625, 0.44586181640625, 0.462860107421875, 0.4798583984375, 0.496856689453125, 0.51385498046875, 0.530853271484375, 0.5478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 17.0, 19.0, 25.0, 33.0, 65.0, 112.0, 202.0, 390.0, 721.0, 1561.0, 3669.0, 9399.0, 29132.0, 116315.0, 517442.0, 283745.0, 58674.0, 16482.0, 5946.0, 2287.0, 1077.0, 513.0, 281.0, 189.0, 76.0, 68.0, 33.0, 26.0, 14.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.048828125, -0.04760026931762695, -0.046372413635253906, -0.04514455795288086, -0.04391670227050781, -0.042688846588134766, -0.04146099090576172, -0.04023313522338867, -0.039005279541015625, -0.03777742385864258, -0.03654956817626953, -0.035321712493896484, -0.03409385681152344, -0.03286600112915039, -0.031638145446777344, -0.030410289764404297, -0.02918243408203125, -0.027954578399658203, -0.026726722717285156, -0.02549886703491211, -0.024271011352539062, -0.023043155670166016, -0.02181529998779297, -0.020587444305419922, -0.019359588623046875, -0.018131732940673828, -0.01690387725830078, -0.015676021575927734, -0.014448165893554688, -0.01322031021118164, -0.011992454528808594, -0.010764598846435547, -0.0095367431640625, -0.008308887481689453, -0.007081031799316406, -0.005853176116943359, -0.0046253204345703125, -0.0033974647521972656, -0.0021696090698242188, -0.0009417533874511719, 0.000286102294921875, 0.0015139579772949219, 0.0027418136596679688, 0.003969669342041016, 0.0051975250244140625, 0.006425380706787109, 0.007653236389160156, 0.008881092071533203, 0.01010894775390625, 0.011336803436279297, 0.012564659118652344, 0.01379251480102539, 0.015020370483398438, 0.016248226165771484, 0.01747608184814453, 0.018703937530517578, 0.019931793212890625, 0.021159648895263672, 0.02238750457763672, 0.023615360260009766, 0.024843215942382812, 0.02607107162475586, 0.027298927307128906, 0.028526782989501953, 0.029754638671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 8.0, 10.0, 16.0, 24.0, 40.0, 62.0, 98.0, 107.0, 136.0, 146.0, 111.0, 64.0, 44.0, 33.0, 32.0, 9.0, 12.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.07764858007431e-05, -2.9962509870529175e-05, -2.9148533940315247e-05, -2.833455801010132e-05, -2.752058207988739e-05, -2.6706606149673462e-05, -2.5892630219459534e-05, -2.5078654289245605e-05, -2.4264678359031677e-05, -2.345070242881775e-05, -2.263672649860382e-05, -2.1822750568389893e-05, -2.1008774638175964e-05, -2.0194798707962036e-05, -1.9380822777748108e-05, -1.856684684753418e-05, -1.775287091732025e-05, -1.6938894987106323e-05, -1.6124919056892395e-05, -1.5310943126678467e-05, -1.4496967196464539e-05, -1.368299126625061e-05, -1.2869015336036682e-05, -1.2055039405822754e-05, -1.1241063475608826e-05, -1.0427087545394897e-05, -9.61311161518097e-06, -8.799135684967041e-06, -7.985159754753113e-06, -7.1711838245391846e-06, -6.357207894325256e-06, -5.543231964111328e-06, -4.7292560338974e-06, -3.915280103683472e-06, -3.1013041734695435e-06, -2.2873282432556152e-06, -1.473352313041687e-06, -6.593763828277588e-07, 1.5459954738616943e-07, 9.685754776000977e-07, 1.7825514078140259e-06, 2.596527338027954e-06, 3.4105032682418823e-06, 4.2244791984558105e-06, 5.038455128669739e-06, 5.852431058883667e-06, 6.666406989097595e-06, 7.4803829193115234e-06, 8.294358849525452e-06, 9.10833477973938e-06, 9.922310709953308e-06, 1.0736286640167236e-05, 1.1550262570381165e-05, 1.2364238500595093e-05, 1.3178214430809021e-05, 1.399219036102295e-05, 1.4806166291236877e-05, 1.5620142221450806e-05, 1.6434118151664734e-05, 1.7248094081878662e-05, 1.806207001209259e-05, 1.887604594230652e-05, 1.9690021872520447e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 6.0, 13.0, 24.0, 28.0, 31.0, 59.0, 88.0, 143.0, 229.0, 377.0, 568.0, 983.0, 1588.0, 2869.0, 5558.0, 11076.0, 23334.0, 53624.0, 136157.0, 323894.0, 287083.0, 114624.0, 45520.0, 20048.0, 9336.0, 4809.0, 2685.0, 1522.0, 845.0, 539.0, 322.0, 208.0, 124.0, 90.0, 56.0, 33.0, 23.0, 15.0, 11.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244140625, -0.02369403839111328, -0.022974014282226562, -0.022253990173339844, -0.021533966064453125, -0.020813941955566406, -0.020093917846679688, -0.01937389373779297, -0.01865386962890625, -0.01793384552001953, -0.017213821411132812, -0.016493797302246094, -0.015773773193359375, -0.015053749084472656, -0.014333724975585938, -0.013613700866699219, -0.0128936767578125, -0.012173652648925781, -0.011453628540039062, -0.010733604431152344, -0.010013580322265625, -0.009293556213378906, -0.008573532104492188, -0.007853507995605469, -0.00713348388671875, -0.006413459777832031, -0.0056934356689453125, -0.004973411560058594, -0.004253387451171875, -0.0035333633422851562, -0.0028133392333984375, -0.0020933151245117188, -0.001373291015625, -0.0006532669067382812, 6.67572021484375e-05, 0.0007867813110351562, 0.001506805419921875, 0.0022268295288085938, 0.0029468536376953125, 0.0036668777465820312, 0.00438690185546875, 0.005106925964355469, 0.0058269500732421875, 0.006546974182128906, 0.007266998291015625, 0.007987022399902344, 0.008707046508789062, 0.009427070617675781, 0.0101470947265625, 0.010867118835449219, 0.011587142944335938, 0.012307167053222656, 0.013027191162109375, 0.013747215270996094, 0.014467239379882812, 0.015187263488769531, 0.01590728759765625, 0.01662731170654297, 0.017347335815429688, 0.018067359924316406, 0.018787384033203125, 0.019507408142089844, 0.020227432250976562, 0.02094745635986328, 0.02166748046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 3.0, 13.0, 14.0, 15.0, 10.0, 15.0, 22.0, 34.0, 28.0, 37.0, 42.0, 46.0, 47.0, 54.0, 60.0, 67.0, 64.0, 44.0, 48.0, 57.0, 48.0, 31.0, 36.0, 27.0, 24.0, 16.0, 14.0, 18.0, 11.0, 13.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0079498291015625, -0.007714807987213135, -0.0074797868728637695, -0.007244765758514404, -0.007009744644165039, -0.006774723529815674, -0.006539702415466309, -0.006304681301116943, -0.006069660186767578, -0.005834639072418213, -0.005599617958068848, -0.005364596843719482, -0.005129575729370117, -0.004894554615020752, -0.004659533500671387, -0.0044245123863220215, -0.004189491271972656, -0.003954470157623291, -0.0037194490432739258, -0.0034844279289245605, -0.0032494068145751953, -0.00301438570022583, -0.002779364585876465, -0.0025443434715270996, -0.0023093223571777344, -0.002074301242828369, -0.001839280128479004, -0.0016042590141296387, -0.0013692378997802734, -0.0011342167854309082, -0.000899195671081543, -0.0006641745567321777, -0.0004291534423828125, -0.00019413232803344727, 4.088878631591797e-05, 0.0002759099006652832, 0.0005109310150146484, 0.0007459521293640137, 0.000980973243713379, 0.0012159943580627441, 0.0014510154724121094, 0.0016860365867614746, 0.0019210577011108398, 0.002156078815460205, 0.0023910999298095703, 0.0026261210441589355, 0.0028611421585083008, 0.003096163272857666, 0.0033311843872070312, 0.0035662055015563965, 0.0038012266159057617, 0.004036247730255127, 0.004271268844604492, 0.004506289958953857, 0.004741311073303223, 0.004976332187652588, 0.005211353302001953, 0.005446374416351318, 0.005681395530700684, 0.005916416645050049, 0.006151437759399414, 0.006386458873748779, 0.0066214799880981445, 0.00685650110244751, 0.007091522216796875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 4.0, 4.0, 4.0, 12.0, 24.0, 38.0, 89.0, 145.0, 236.0, 191.0, 105.0, 63.0, 41.0, 19.0, 11.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2030118703842163, -1.174246072769165, -1.1454803943634033, -1.1167147159576416, -1.0879489183425903, -1.059183120727539, -1.0304174423217773, -1.0016517639160156, -0.9728859663009644, -0.9441202282905579, -0.9153544902801514, -0.8865887522697449, -0.8578230142593384, -0.8290572762489319, -0.8002915382385254, -0.7715258002281189, -0.7427600622177124, -0.7139943242073059, -0.6852285861968994, -0.6564628481864929, -0.6276971101760864, -0.5989313721656799, -0.5701656341552734, -0.5413998961448669, -0.5126341581344604, -0.48386842012405396, -0.45510268211364746, -0.42633694410324097, -0.3975712060928345, -0.368805468082428, -0.3400397300720215, -0.311273992061615, -0.2825081944465637, -0.2537424564361572, -0.22497671842575073, -0.19621098041534424, -0.16744524240493774, -0.13867950439453125, -0.10991376638412476, -0.08114802837371826, -0.05238229036331177, -0.023616552352905273, 0.005149185657501221, 0.033914923667907715, 0.06268066167831421, 0.0914463996887207, 0.1202121376991272, 0.1489778757095337, 0.17774361371994019, 0.20650935173034668, 0.23527508974075317, 0.26404082775115967, 0.29280656576156616, 0.32157230377197266, 0.35033804178237915, 0.37910377979278564, 0.40786951780319214, 0.43663525581359863, 0.4654009938240051, 0.4941667318344116, 0.5229324698448181, 0.5516982078552246, 0.5804639458656311, 0.6092296838760376, 0.6379954218864441]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 20.0, 17.0, 29.0, 30.0, 28.0, 41.0, 35.0, 42.0, 48.0, 53.0, 52.0, 62.0, 68.0, 37.0, 55.0, 43.0, 43.0, 50.0, 25.0, 37.0, 29.0, 23.0, 16.0, 15.0, 10.0, 6.0, 10.0, 12.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3230491578578949, -0.31289345026016235, -0.3027377128601074, -0.2925819754600525, -0.28242626786231995, -0.2722705602645874, -0.26211482286453247, -0.25195908546447754, -0.241803377866745, -0.23164765536785126, -0.22149193286895752, -0.21133621037006378, -0.20118048787117004, -0.1910247653722763, -0.18086904287338257, -0.17071332037448883, -0.1605575978755951, -0.15040187537670135, -0.14024615287780762, -0.13009043037891388, -0.11993470788002014, -0.1097789853811264, -0.09962326288223267, -0.08946754038333893, -0.07931181788444519, -0.06915609538555145, -0.059000372886657715, -0.04884465038776398, -0.03868892788887024, -0.0285332053899765, -0.018377482891082764, -0.008221760392189026, 0.0019339919090270996, 0.012089714407920837, 0.022245436906814575, 0.03240115940570831, 0.04255688190460205, 0.05271260440349579, 0.06286832690238953, 0.07302404940128326, 0.083179771900177, 0.09333549439907074, 0.10349121689796448, 0.11364693939685822, 0.12380266189575195, 0.1339583843946457, 0.14411410689353943, 0.15426982939243317, 0.1644255518913269, 0.17458127439022064, 0.18473699688911438, 0.19489271938800812, 0.20504844188690186, 0.2152041643857956, 0.22535988688468933, 0.23551560938358307, 0.2456713318824768, 0.25582706928253174, 0.2659827768802643, 0.2761384844779968, 0.28629422187805176, 0.2964499592781067, 0.30660566687583923, 0.3167613744735718, 0.3269171118736267]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 12.0, 17.0, 18.0, 27.0, 42.0, 52.0, 65.0, 101.0, 143.0, 228.0, 412.0, 591.0, 947.0, 1690.0, 3206.0, 6810.0, 20802.0, 166446.0, 761878.0, 61500.0, 12616.0, 4857.0, 2511.0, 1321.0, 789.0, 480.0, 301.0, 210.0, 134.0, 92.0, 76.0, 45.0, 29.0, 16.0, 19.0, 18.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.358154296875, -0.3467140197753906, -0.33527374267578125, -0.3238334655761719, -0.3123931884765625, -0.3009529113769531, -0.28951263427734375, -0.2780723571777344, -0.266632080078125, -0.2551918029785156, -0.24375152587890625, -0.23231124877929688, -0.2208709716796875, -0.20943069458007812, -0.19799041748046875, -0.18655014038085938, -0.17510986328125, -0.16366958618164062, -0.15222930908203125, -0.14078903198242188, -0.1293487548828125, -0.11790847778320312, -0.10646820068359375, -0.09502792358398438, -0.083587646484375, -0.07214736938476562, -0.06070709228515625, -0.049266815185546875, -0.0378265380859375, -0.026386260986328125, -0.01494598388671875, -0.003505706787109375, 0.0079345703125, 0.019374847412109375, 0.03081512451171875, 0.042255401611328125, 0.0536956787109375, 0.06513595581054688, 0.07657623291015625, 0.08801651000976562, 0.099456787109375, 0.11089706420898438, 0.12233734130859375, 0.13377761840820312, 0.1452178955078125, 0.15665817260742188, 0.16809844970703125, 0.17953872680664062, 0.19097900390625, 0.20241928100585938, 0.21385955810546875, 0.22529983520507812, 0.2367401123046875, 0.24818038940429688, 0.25962066650390625, 0.2710609436035156, 0.282501220703125, 0.2939414978027344, 0.30538177490234375, 0.3168220520019531, 0.3282623291015625, 0.3397026062011719, 0.35114288330078125, 0.3625831604003906, 0.3740234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 9.0, 8.0, 11.0, 12.0, 22.0, 33.0, 36.0, 32.0, 44.0, 64.0, 47.0, 56.0, 51.0, 76.0, 68.0, 58.0, 59.0, 49.0, 54.0, 38.0, 36.0, 28.0, 18.0, 21.0, 12.0, 9.0, 13.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.7150039672851562, -0.6917266845703125, -0.6684494018554688, -0.645172119140625, -0.6218948364257812, -0.5986175537109375, -0.5753402709960938, -0.55206298828125, -0.5287857055664062, -0.5055084228515625, -0.48223114013671875, -0.458953857421875, -0.43567657470703125, -0.4123992919921875, -0.38912200927734375, -0.3658447265625, -0.34256744384765625, -0.3192901611328125, -0.29601287841796875, -0.272735595703125, -0.24945831298828125, -0.2261810302734375, -0.20290374755859375, -0.17962646484375, -0.15634918212890625, -0.1330718994140625, -0.10979461669921875, -0.086517333984375, -0.06324005126953125, -0.0399627685546875, -0.01668548583984375, 0.006591796875, 0.02986907958984375, 0.0531463623046875, 0.07642364501953125, 0.099700927734375, 0.12297821044921875, 0.1462554931640625, 0.16953277587890625, 0.19281005859375, 0.21608734130859375, 0.2393646240234375, 0.26264190673828125, 0.285919189453125, 0.30919647216796875, 0.3324737548828125, 0.35575103759765625, 0.3790283203125, 0.40230560302734375, 0.4255828857421875, 0.44886016845703125, 0.472137451171875, 0.49541473388671875, 0.5186920166015625, 0.5419692993164062, 0.56524658203125, 0.5885238647460938, 0.6118011474609375, 0.6350784301757812, 0.658355712890625, 0.6816329956054688, 0.7049102783203125, 0.7281875610351562, 0.75146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 9.0, 7.0, 8.0, 21.0, 28.0, 55.0, 115.0, 266.0, 812.0, 3481.0, 67036.0, 965316.0, 9074.0, 1501.0, 478.0, 178.0, 86.0, 36.0, 22.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0540008544921875, -1.019134521484375, -0.9842681884765625, -0.94940185546875, -0.9145355224609375, -0.879669189453125, -0.8448028564453125, -0.8099365234375, -0.7750701904296875, -0.740203857421875, -0.7053375244140625, -0.67047119140625, -0.6356048583984375, -0.600738525390625, -0.5658721923828125, -0.531005859375, -0.4961395263671875, -0.461273193359375, -0.4264068603515625, -0.39154052734375, -0.3566741943359375, -0.321807861328125, -0.2869415283203125, -0.2520751953125, -0.2172088623046875, -0.182342529296875, -0.1474761962890625, -0.11260986328125, -0.0777435302734375, -0.042877197265625, -0.0080108642578125, 0.02685546875, 0.0617218017578125, 0.096588134765625, 0.1314544677734375, 0.16632080078125, 0.2011871337890625, 0.236053466796875, 0.2709197998046875, 0.3057861328125, 0.3406524658203125, 0.375518798828125, 0.4103851318359375, 0.44525146484375, 0.4801177978515625, 0.514984130859375, 0.5498504638671875, 0.584716796875, 0.6195831298828125, 0.654449462890625, 0.6893157958984375, 0.72418212890625, 0.7590484619140625, 0.793914794921875, 0.8287811279296875, 0.8636474609375, 0.8985137939453125, 0.933380126953125, 0.9682464599609375, 1.00311279296875, 1.0379791259765625, 1.072845458984375, 1.1077117919921875, 1.142578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 8.0, 8.0, 12.0, 15.0, 19.0, 24.0, 15.0, 27.0, 28.0, 32.0, 33.0, 31.0, 39.0, 34.0, 29.0, 55.0, 42.0, 50.0, 38.0, 44.0, 48.0, 37.0, 43.0, 35.0, 30.0, 13.0, 36.0, 19.0, 20.0, 24.0, 18.0, 8.0, 9.0, 6.0, 5.0, 8.0, 7.0, 4.0, 3.0, 9.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5345077514648438, -0.5157928466796875, -0.49707794189453125, -0.478363037109375, -0.45964813232421875, -0.4409332275390625, -0.42221832275390625, -0.40350341796875, -0.38478851318359375, -0.3660736083984375, -0.34735870361328125, -0.328643798828125, -0.30992889404296875, -0.2912139892578125, -0.27249908447265625, -0.2537841796875, -0.23506927490234375, -0.2163543701171875, -0.19763946533203125, -0.178924560546875, -0.16020965576171875, -0.1414947509765625, -0.12277984619140625, -0.10406494140625, -0.08535003662109375, -0.0666351318359375, -0.04792022705078125, -0.029205322265625, -0.01049041748046875, 0.0082244873046875, 0.02693939208984375, 0.045654296875, 0.06436920166015625, 0.0830841064453125, 0.10179901123046875, 0.120513916015625, 0.13922882080078125, 0.1579437255859375, 0.17665863037109375, 0.19537353515625, 0.21408843994140625, 0.2328033447265625, 0.25151824951171875, 0.270233154296875, 0.28894805908203125, 0.3076629638671875, 0.32637786865234375, 0.3450927734375, 0.36380767822265625, 0.3825225830078125, 0.40123748779296875, 0.419952392578125, 0.43866729736328125, 0.4573822021484375, 0.47609710693359375, 0.49481201171875, 0.5135269165039062, 0.5322418212890625, 0.5509567260742188, 0.569671630859375, 0.5883865356445312, 0.6071014404296875, 0.6258163452148438, 0.64453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 24.0, 34.0, 83.0, 230.0, 674.0, 3352.0, 118792.0, 914863.0, 8783.0, 1133.0, 331.0, 124.0, 48.0, 30.0, 17.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24860382080078125, -0.2403717041015625, -0.23213958740234375, -0.223907470703125, -0.21567535400390625, -0.2074432373046875, -0.19921112060546875, -0.19097900390625, -0.18274688720703125, -0.1745147705078125, -0.16628265380859375, -0.158050537109375, -0.14981842041015625, -0.1415863037109375, -0.13335418701171875, -0.1251220703125, -0.11688995361328125, -0.1086578369140625, -0.10042572021484375, -0.092193603515625, -0.08396148681640625, -0.0757293701171875, -0.06749725341796875, -0.05926513671875, -0.05103302001953125, -0.0428009033203125, -0.03456878662109375, -0.026336669921875, -0.01810455322265625, -0.0098724365234375, -0.00164031982421875, 0.006591796875, 0.01482391357421875, 0.0230560302734375, 0.03128814697265625, 0.039520263671875, 0.04775238037109375, 0.0559844970703125, 0.06421661376953125, 0.07244873046875, 0.08068084716796875, 0.0889129638671875, 0.09714508056640625, 0.105377197265625, 0.11360931396484375, 0.1218414306640625, 0.13007354736328125, 0.1383056640625, 0.14653778076171875, 0.1547698974609375, 0.16300201416015625, 0.171234130859375, 0.17946624755859375, 0.1876983642578125, 0.19593048095703125, 0.20416259765625, 0.21239471435546875, 0.2206268310546875, 0.22885894775390625, 0.237091064453125, 0.24532318115234375, 0.2535552978515625, 0.26178741455078125, 0.27001953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 4.0, 2.0, 9.0, 16.0, 34.0, 31.0, 95.0, 178.0, 266.0, 163.0, 75.0, 55.0, 31.0, 13.0, 11.0, 10.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8505921363830566e-05, -2.7745962142944336e-05, -2.6986002922058105e-05, -2.6226043701171875e-05, -2.5466084480285645e-05, -2.4706125259399414e-05, -2.3946166038513184e-05, -2.3186206817626953e-05, -2.2426247596740723e-05, -2.1666288375854492e-05, -2.0906329154968262e-05, -2.014636993408203e-05, -1.93864107131958e-05, -1.862645149230957e-05, -1.786649227142334e-05, -1.710653305053711e-05, -1.634657382965088e-05, -1.558661460876465e-05, -1.4826655387878418e-05, -1.4066696166992188e-05, -1.3306736946105957e-05, -1.2546777725219727e-05, -1.1786818504333496e-05, -1.1026859283447266e-05, -1.0266900062561035e-05, -9.506940841674805e-06, -8.746981620788574e-06, -7.987022399902344e-06, -7.227063179016113e-06, -6.467103958129883e-06, -5.707144737243652e-06, -4.947185516357422e-06, -4.187226295471191e-06, -3.427267074584961e-06, -2.6673078536987305e-06, -1.9073486328125e-06, -1.1473894119262695e-06, -3.8743019104003906e-07, 3.725290298461914e-07, 1.1324882507324219e-06, 1.8924474716186523e-06, 2.652406692504883e-06, 3.4123659133911133e-06, 4.172325134277344e-06, 4.932284355163574e-06, 5.692243576049805e-06, 6.452202796936035e-06, 7.212162017822266e-06, 7.972121238708496e-06, 8.732080459594727e-06, 9.492039680480957e-06, 1.0251998901367188e-05, 1.1011958122253418e-05, 1.1771917343139648e-05, 1.2531876564025879e-05, 1.329183578491211e-05, 1.405179500579834e-05, 1.481175422668457e-05, 1.55717134475708e-05, 1.633167266845703e-05, 1.7091631889343262e-05, 1.7851591110229492e-05, 1.8611550331115723e-05, 1.9371509552001953e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 8.0, 11.0, 25.0, 38.0, 61.0, 129.0, 209.0, 443.0, 969.0, 2794.0, 12670.0, 356866.0, 653338.0, 15736.0, 3187.0, 1107.0, 429.0, 219.0, 127.0, 81.0, 45.0, 19.0, 19.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376708984375, -0.2317371368408203, -0.22580337524414062, -0.21986961364746094, -0.21393585205078125, -0.20800209045410156, -0.20206832885742188, -0.1961345672607422, -0.1902008056640625, -0.1842670440673828, -0.17833328247070312, -0.17239952087402344, -0.16646575927734375, -0.16053199768066406, -0.15459823608398438, -0.1486644744873047, -0.142730712890625, -0.1367969512939453, -0.13086318969726562, -0.12492942810058594, -0.11899566650390625, -0.11306190490722656, -0.10712814331054688, -0.10119438171386719, -0.0952606201171875, -0.08932685852050781, -0.08339309692382812, -0.07745933532714844, -0.07152557373046875, -0.06559181213378906, -0.059658050537109375, -0.05372428894042969, -0.04779052734375, -0.04185676574707031, -0.035923004150390625, -0.029989242553710938, -0.02405548095703125, -0.018121719360351562, -0.012187957763671875, -0.0062541961669921875, -0.0003204345703125, 0.0056133270263671875, 0.011547088623046875, 0.017480850219726562, 0.02341461181640625, 0.029348373413085938, 0.035282135009765625, 0.04121589660644531, 0.047149658203125, 0.05308341979980469, 0.059017181396484375, 0.06495094299316406, 0.07088470458984375, 0.07681846618652344, 0.08275222778320312, 0.08868598937988281, 0.0946197509765625, 0.10055351257324219, 0.10648727416992188, 0.11242103576660156, 0.11835479736328125, 0.12428855895996094, 0.13022232055664062, 0.1361560821533203, 0.14208984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 4.0, 9.0, 4.0, 7.0, 21.0, 27.0, 24.0, 38.0, 45.0, 69.0, 76.0, 149.0, 160.0, 91.0, 74.0, 55.0, 42.0, 26.0, 13.0, 15.0, 9.0, 8.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02728271484375, -0.0260467529296875, -0.024810791015625, -0.0235748291015625, -0.0223388671875, -0.0211029052734375, -0.019866943359375, -0.0186309814453125, -0.01739501953125, -0.0161590576171875, -0.014923095703125, -0.0136871337890625, -0.012451171875, -0.0112152099609375, -0.009979248046875, -0.0087432861328125, -0.00750732421875, -0.0062713623046875, -0.005035400390625, -0.0037994384765625, -0.0025634765625, -0.0013275146484375, -9.1552734375e-05, 0.0011444091796875, 0.00238037109375, 0.0036163330078125, 0.004852294921875, 0.0060882568359375, 0.00732421875, 0.0085601806640625, 0.009796142578125, 0.0110321044921875, 0.01226806640625, 0.0135040283203125, 0.014739990234375, 0.0159759521484375, 0.0172119140625, 0.0184478759765625, 0.019683837890625, 0.0209197998046875, 0.02215576171875, 0.0233917236328125, 0.024627685546875, 0.0258636474609375, 0.027099609375, 0.0283355712890625, 0.029571533203125, 0.0308074951171875, 0.03204345703125, 0.0332794189453125, 0.034515380859375, 0.0357513427734375, 0.0369873046875, 0.0382232666015625, 0.039459228515625, 0.0406951904296875, 0.04193115234375, 0.0431671142578125, 0.044403076171875, 0.0456390380859375, 0.046875, 0.0481109619140625, 0.049346923828125, 0.0505828857421875, 0.05181884765625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 1.0, 7.0, 15.0, 13.0, 37.0, 83.0, 137.0, 203.0, 207.0, 113.0, 72.0, 50.0, 23.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4265085458755493, -1.3737664222717285, -1.3210242986679077, -1.268282175064087, -1.2155400514602661, -1.1627979278564453, -1.110055685043335, -1.0573135614395142, -1.0045714378356934, -0.9518293142318726, -0.8990871906280518, -0.846345067024231, -0.7936028838157654, -0.7408607602119446, -0.6881186366081238, -0.6353764533996582, -0.5826343894004822, -0.5298922657966614, -0.4771501123905182, -0.4244079887866974, -0.3716658353805542, -0.3189237117767334, -0.2661815881729126, -0.2134394347667694, -0.1606973111629486, -0.10795517265796661, -0.055213041603565216, -0.0024709105491638184, 0.050271227955818176, 0.10301336646080017, 0.15575549006462097, 0.20849764347076416, 0.26123976707458496, 0.31398189067840576, 0.36672404408454895, 0.41946616768836975, 0.47220832109451294, 0.5249504446983337, 0.5776925683021545, 0.6304347515106201, 0.6831768751144409, 0.7359189987182617, 0.7886611223220825, 0.8414032459259033, 0.8941454291343689, 0.9468875527381897, 0.9996296763420105, 1.052371859550476, 1.1051139831542969, 1.1578561067581177, 1.2105982303619385, 1.2633403539657593, 1.31608247756958, 1.3688247203826904, 1.4215667247772217, 1.474308967590332, 1.5270509719848633, 1.579793095588684, 1.6325352191925049, 1.6852773427963257, 1.7380194664001465, 1.7907617092132568, 1.843503713607788, 1.8962459564208984, 1.9489880800247192]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 13.0, 3.0, 9.0, 11.0, 11.0, 9.0, 16.0, 10.0, 14.0, 16.0, 11.0, 28.0, 21.0, 22.0, 28.0, 22.0, 25.0, 32.0, 45.0, 29.0, 35.0, 34.0, 37.0, 31.0, 41.0, 40.0, 35.0, 28.0, 31.0, 32.0, 24.0, 29.0, 40.0, 30.0, 16.0, 20.0, 11.0, 18.0, 12.0, 14.0, 7.0, 16.0, 19.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8438077569007874, -0.815995991230011, -0.7881841659545898, -0.7603724002838135, -0.7325605750083923, -0.704748809337616, -0.6769369840621948, -0.6491252183914185, -0.6213134527206421, -0.5935016870498657, -0.5656898617744446, -0.5378780961036682, -0.5100662708282471, -0.4822545051574707, -0.45444270968437195, -0.4266309142112732, -0.39881908893585205, -0.3710072934627533, -0.34319549798965454, -0.3153837323188782, -0.28757190704345703, -0.25976014137268066, -0.2319483458995819, -0.20413655042648315, -0.1763247549533844, -0.14851295948028564, -0.12070117145776749, -0.09288938343524933, -0.06507758796215057, -0.03726579248905182, -0.009454011917114258, 0.018357783555984497, 0.04616951942443848, 0.07398131489753723, 0.10179310292005539, 0.12960489094257355, 0.1574166864156723, 0.18522848188877106, 0.21304026246070862, 0.24085205793380737, 0.26866385340690613, 0.2964756488800049, 0.32428744435310364, 0.3520992398262024, 0.37991100549697876, 0.4077228307723999, 0.43553459644317627, 0.463346391916275, 0.4911581873893738, 0.5189699530601501, 0.5467817783355713, 0.5745935440063477, 0.6024053692817688, 0.6302171349525452, 0.6580289602279663, 0.6858407258987427, 0.713652491569519, 0.7414642572402954, 0.7692760825157166, 0.7970878481864929, 0.8248996734619141, 0.8527114391326904, 0.8805232048034668, 0.9083350300788879, 0.9361468553543091]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 16.0, 11.0, 16.0, 22.0, 19.0, 29.0, 35.0, 36.0, 46.0, 67.0, 126.0, 153.0, 243.0, 422.0, 650.0, 1095.0, 2235.0, 5718.0, 31711.0, 1835508.0, 2266340.0, 38438.0, 5955.0, 2293.0, 1201.0, 664.0, 397.0, 214.0, 184.0, 107.0, 82.0, 48.0, 53.0, 30.0, 28.0, 16.0, 20.0, 12.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9358444213867188, -0.9024505615234375, -0.8690567016601562, -0.835662841796875, -0.8022689819335938, -0.7688751220703125, -0.7354812622070312, -0.70208740234375, -0.6686935424804688, -0.6352996826171875, -0.6019058227539062, -0.568511962890625, -0.5351181030273438, -0.5017242431640625, -0.46833038330078125, -0.4349365234375, -0.40154266357421875, -0.3681488037109375, -0.33475494384765625, -0.301361083984375, -0.26796722412109375, -0.2345733642578125, -0.20117950439453125, -0.16778564453125, -0.13439178466796875, -0.1009979248046875, -0.06760406494140625, -0.034210205078125, -0.00081634521484375, 0.0325775146484375, 0.06597137451171875, 0.099365234375, 0.13275909423828125, 0.1661529541015625, 0.19954681396484375, 0.232940673828125, 0.26633453369140625, 0.2997283935546875, 0.33312225341796875, 0.36651611328125, 0.39990997314453125, 0.4333038330078125, 0.46669769287109375, 0.500091552734375, 0.5334854125976562, 0.5668792724609375, 0.6002731323242188, 0.6336669921875, 0.6670608520507812, 0.7004547119140625, 0.7338485717773438, 0.767242431640625, 0.8006362915039062, 0.8340301513671875, 0.8674240112304688, 0.90081787109375, 0.9342117309570312, 0.9676055908203125, 1.0009994506835938, 1.034393310546875, 1.0677871704101562, 1.1011810302734375, 1.1345748901367188, 1.16796875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 7.0, 14.0, 14.0, 17.0, 19.0, 26.0, 24.0, 23.0, 34.0, 45.0, 41.0, 62.0, 53.0, 52.0, 50.0, 51.0, 53.0, 68.0, 48.0, 46.0, 42.0, 41.0, 19.0, 32.0, 26.0, 12.0, 17.0, 8.0, 9.0, 11.0, 3.0, 8.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3283653259277344, -0.31664276123046875, -0.3049201965332031, -0.2931976318359375, -0.2814750671386719, -0.26975250244140625, -0.2580299377441406, -0.246307373046875, -0.23458480834960938, -0.22286224365234375, -0.21113967895507812, -0.1994171142578125, -0.18769454956054688, -0.17597198486328125, -0.16424942016601562, -0.15252685546875, -0.14080429077148438, -0.12908172607421875, -0.11735916137695312, -0.1056365966796875, -0.09391403198242188, -0.08219146728515625, -0.07046890258789062, -0.058746337890625, -0.047023773193359375, -0.03530120849609375, -0.023578643798828125, -0.0118560791015625, -0.000133514404296875, 0.01158905029296875, 0.023311614990234375, 0.0350341796875, 0.046756744384765625, 0.05847930908203125, 0.07020187377929688, 0.0819244384765625, 0.09364700317382812, 0.10536956787109375, 0.11709213256835938, 0.128814697265625, 0.14053726196289062, 0.15225982666015625, 0.16398239135742188, 0.1757049560546875, 0.18742752075195312, 0.19915008544921875, 0.21087265014648438, 0.22259521484375, 0.23431777954101562, 0.24604034423828125, 0.2577629089355469, 0.2694854736328125, 0.2812080383300781, 0.29293060302734375, 0.3046531677246094, 0.316375732421875, 0.3280982971191406, 0.33982086181640625, 0.3515434265136719, 0.3632659912109375, 0.3749885559082031, 0.38671112060546875, 0.3984336853027344, 0.41015625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 15.0, 23.0, 45.0, 45.0, 81.0, 147.0, 250.0, 543.0, 1119.0, 2638.0, 8344.0, 44778.0, 3008414.0, 1086484.0, 30774.0, 6609.0, 2135.0, 862.0, 412.0, 232.0, 105.0, 67.0, 42.0, 28.0, 22.0, 16.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9650344848632812, -0.9373931884765625, -0.9097518920898438, -0.882110595703125, -0.8544692993164062, -0.8268280029296875, -0.7991867065429688, -0.77154541015625, -0.7439041137695312, -0.7162628173828125, -0.6886215209960938, -0.660980224609375, -0.6333389282226562, -0.6056976318359375, -0.5780563354492188, -0.5504150390625, -0.5227737426757812, -0.4951324462890625, -0.46749114990234375, -0.439849853515625, -0.41220855712890625, -0.3845672607421875, -0.35692596435546875, -0.32928466796875, -0.30164337158203125, -0.2740020751953125, -0.24636077880859375, -0.218719482421875, -0.19107818603515625, -0.1634368896484375, -0.13579559326171875, -0.108154296875, -0.08051300048828125, -0.0528717041015625, -0.02523040771484375, 0.002410888671875, 0.03005218505859375, 0.0576934814453125, 0.08533477783203125, 0.11297607421875, 0.14061737060546875, 0.1682586669921875, 0.19589996337890625, 0.223541259765625, 0.25118255615234375, 0.2788238525390625, 0.30646514892578125, 0.3341064453125, 0.36174774169921875, 0.3893890380859375, 0.41703033447265625, 0.444671630859375, 0.47231292724609375, 0.4999542236328125, 0.5275955200195312, 0.55523681640625, 0.5828781127929688, 0.6105194091796875, 0.6381607055664062, 0.665802001953125, 0.6934432983398438, 0.7210845947265625, 0.7487258911132812, 0.7763671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 22.0, 16.0, 15.0, 49.0, 69.0, 157.0, 296.0, 574.0, 988.0, 877.0, 415.0, 241.0, 114.0, 66.0, 37.0, 27.0, 23.0, 15.0, 12.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.1618175506591797, -0.15530014038085938, -0.14878273010253906, -0.14226531982421875, -0.13574790954589844, -0.12923049926757812, -0.12271308898925781, -0.1161956787109375, -0.10967826843261719, -0.10316085815429688, -0.09664344787597656, -0.09012603759765625, -0.08360862731933594, -0.07709121704101562, -0.07057380676269531, -0.064056396484375, -0.05753898620605469, -0.051021575927734375, -0.04450416564941406, -0.03798675537109375, -0.03146934509277344, -0.024951934814453125, -0.018434524536132812, -0.0119171142578125, -0.0053997039794921875, 0.001117706298828125, 0.0076351165771484375, 0.01415252685546875, 0.020669937133789062, 0.027187347412109375, 0.03370475769042969, 0.04022216796875, 0.04673957824707031, 0.053256988525390625, 0.05977439880371094, 0.06629180908203125, 0.07280921936035156, 0.07932662963867188, 0.08584403991699219, 0.0923614501953125, 0.09887886047363281, 0.10539627075195312, 0.11191368103027344, 0.11843109130859375, 0.12494850158691406, 0.13146591186523438, 0.1379833221435547, 0.144500732421875, 0.1510181427001953, 0.15753555297851562, 0.16405296325683594, 0.17057037353515625, 0.17708778381347656, 0.18360519409179688, 0.1901226043701172, 0.1966400146484375, 0.2031574249267578, 0.20967483520507812, 0.21619224548339844, 0.22270965576171875, 0.22922706604003906, 0.23574447631835938, 0.2422618865966797, 0.248779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 10.0, 15.0, 13.0, 44.0, 52.0, 139.0, 189.0, 185.0, 136.0, 92.0, 58.0, 31.0, 15.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4539974927902222, -1.416054368019104, -1.3781112432479858, -1.3401682376861572, -1.302225112915039, -1.264281988143921, -1.2263388633728027, -1.1883957386016846, -1.1504526138305664, -1.1125094890594482, -1.07456636428833, -1.036623239517212, -0.9986801743507385, -0.9607371091842651, -0.922793984413147, -0.8848508596420288, -0.8469077944755554, -0.8089646697044373, -0.7710216045379639, -0.7330784797668457, -0.6951353549957275, -0.6571922302246094, -0.619249165058136, -0.5813060402870178, -0.5433629751205444, -0.5054198503494263, -0.4674767553806305, -0.4295336604118347, -0.39159053564071655, -0.3536474406719208, -0.315704345703125, -0.27776122093200684, -0.23981809616088867, -0.2018749862909317, -0.16393187642097473, -0.12598878145217896, -0.08804567158222198, -0.050102561712265015, -0.012159466743469238, 0.025783658027648926, 0.0637267529964447, 0.10166986286640167, 0.13961297273635864, 0.17755606770515442, 0.2154991775751114, 0.25344228744506836, 0.29138538241386414, 0.3293285071849823, 0.3672716021537781, 0.40521469712257385, 0.443157821893692, 0.4811009168624878, 0.519044041633606, 0.5569871664047241, 0.5949302315711975, 0.6328733563423157, 0.6708164215087891, 0.7087595462799072, 0.7467026114463806, 0.7846457362174988, 0.8225888609886169, 0.8605319261550903, 0.8984750509262085, 0.9364181756973267, 0.9743613004684448]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 9.0, 3.0, 10.0, 11.0, 11.0, 13.0, 10.0, 18.0, 12.0, 20.0, 21.0, 22.0, 29.0, 40.0, 46.0, 41.0, 42.0, 35.0, 39.0, 44.0, 41.0, 34.0, 41.0, 42.0, 45.0, 47.0, 35.0, 35.0, 26.0, 31.0, 23.0, 31.0, 18.0, 11.0, 9.0, 10.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3959617614746094, -0.3849647045135498, -0.37396761775016785, -0.3629705607891083, -0.3519735038280487, -0.34097644686698914, -0.3299793601036072, -0.3189823031425476, -0.30798524618148804, -0.29698818922042847, -0.2859911024570465, -0.27499404549598694, -0.26399698853492737, -0.2529999315738678, -0.24200284481048584, -0.23100578784942627, -0.2200087159872055, -0.20901164412498474, -0.19801458716392517, -0.1870175153017044, -0.17602045834064484, -0.16502338647842407, -0.1540263295173645, -0.14302925765514374, -0.13203218579292297, -0.1210351213812828, -0.11003805696964264, -0.09904098510742188, -0.0880439281463623, -0.07704685628414154, -0.06604979187250137, -0.055052727460861206, -0.044055670499801636, -0.03305860608816147, -0.022061539813876152, -0.011064473539590836, -6.740912795066833e-05, 0.010929655283689499, 0.021926723420619965, 0.03292378783226013, 0.0439208522439003, 0.054917916655540466, 0.06591498106718063, 0.0769120454788208, 0.08790911734104156, 0.09890617430210114, 0.1099032461643219, 0.12090031057596207, 0.13189737498760223, 0.142894446849823, 0.15389150381088257, 0.16488857567310333, 0.1758856326341629, 0.18688270449638367, 0.19787976145744324, 0.208876833319664, 0.21987390518188477, 0.23087097704410553, 0.2418680340051651, 0.25286510586738586, 0.26386216282844543, 0.274859219789505, 0.28585630655288696, 0.29685336351394653, 0.3078504204750061]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 15.0, 23.0, 32.0, 59.0, 102.0, 181.0, 339.0, 677.0, 1483.0, 4088.0, 14162.0, 80342.0, 663418.0, 242384.0, 29971.0, 6967.0, 2318.0, 942.0, 443.0, 218.0, 131.0, 96.0, 44.0, 34.0, 14.0, 14.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.1441783905029297, -0.13857650756835938, -0.13297462463378906, -0.12737274169921875, -0.12177085876464844, -0.11616897583007812, -0.11056709289550781, -0.1049652099609375, -0.09936332702636719, -0.09376144409179688, -0.08815956115722656, -0.08255767822265625, -0.07695579528808594, -0.07135391235351562, -0.06575202941894531, -0.060150146484375, -0.05454826354980469, -0.048946380615234375, -0.04334449768066406, -0.03774261474609375, -0.03214073181152344, -0.026538848876953125, -0.020936965942382812, -0.0153350830078125, -0.009733200073242188, -0.004131317138671875, 0.0014705657958984375, 0.00707244873046875, 0.012674331665039062, 0.018276214599609375, 0.023878097534179688, 0.02947998046875, 0.03508186340332031, 0.040683746337890625, 0.04628562927246094, 0.05188751220703125, 0.05748939514160156, 0.06309127807617188, 0.06869316101074219, 0.0742950439453125, 0.07989692687988281, 0.08549880981445312, 0.09110069274902344, 0.09670257568359375, 0.10230445861816406, 0.10790634155273438, 0.11350822448730469, 0.119110107421875, 0.12471199035644531, 0.13031387329101562, 0.13591575622558594, 0.14151763916015625, 0.14711952209472656, 0.15272140502929688, 0.1583232879638672, 0.1639251708984375, 0.1695270538330078, 0.17512893676757812, 0.18073081970214844, 0.18633270263671875, 0.19193458557128906, 0.19753646850585938, 0.2031383514404297, 0.208740234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 9.0, 7.0, 12.0, 11.0, 14.0, 9.0, 18.0, 30.0, 25.0, 38.0, 48.0, 53.0, 47.0, 54.0, 53.0, 63.0, 55.0, 58.0, 60.0, 43.0, 56.0, 38.0, 32.0, 36.0, 35.0, 28.0, 15.0, 10.0, 14.0, 4.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2773017883300781, -0.26773834228515625, -0.2581748962402344, -0.2486114501953125, -0.23904800415039062, -0.22948455810546875, -0.21992111206054688, -0.210357666015625, -0.20079421997070312, -0.19123077392578125, -0.18166732788085938, -0.1721038818359375, -0.16254043579101562, -0.15297698974609375, -0.14341354370117188, -0.13385009765625, -0.12428665161132812, -0.11472320556640625, -0.10515975952148438, -0.0955963134765625, -0.08603286743164062, -0.07646942138671875, -0.06690597534179688, -0.057342529296875, -0.047779083251953125, -0.03821563720703125, -0.028652191162109375, -0.0190887451171875, -0.009525299072265625, 3.814697265625e-05, 0.009601593017578125, 0.0191650390625, 0.028728485107421875, 0.03829193115234375, 0.047855377197265625, 0.0574188232421875, 0.06698226928710938, 0.07654571533203125, 0.08610916137695312, 0.095672607421875, 0.10523605346679688, 0.11479949951171875, 0.12436294555664062, 0.1339263916015625, 0.14348983764648438, 0.15305328369140625, 0.16261672973632812, 0.17218017578125, 0.18174362182617188, 0.19130706787109375, 0.20087051391601562, 0.2104339599609375, 0.21999740600585938, 0.22956085205078125, 0.23912429809570312, 0.248687744140625, 0.2582511901855469, 0.26781463623046875, 0.2773780822753906, 0.2869415283203125, 0.2965049743652344, 0.30606842041015625, 0.3156318664550781, 0.3251953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 25.0, 26.0, 53.0, 82.0, 100.0, 140.0, 183.0, 320.0, 514.0, 799.0, 1380.0, 2535.0, 5544.0, 14214.0, 47166.0, 210498.0, 534732.0, 166962.0, 39489.0, 12687.0, 5100.0, 2407.0, 1367.0, 763.0, 428.0, 310.0, 200.0, 142.0, 112.0, 66.0, 55.0, 25.0, 25.0, 19.0, 10.0, 12.0, 5.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0], "bins": [-0.11151123046875, -0.10853195190429688, -0.10555267333984375, -0.10257339477539062, -0.0995941162109375, -0.09661483764648438, -0.09363555908203125, -0.09065628051757812, -0.087677001953125, -0.08469772338867188, -0.08171844482421875, -0.07873916625976562, -0.0757598876953125, -0.07278060913085938, -0.06980133056640625, -0.06682205200195312, -0.0638427734375, -0.060863494873046875, -0.05788421630859375, -0.054904937744140625, -0.0519256591796875, -0.048946380615234375, -0.04596710205078125, -0.042987823486328125, -0.040008544921875, -0.037029266357421875, -0.03404998779296875, -0.031070709228515625, -0.0280914306640625, -0.025112152099609375, -0.02213287353515625, -0.019153594970703125, -0.01617431640625, -0.013195037841796875, -0.01021575927734375, -0.007236480712890625, -0.0042572021484375, -0.001277923583984375, 0.00170135498046875, 0.004680633544921875, 0.007659912109375, 0.010639190673828125, 0.01361846923828125, 0.016597747802734375, 0.0195770263671875, 0.022556304931640625, 0.02553558349609375, 0.028514862060546875, 0.031494140625, 0.034473419189453125, 0.03745269775390625, 0.040431976318359375, 0.0434112548828125, 0.046390533447265625, 0.04936981201171875, 0.052349090576171875, 0.055328369140625, 0.058307647705078125, 0.06128692626953125, 0.06426620483398438, 0.0672454833984375, 0.07022476196289062, 0.07320404052734375, 0.07618331909179688, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 7.0, 10.0, 19.0, 18.0, 27.0, 25.0, 28.0, 40.0, 36.0, 35.0, 37.0, 45.0, 59.0, 48.0, 53.0, 55.0, 52.0, 47.0, 51.0, 39.0, 39.0, 38.0, 31.0, 23.0, 18.0, 23.0, 10.0, 18.0, 8.0, 5.0, 10.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4663810729980469, -0.45058441162109375, -0.4347877502441406, -0.4189910888671875, -0.4031944274902344, -0.38739776611328125, -0.3716011047363281, -0.355804443359375, -0.3400077819824219, -0.32421112060546875, -0.3084144592285156, -0.2926177978515625, -0.2768211364746094, -0.26102447509765625, -0.24522781372070312, -0.22943115234375, -0.21363449096679688, -0.19783782958984375, -0.18204116821289062, -0.1662445068359375, -0.15044784545898438, -0.13465118408203125, -0.11885452270507812, -0.103057861328125, -0.08726119995117188, -0.07146453857421875, -0.055667877197265625, -0.0398712158203125, -0.024074554443359375, -0.00827789306640625, 0.007518768310546875, 0.0233154296875, 0.039112091064453125, 0.05490875244140625, 0.07070541381835938, 0.0865020751953125, 0.10229873657226562, 0.11809539794921875, 0.13389205932617188, 0.149688720703125, 0.16548538208007812, 0.18128204345703125, 0.19707870483398438, 0.2128753662109375, 0.22867202758789062, 0.24446868896484375, 0.2602653503417969, 0.27606201171875, 0.2918586730957031, 0.30765533447265625, 0.3234519958496094, 0.3392486572265625, 0.3550453186035156, 0.37084197998046875, 0.3866386413574219, 0.402435302734375, 0.4182319641113281, 0.43402862548828125, 0.4498252868652344, 0.4656219482421875, 0.4814186096191406, 0.49721527099609375, 0.5130119323730469, 0.52880859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 17.0, 17.0, 28.0, 44.0, 52.0, 101.0, 162.0, 258.0, 478.0, 998.0, 2073.0, 4651.0, 12838.0, 45234.0, 230089.0, 557710.0, 144950.0, 31728.0, 9828.0, 3766.0, 1625.0, 833.0, 425.0, 216.0, 155.0, 86.0, 53.0, 36.0, 28.0, 10.0, 12.0, 14.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03021240234375, -0.029249191284179688, -0.028285980224609375, -0.027322769165039062, -0.02635955810546875, -0.025396347045898438, -0.024433135986328125, -0.023469924926757812, -0.0225067138671875, -0.021543502807617188, -0.020580291748046875, -0.019617080688476562, -0.01865386962890625, -0.017690658569335938, -0.016727447509765625, -0.015764236450195312, -0.014801025390625, -0.013837814331054688, -0.012874603271484375, -0.011911392211914062, -0.01094818115234375, -0.009984970092773438, -0.009021759033203125, -0.008058547973632812, -0.0070953369140625, -0.0061321258544921875, -0.005168914794921875, -0.0042057037353515625, -0.00324249267578125, -0.0022792816162109375, -0.001316070556640625, -0.0003528594970703125, 0.0006103515625, 0.0015735626220703125, 0.002536773681640625, 0.0034999847412109375, 0.00446319580078125, 0.0054264068603515625, 0.006389617919921875, 0.0073528289794921875, 0.0083160400390625, 0.009279251098632812, 0.010242462158203125, 0.011205673217773438, 0.01216888427734375, 0.013132095336914062, 0.014095306396484375, 0.015058517456054688, 0.016021728515625, 0.016984939575195312, 0.017948150634765625, 0.018911361694335938, 0.01987457275390625, 0.020837783813476562, 0.021800994873046875, 0.022764205932617188, 0.0237274169921875, 0.024690628051757812, 0.025653839111328125, 0.026617050170898438, 0.02758026123046875, 0.028543472290039062, 0.029506683349609375, 0.030469894409179688, 0.03143310546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 1.0, 5.0, 8.0, 7.0, 22.0, 12.0, 32.0, 38.0, 49.0, 65.0, 94.0, 112.0, 110.0, 110.0, 71.0, 69.0, 52.0, 31.0, 30.0, 20.0, 18.0, 7.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4781951904296875e-05, -1.4241784811019897e-05, -1.370161771774292e-05, -1.3161450624465942e-05, -1.2621283531188965e-05, -1.2081116437911987e-05, -1.154094934463501e-05, -1.1000782251358032e-05, -1.0460615158081055e-05, -9.920448064804077e-06, -9.3802809715271e-06, -8.840113878250122e-06, -8.299946784973145e-06, -7.759779691696167e-06, -7.2196125984191895e-06, -6.679445505142212e-06, -6.139278411865234e-06, -5.599111318588257e-06, -5.058944225311279e-06, -4.518777132034302e-06, -3.978610038757324e-06, -3.4384429454803467e-06, -2.898275852203369e-06, -2.3581087589263916e-06, -1.817941665649414e-06, -1.2777745723724365e-06, -7.37607479095459e-07, -1.9744038581848145e-07, 3.427267074584961e-07, 8.828938007354736e-07, 1.4230608940124512e-06, 1.9632279872894287e-06, 2.5033950805664062e-06, 3.043562173843384e-06, 3.5837292671203613e-06, 4.123896360397339e-06, 4.664063453674316e-06, 5.204230546951294e-06, 5.7443976402282715e-06, 6.284564733505249e-06, 6.8247318267822266e-06, 7.364898920059204e-06, 7.905066013336182e-06, 8.44523310661316e-06, 8.985400199890137e-06, 9.525567293167114e-06, 1.0065734386444092e-05, 1.060590147972107e-05, 1.1146068572998047e-05, 1.1686235666275024e-05, 1.2226402759552002e-05, 1.276656985282898e-05, 1.3306736946105957e-05, 1.3846904039382935e-05, 1.4387071132659912e-05, 1.492723822593689e-05, 1.5467405319213867e-05, 1.6007572412490845e-05, 1.6547739505767822e-05, 1.70879065990448e-05, 1.7628073692321777e-05, 1.8168240785598755e-05, 1.8708407878875732e-05, 1.924857497215271e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 15.0, 18.0, 37.0, 46.0, 84.0, 121.0, 160.0, 287.0, 466.0, 766.0, 1242.0, 2375.0, 4582.0, 8882.0, 19570.0, 46646.0, 123927.0, 304241.0, 314509.0, 130991.0, 49634.0, 20278.0, 9289.0, 4528.0, 2439.0, 1314.0, 780.0, 463.0, 302.0, 182.0, 112.0, 74.0, 57.0, 42.0, 27.0, 19.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017547607421875, -0.016921520233154297, -0.016295433044433594, -0.01566934585571289, -0.015043258666992188, -0.014417171478271484, -0.013791084289550781, -0.013164997100830078, -0.012538909912109375, -0.011912822723388672, -0.011286735534667969, -0.010660648345947266, -0.010034561157226562, -0.00940847396850586, -0.008782386779785156, -0.008156299591064453, -0.00753021240234375, -0.006904125213623047, -0.006278038024902344, -0.005651950836181641, -0.0050258636474609375, -0.004399776458740234, -0.0037736892700195312, -0.003147602081298828, -0.002521514892578125, -0.0018954277038574219, -0.0012693405151367188, -0.0006432533264160156, -1.71661376953125e-05, 0.0006089210510253906, 0.0012350082397460938, 0.0018610954284667969, 0.0024871826171875, 0.003113269805908203, 0.0037393569946289062, 0.004365444183349609, 0.0049915313720703125, 0.005617618560791016, 0.006243705749511719, 0.006869792938232422, 0.007495880126953125, 0.008121967315673828, 0.008748054504394531, 0.009374141693115234, 0.010000228881835938, 0.01062631607055664, 0.011252403259277344, 0.011878490447998047, 0.01250457763671875, 0.013130664825439453, 0.013756752014160156, 0.01438283920288086, 0.015008926391601562, 0.015635013580322266, 0.01626110076904297, 0.016887187957763672, 0.017513275146484375, 0.018139362335205078, 0.01876544952392578, 0.019391536712646484, 0.020017623901367188, 0.02064371109008789, 0.021269798278808594, 0.021895885467529297, 0.02252197265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 18.0, 14.0, 20.0, 23.0, 31.0, 35.0, 40.0, 59.0, 54.0, 77.0, 79.0, 51.0, 69.0, 74.0, 52.0, 48.0, 51.0, 24.0, 38.0, 30.0, 24.0, 12.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00891876220703125, -0.008684635162353516, -0.008450508117675781, -0.008216381072998047, -0.007982254028320312, -0.007748126983642578, -0.007513999938964844, -0.007279872894287109, -0.007045745849609375, -0.006811618804931641, -0.006577491760253906, -0.006343364715576172, -0.0061092376708984375, -0.005875110626220703, -0.005640983581542969, -0.005406856536865234, -0.0051727294921875, -0.004938602447509766, -0.004704475402832031, -0.004470348358154297, -0.0042362213134765625, -0.004002094268798828, -0.0037679672241210938, -0.0035338401794433594, -0.003299713134765625, -0.0030655860900878906, -0.0028314590454101562, -0.002597332000732422, -0.0023632049560546875, -0.002129077911376953, -0.0018949508666992188, -0.0016608238220214844, -0.00142669677734375, -0.0011925697326660156, -0.0009584426879882812, -0.0007243156433105469, -0.0004901885986328125, -0.0002560615539550781, -2.193450927734375e-05, 0.00021219253540039062, 0.000446319580078125, 0.0006804466247558594, 0.0009145736694335938, 0.0011487007141113281, 0.0013828277587890625, 0.0016169548034667969, 0.0018510818481445312, 0.0020852088928222656, 0.0023193359375, 0.0025534629821777344, 0.0027875900268554688, 0.003021717071533203, 0.0032558441162109375, 0.003489971160888672, 0.0037240982055664062, 0.003958225250244141, 0.004192352294921875, 0.004426479339599609, 0.004660606384277344, 0.004894733428955078, 0.0051288604736328125, 0.005362987518310547, 0.005597114562988281, 0.005831241607666016, 0.00606536865234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 44.0, 51.0, 104.0, 159.0, 174.0, 157.0, 104.0, 61.0, 43.0, 19.0, 19.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.8640743494033813, -0.8442875146865845, -0.8245007395744324, -0.8047139048576355, -0.7849271297454834, -0.7651402950286865, -0.7453534603118896, -0.7255666255950928, -0.7057798504829407, -0.6859930157661438, -0.6662062406539917, -0.6464194059371948, -0.626632571220398, -0.6068457961082458, -0.587058961391449, -0.5672721862792969, -0.5474853515625, -0.5276985168457031, -0.507911741733551, -0.48812490701675415, -0.46833810210227966, -0.4485512971878052, -0.4287644624710083, -0.4089776575565338, -0.3891908526420593, -0.36940404772758484, -0.34961724281311035, -0.3298304080963135, -0.310043603181839, -0.2902567982673645, -0.2704699635505676, -0.25068315863609314, -0.23089641332626343, -0.21110960841178894, -0.19132278859615326, -0.17153596878051758, -0.1517491638660431, -0.1319623589515686, -0.11217553913593292, -0.09238871932029724, -0.07260191440582275, -0.05281510204076767, -0.033028289675712585, -0.013241477310657501, 0.006545335054397583, 0.026332147419452667, 0.04611895978450775, 0.06590577960014343, 0.08569258451461792, 0.105479396879673, 0.1252662092447281, 0.14505302906036377, 0.16483983397483826, 0.18462663888931274, 0.20441345870494843, 0.2242002785205841, 0.2439870834350586, 0.2637738883495331, 0.28356069326400757, 0.30334752798080444, 0.32313433289527893, 0.3429211378097534, 0.3627079725265503, 0.3824947774410248, 0.40228158235549927]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 10.0, 6.0, 3.0, 10.0, 7.0, 16.0, 11.0, 15.0, 15.0, 19.0, 27.0, 28.0, 35.0, 46.0, 42.0, 60.0, 53.0, 41.0, 50.0, 43.0, 62.0, 53.0, 57.0, 43.0, 48.0, 32.0, 43.0, 33.0, 22.0, 17.0, 12.0, 14.0, 8.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2526215612888336, -0.24417267739772797, -0.23572379350662231, -0.22727490961551666, -0.218826025724411, -0.21037714183330536, -0.2019282579421997, -0.19347938895225525, -0.1850304901599884, -0.17658160626888275, -0.1681327223777771, -0.15968383848667145, -0.1512349545955658, -0.14278607070446014, -0.1343371868133545, -0.12588831782341003, -0.11743943393230438, -0.10899055004119873, -0.10054166615009308, -0.09209278225898743, -0.08364389836788177, -0.07519501447677612, -0.06674613803625107, -0.058297254145145416, -0.049848370254039764, -0.04139948636293411, -0.03295060247182846, -0.024501722306013107, -0.016052838414907455, -0.007603954523801804, 0.0008449256420135498, 0.009293809533119202, 0.017742693424224854, 0.026191577315330505, 0.03464046120643616, 0.04308934137225151, 0.05153822526335716, 0.059987109154462814, 0.06843598932027817, 0.07688487321138382, 0.08533375710248947, 0.09378264099359512, 0.10223152488470078, 0.11068040132522583, 0.11912928521633148, 0.12757816910743713, 0.13602705299854279, 0.14447593688964844, 0.1529248207807541, 0.16137370467185974, 0.1698225885629654, 0.17827147245407104, 0.1867203563451767, 0.19516924023628235, 0.2036181092262268, 0.21206700801849365, 0.2205158770084381, 0.22896476089954376, 0.23741364479064941, 0.24586252868175507, 0.2543114125728607, 0.2627602815628052, 0.271209180355072, 0.2796580493450165, 0.2881069481372833]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 11.0, 18.0, 23.0, 28.0, 50.0, 69.0, 88.0, 118.0, 202.0, 273.0, 448.0, 699.0, 1246.0, 2173.0, 4392.0, 8942.0, 21255.0, 56364.0, 244036.0, 559658.0, 92269.0, 30941.0, 12612.0, 5724.0, 2887.0, 1552.0, 834.0, 548.0, 308.0, 229.0, 160.0, 107.0, 76.0, 50.0, 32.0, 26.0, 24.0, 23.0, 12.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.196044921875, -0.19031333923339844, -0.18458175659179688, -0.1788501739501953, -0.17311859130859375, -0.1673870086669922, -0.16165542602539062, -0.15592384338378906, -0.1501922607421875, -0.14446067810058594, -0.13872909545898438, -0.1329975128173828, -0.12726593017578125, -0.12153434753417969, -0.11580276489257812, -0.11007118225097656, -0.104339599609375, -0.09860801696777344, -0.09287643432617188, -0.08714485168457031, -0.08141326904296875, -0.07568168640136719, -0.06995010375976562, -0.06421852111816406, -0.0584869384765625, -0.05275535583496094, -0.047023773193359375, -0.04129219055175781, -0.03556060791015625, -0.029829025268554688, -0.024097442626953125, -0.018365859985351562, -0.01263427734375, -0.0069026947021484375, -0.001171112060546875, 0.0045604705810546875, 0.01029205322265625, 0.016023635864257812, 0.021755218505859375, 0.027486801147460938, 0.0332183837890625, 0.03894996643066406, 0.044681549072265625, 0.05041313171386719, 0.05614471435546875, 0.06187629699707031, 0.06760787963867188, 0.07333946228027344, 0.079071044921875, 0.08480262756347656, 0.09053421020507812, 0.09626579284667969, 0.10199737548828125, 0.10772895812988281, 0.11346054077148438, 0.11919212341308594, 0.1249237060546875, 0.13065528869628906, 0.13638687133789062, 0.1421184539794922, 0.14785003662109375, 0.1535816192626953, 0.15931320190429688, 0.16504478454589844, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 10.0, 18.0, 17.0, 18.0, 28.0, 34.0, 54.0, 50.0, 66.0, 47.0, 56.0, 66.0, 50.0, 58.0, 60.0, 63.0, 50.0, 29.0, 44.0, 24.0, 34.0, 18.0, 14.0, 13.0, 5.0, 6.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5216445922851562, -0.5027618408203125, -0.48387908935546875, -0.464996337890625, -0.44611358642578125, -0.4272308349609375, -0.40834808349609375, -0.38946533203125, -0.37058258056640625, -0.3516998291015625, -0.33281707763671875, -0.313934326171875, -0.29505157470703125, -0.2761688232421875, -0.25728607177734375, -0.2384033203125, -0.21952056884765625, -0.2006378173828125, -0.18175506591796875, -0.162872314453125, -0.14398956298828125, -0.1251068115234375, -0.10622406005859375, -0.08734130859375, -0.06845855712890625, -0.0495758056640625, -0.03069305419921875, -0.011810302734375, 0.00707244873046875, 0.0259552001953125, 0.04483795166015625, 0.063720703125, 0.08260345458984375, 0.1014862060546875, 0.12036895751953125, 0.139251708984375, 0.15813446044921875, 0.1770172119140625, 0.19589996337890625, 0.21478271484375, 0.23366546630859375, 0.2525482177734375, 0.27143096923828125, 0.290313720703125, 0.30919647216796875, 0.3280792236328125, 0.34696197509765625, 0.3658447265625, 0.38472747802734375, 0.4036102294921875, 0.42249298095703125, 0.441375732421875, 0.46025848388671875, 0.4791412353515625, 0.49802398681640625, 0.51690673828125, 0.5357894897460938, 0.5546722412109375, 0.5735549926757812, 0.592437744140625, 0.6113204956054688, 0.6302032470703125, 0.6490859985351562, 0.66796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 9.0, 8.0, 8.0, 12.0, 10.0, 22.0, 17.0, 20.0, 37.0, 49.0, 66.0, 80.0, 139.0, 404.0, 2014.0, 46598.0, 970749.0, 25869.0, 1553.0, 382.0, 140.0, 93.0, 49.0, 42.0, 34.0, 34.0, 15.0, 20.0, 24.0, 16.0, 8.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7824478149414062, -0.7597198486328125, -0.7369918823242188, -0.714263916015625, -0.6915359497070312, -0.6688079833984375, -0.6460800170898438, -0.62335205078125, -0.6006240844726562, -0.5778961181640625, -0.5551681518554688, -0.532440185546875, -0.5097122192382812, -0.4869842529296875, -0.46425628662109375, -0.4415283203125, -0.41880035400390625, -0.3960723876953125, -0.37334442138671875, -0.350616455078125, -0.32788848876953125, -0.3051605224609375, -0.28243255615234375, -0.25970458984375, -0.23697662353515625, -0.2142486572265625, -0.19152069091796875, -0.168792724609375, -0.14606475830078125, -0.1233367919921875, -0.10060882568359375, -0.077880859375, -0.05515289306640625, -0.0324249267578125, -0.00969696044921875, 0.013031005859375, 0.03575897216796875, 0.0584869384765625, 0.08121490478515625, 0.10394287109375, 0.12667083740234375, 0.1493988037109375, 0.17212677001953125, 0.194854736328125, 0.21758270263671875, 0.2403106689453125, 0.26303863525390625, 0.2857666015625, 0.30849456787109375, 0.3312225341796875, 0.35395050048828125, 0.376678466796875, 0.39940643310546875, 0.4221343994140625, 0.44486236572265625, 0.46759033203125, 0.49031829833984375, 0.5130462646484375, 0.5357742309570312, 0.558502197265625, 0.5812301635742188, 0.6039581298828125, 0.6266860961914062, 0.6494140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 13.0, 5.0, 10.0, 6.0, 15.0, 12.0, 14.0, 23.0, 28.0, 39.0, 34.0, 47.0, 45.0, 51.0, 64.0, 60.0, 53.0, 54.0, 57.0, 51.0, 44.0, 53.0, 39.0, 26.0, 22.0, 25.0, 19.0, 24.0, 13.0, 12.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.59356689453125, -0.5743408203125, -0.55511474609375, -0.535888671875, -0.51666259765625, -0.4974365234375, -0.47821044921875, -0.458984375, -0.43975830078125, -0.4205322265625, -0.40130615234375, -0.382080078125, -0.36285400390625, -0.3436279296875, -0.32440185546875, -0.30517578125, -0.28594970703125, -0.2667236328125, -0.24749755859375, -0.228271484375, -0.20904541015625, -0.1898193359375, -0.17059326171875, -0.1513671875, -0.13214111328125, -0.1129150390625, -0.09368896484375, -0.074462890625, -0.05523681640625, -0.0360107421875, -0.01678466796875, 0.00244140625, 0.02166748046875, 0.0408935546875, 0.06011962890625, 0.079345703125, 0.09857177734375, 0.1177978515625, 0.13702392578125, 0.15625, 0.17547607421875, 0.1947021484375, 0.21392822265625, 0.233154296875, 0.25238037109375, 0.2716064453125, 0.29083251953125, 0.31005859375, 0.32928466796875, 0.3485107421875, 0.36773681640625, 0.386962890625, 0.40618896484375, 0.4254150390625, 0.44464111328125, 0.4638671875, 0.48309326171875, 0.5023193359375, 0.52154541015625, 0.540771484375, 0.55999755859375, 0.5792236328125, 0.59844970703125, 0.61767578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 7.0, 8.0, 15.0, 25.0, 45.0, 99.0, 212.0, 552.0, 1684.0, 9674.0, 318866.0, 702227.0, 12258.0, 1840.0, 566.0, 261.0, 87.0, 58.0, 19.0, 21.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14550018310546875, -0.1389007568359375, -0.13230133056640625, -0.125701904296875, -0.11910247802734375, -0.1125030517578125, -0.10590362548828125, -0.09930419921875, -0.09270477294921875, -0.0861053466796875, -0.07950592041015625, -0.072906494140625, -0.06630706787109375, -0.0597076416015625, -0.05310821533203125, -0.0465087890625, -0.03990936279296875, -0.0333099365234375, -0.02671051025390625, -0.020111083984375, -0.01351165771484375, -0.0069122314453125, -0.00031280517578125, 0.00628662109375, 0.01288604736328125, 0.0194854736328125, 0.02608489990234375, 0.032684326171875, 0.03928375244140625, 0.0458831787109375, 0.05248260498046875, 0.05908203125, 0.06568145751953125, 0.0722808837890625, 0.07888031005859375, 0.085479736328125, 0.09207916259765625, 0.0986785888671875, 0.10527801513671875, 0.11187744140625, 0.11847686767578125, 0.1250762939453125, 0.13167572021484375, 0.138275146484375, 0.14487457275390625, 0.1514739990234375, 0.15807342529296875, 0.1646728515625, 0.17127227783203125, 0.1778717041015625, 0.18447113037109375, 0.191070556640625, 0.19766998291015625, 0.2042694091796875, 0.21086883544921875, 0.21746826171875, 0.22406768798828125, 0.2306671142578125, 0.23726654052734375, 0.243865966796875, 0.25046539306640625, 0.2570648193359375, 0.26366424560546875, 0.270263671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 2.0, 8.0, 15.0, 19.0, 20.0, 30.0, 41.0, 76.0, 212.0, 291.0, 98.0, 50.0, 41.0, 19.0, 16.0, 20.0, 14.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4497509002685547e-05, -2.3801811039447784e-05, -2.3106113076210022e-05, -2.241041511297226e-05, -2.1714717149734497e-05, -2.1019019186496735e-05, -2.0323321223258972e-05, -1.962762326002121e-05, -1.8931925296783447e-05, -1.8236227333545685e-05, -1.7540529370307922e-05, -1.684483140707016e-05, -1.6149133443832397e-05, -1.5453435480594635e-05, -1.4757737517356873e-05, -1.406203955411911e-05, -1.3366341590881348e-05, -1.2670643627643585e-05, -1.1974945664405823e-05, -1.127924770116806e-05, -1.0583549737930298e-05, -9.887851774692535e-06, -9.192153811454773e-06, -8.49645584821701e-06, -7.800757884979248e-06, -7.105059921741486e-06, -6.409361958503723e-06, -5.713663995265961e-06, -5.017966032028198e-06, -4.322268068790436e-06, -3.6265701055526733e-06, -2.930872142314911e-06, -2.2351741790771484e-06, -1.539476215839386e-06, -8.437782526016235e-07, -1.4808028936386108e-07, 5.476176738739014e-07, 1.2433156371116638e-06, 1.9390136003494263e-06, 2.6347115635871887e-06, 3.330409526824951e-06, 4.026107490062714e-06, 4.721805453300476e-06, 5.4175034165382385e-06, 6.113201379776001e-06, 6.8088993430137634e-06, 7.504597306251526e-06, 8.200295269489288e-06, 8.89599323272705e-06, 9.591691195964813e-06, 1.0287389159202576e-05, 1.0983087122440338e-05, 1.16787850856781e-05, 1.2374483048915863e-05, 1.3070181012153625e-05, 1.3765878975391388e-05, 1.446157693862915e-05, 1.5157274901866913e-05, 1.5852972865104675e-05, 1.6548670828342438e-05, 1.72443687915802e-05, 1.7940066754817963e-05, 1.8635764718055725e-05, 1.9331462681293488e-05, 2.002716064453125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 12.0, 18.0, 36.0, 42.0, 63.0, 72.0, 139.0, 195.0, 318.0, 559.0, 1172.0, 3501.0, 24299.0, 855156.0, 149600.0, 9192.0, 2107.0, 779.0, 470.0, 257.0, 179.0, 119.0, 77.0, 64.0, 43.0, 19.0, 18.0, 13.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.26708984375, -0.2606983184814453, -0.2543067932128906, -0.24791526794433594, -0.24152374267578125, -0.23513221740722656, -0.22874069213867188, -0.2223491668701172, -0.2159576416015625, -0.2095661163330078, -0.20317459106445312, -0.19678306579589844, -0.19039154052734375, -0.18400001525878906, -0.17760848999023438, -0.1712169647216797, -0.164825439453125, -0.1584339141845703, -0.15204238891601562, -0.14565086364746094, -0.13925933837890625, -0.13286781311035156, -0.12647628784179688, -0.12008476257324219, -0.1136932373046875, -0.10730171203613281, -0.10091018676757812, -0.09451866149902344, -0.08812713623046875, -0.08173561096191406, -0.07534408569335938, -0.06895256042480469, -0.06256103515625, -0.05616950988769531, -0.049777984619140625, -0.04338645935058594, -0.03699493408203125, -0.030603408813476562, -0.024211883544921875, -0.017820358276367188, -0.0114288330078125, -0.0050373077392578125, 0.001354217529296875, 0.0077457427978515625, 0.01413726806640625, 0.020528793334960938, 0.026920318603515625, 0.03331184387207031, 0.039703369140625, 0.04609489440917969, 0.052486419677734375, 0.05887794494628906, 0.06526947021484375, 0.07166099548339844, 0.07805252075195312, 0.08444404602050781, 0.0908355712890625, 0.09722709655761719, 0.10361862182617188, 0.11001014709472656, 0.11640167236328125, 0.12279319763183594, 0.12918472290039062, 0.1355762481689453, 0.1419677734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 48.0, 66.0, 114.0, 311.0, 107.0, 64.0, 47.0, 32.0, 28.0, 21.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0455322265625, -0.04398965835571289, -0.04244709014892578, -0.04090452194213867, -0.03936195373535156, -0.03781938552856445, -0.036276817321777344, -0.034734249114990234, -0.033191680908203125, -0.031649112701416016, -0.030106544494628906, -0.028563976287841797, -0.027021408081054688, -0.025478839874267578, -0.02393627166748047, -0.02239370346069336, -0.02085113525390625, -0.01930856704711914, -0.01776599884033203, -0.016223430633544922, -0.014680862426757812, -0.013138294219970703, -0.011595726013183594, -0.010053157806396484, -0.008510589599609375, -0.006968021392822266, -0.005425453186035156, -0.003882884979248047, -0.0023403167724609375, -0.0007977485656738281, 0.0007448196411132812, 0.0022873878479003906, 0.0038299560546875, 0.005372524261474609, 0.006915092468261719, 0.008457660675048828, 0.010000228881835938, 0.011542797088623047, 0.013085365295410156, 0.014627933502197266, 0.016170501708984375, 0.017713069915771484, 0.019255638122558594, 0.020798206329345703, 0.022340774536132812, 0.023883342742919922, 0.02542591094970703, 0.02696847915649414, 0.02851104736328125, 0.03005361557006836, 0.03159618377685547, 0.03313875198364258, 0.03468132019042969, 0.0362238883972168, 0.037766456604003906, 0.039309024810791016, 0.040851593017578125, 0.042394161224365234, 0.043936729431152344, 0.04547929763793945, 0.04702186584472656, 0.04856443405151367, 0.05010700225830078, 0.05164957046508789, 0.053192138671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 11.0, 19.0, 35.0, 85.0, 199.0, 253.0, 203.0, 92.0, 53.0, 25.0, 11.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.837075710296631, -2.7774691581726074, -2.717862606048584, -2.6582562923431396, -2.598649740219116, -2.5390431880950928, -2.4794368743896484, -2.419830322265625, -2.3602237701416016, -2.300617218017578, -2.2410106658935547, -2.1814043521881104, -2.121797800064087, -2.0621912479400635, -2.002584934234619, -1.9429783821105957, -1.8833718299865723, -1.8237652778625488, -1.764158844947815, -1.704552412033081, -1.6449458599090576, -1.5853393077850342, -1.5257328748703003, -1.4661264419555664, -1.406519889831543, -1.3469133377075195, -1.2873069047927856, -1.2277004718780518, -1.1680939197540283, -1.1084873676300049, -1.048880934715271, -0.9892744421958923, -0.9296679496765137, -0.870061457157135, -0.8104549646377563, -0.7508484721183777, -0.691241979598999, -0.6316354870796204, -0.5720289945602417, -0.512422502040863, -0.4528160095214844, -0.3932095170021057, -0.33360302448272705, -0.2739965319633484, -0.21439003944396973, -0.15478354692459106, -0.0951770544052124, -0.03557056188583374, 0.024035930633544922, 0.08364242315292358, 0.14324891567230225, 0.2028554081916809, 0.26246190071105957, 0.32206839323043823, 0.3816748857498169, 0.44128137826919556, 0.5008878707885742, 0.5604943633079529, 0.6201008558273315, 0.6797073483467102, 0.7393138408660889, 0.7989203333854675, 0.8585268259048462, 0.9181333184242249, 0.9777398109436035]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 6.0, 12.0, 13.0, 13.0, 30.0, 16.0, 18.0, 26.0, 30.0, 27.0, 35.0, 32.0, 28.0, 37.0, 41.0, 37.0, 48.0, 40.0, 42.0, 55.0, 45.0, 37.0, 31.0, 32.0, 34.0, 30.0, 21.0, 19.0, 23.0, 17.0, 21.0, 12.0, 9.0, 15.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7865099310874939, -0.7614437937736511, -0.7363776564598083, -0.7113115191459656, -0.6862453818321228, -0.66117924451828, -0.6361130475997925, -0.6110469102859497, -0.5859807729721069, -0.5609146356582642, -0.5358484983444214, -0.5107823610305786, -0.48571622371673584, -0.46065008640289307, -0.4355839192867279, -0.41051778197288513, -0.38545167446136475, -0.360385537147522, -0.3353193998336792, -0.3102532625198364, -0.28518712520599365, -0.2601209878921509, -0.23505482077598572, -0.20998868346214294, -0.18492254614830017, -0.1598564088344574, -0.13479027152061462, -0.10972411930561066, -0.08465798199176788, -0.05959184467792511, -0.03452569246292114, -0.00945955514907837, 0.01560664176940918, 0.04067278280854225, 0.06573892384767532, 0.0908050686120987, 0.11587120592594147, 0.14093734323978424, 0.1660034954547882, 0.19106963276863098, 0.21613577008247375, 0.24120190739631653, 0.2662680447101593, 0.29133421182632446, 0.31640034914016724, 0.34146648645401, 0.3665326237678528, 0.39159876108169556, 0.41666489839553833, 0.4417310357093811, 0.4667971730232239, 0.49186331033706665, 0.5169294476509094, 0.5419955849647522, 0.5670617818832397, 0.5921279191970825, 0.6171940565109253, 0.6422601938247681, 0.6673263311386108, 0.6923924684524536, 0.7174586057662964, 0.7425247430801392, 0.7675908803939819, 0.7926570177078247, 0.8177231550216675]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 5.0, 11.0, 22.0, 18.0, 27.0, 37.0, 55.0, 81.0, 117.0, 172.0, 257.0, 393.0, 598.0, 1036.0, 2005.0, 4166.0, 14365.0, 147184.0, 3508166.0, 478432.0, 25545.0, 5891.0, 2398.0, 1238.0, 743.0, 417.0, 270.0, 196.0, 122.0, 88.0, 68.0, 47.0, 19.0, 24.0, 10.0, 10.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.6587905883789062, -0.6349639892578125, -0.6111373901367188, -0.587310791015625, -0.5634841918945312, -0.5396575927734375, -0.5158309936523438, -0.49200439453125, -0.46817779541015625, -0.4443511962890625, -0.42052459716796875, -0.396697998046875, -0.37287139892578125, -0.3490447998046875, -0.32521820068359375, -0.3013916015625, -0.27756500244140625, -0.2537384033203125, -0.22991180419921875, -0.206085205078125, -0.18225860595703125, -0.1584320068359375, -0.13460540771484375, -0.11077880859375, -0.08695220947265625, -0.0631256103515625, -0.03929901123046875, -0.015472412109375, 0.00835418701171875, 0.0321807861328125, 0.05600738525390625, 0.079833984375, 0.10366058349609375, 0.1274871826171875, 0.15131378173828125, 0.175140380859375, 0.19896697998046875, 0.2227935791015625, 0.24662017822265625, 0.27044677734375, 0.29427337646484375, 0.3180999755859375, 0.34192657470703125, 0.365753173828125, 0.38957977294921875, 0.4134063720703125, 0.43723297119140625, 0.4610595703125, 0.48488616943359375, 0.5087127685546875, 0.5325393676757812, 0.556365966796875, 0.5801925659179688, 0.6040191650390625, 0.6278457641601562, 0.65167236328125, 0.6754989624023438, 0.6993255615234375, 0.7231521606445312, 0.746978759765625, 0.7708053588867188, 0.7946319580078125, 0.8184585571289062, 0.84228515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 11.0, 5.0, 3.0, 8.0, 6.0, 20.0, 22.0, 18.0, 36.0, 33.0, 36.0, 40.0, 42.0, 56.0, 53.0, 63.0, 65.0, 70.0, 74.0, 51.0, 53.0, 55.0, 37.0, 47.0, 25.0, 13.0, 18.0, 10.0, 8.0, 10.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3595390319824219, -0.34871673583984375, -0.3378944396972656, -0.3270721435546875, -0.3162498474121094, -0.30542755126953125, -0.2946052551269531, -0.283782958984375, -0.2729606628417969, -0.26213836669921875, -0.2513160705566406, -0.2404937744140625, -0.22967147827148438, -0.21884918212890625, -0.20802688598632812, -0.19720458984375, -0.18638229370117188, -0.17555999755859375, -0.16473770141601562, -0.1539154052734375, -0.14309310913085938, -0.13227081298828125, -0.12144851684570312, -0.110626220703125, -0.09980392456054688, -0.08898162841796875, -0.07815933227539062, -0.0673370361328125, -0.056514739990234375, -0.04569244384765625, -0.034870147705078125, -0.0240478515625, -0.013225555419921875, -0.00240325927734375, 0.008419036865234375, 0.0192413330078125, 0.030063629150390625, 0.04088592529296875, 0.051708221435546875, 0.062530517578125, 0.07335281372070312, 0.08417510986328125, 0.09499740600585938, 0.1058197021484375, 0.11664199829101562, 0.12746429443359375, 0.13828659057617188, 0.14910888671875, 0.15993118286132812, 0.17075347900390625, 0.18157577514648438, 0.1923980712890625, 0.20322036743164062, 0.21404266357421875, 0.22486495971679688, 0.235687255859375, 0.24650955200195312, 0.25733184814453125, 0.2681541442871094, 0.2789764404296875, 0.2897987365722656, 0.30062103271484375, 0.3114433288574219, 0.322265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 14.0, 21.0, 28.0, 28.0, 60.0, 116.0, 174.0, 354.0, 801.0, 2048.0, 6818.0, 41918.0, 3486077.0, 627117.0, 21514.0, 4472.0, 1479.0, 618.0, 235.0, 146.0, 84.0, 59.0, 23.0, 17.0, 11.0, 9.0, 12.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.076171875, -1.046966552734375, -1.01776123046875, -0.988555908203125, -0.9593505859375, -0.930145263671875, -0.90093994140625, -0.871734619140625, -0.842529296875, -0.813323974609375, -0.78411865234375, -0.754913330078125, -0.7257080078125, -0.696502685546875, -0.66729736328125, -0.638092041015625, -0.60888671875, -0.579681396484375, -0.55047607421875, -0.521270751953125, -0.4920654296875, -0.462860107421875, -0.43365478515625, -0.404449462890625, -0.375244140625, -0.346038818359375, -0.31683349609375, -0.287628173828125, -0.2584228515625, -0.229217529296875, -0.20001220703125, -0.170806884765625, -0.1416015625, -0.112396240234375, -0.08319091796875, -0.053985595703125, -0.0247802734375, 0.004425048828125, 0.03363037109375, 0.062835693359375, 0.092041015625, 0.121246337890625, 0.15045166015625, 0.179656982421875, 0.2088623046875, 0.238067626953125, 0.26727294921875, 0.296478271484375, 0.32568359375, 0.354888916015625, 0.38409423828125, 0.413299560546875, 0.4425048828125, 0.471710205078125, 0.50091552734375, 0.530120849609375, 0.559326171875, 0.588531494140625, 0.61773681640625, 0.646942138671875, 0.6761474609375, 0.705352783203125, 0.73455810546875, 0.763763427734375, 0.79296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 13.0, 13.0, 19.0, 21.0, 32.0, 62.0, 141.0, 290.0, 764.0, 1202.0, 791.0, 330.0, 155.0, 85.0, 39.0, 28.0, 35.0, 10.0, 9.0, 11.0, 1.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.1463298797607422, -0.13921737670898438, -0.13210487365722656, -0.12499237060546875, -0.11787986755371094, -0.11076736450195312, -0.10365486145019531, -0.0965423583984375, -0.08942985534667969, -0.08231735229492188, -0.07520484924316406, -0.06809234619140625, -0.06097984313964844, -0.053867340087890625, -0.04675483703613281, -0.039642333984375, -0.03252983093261719, -0.025417327880859375, -0.018304824829101562, -0.01119232177734375, -0.0040798187255859375, 0.003032684326171875, 0.010145187377929688, 0.0172576904296875, 0.024370193481445312, 0.031482696533203125, 0.03859519958496094, 0.04570770263671875, 0.05282020568847656, 0.059932708740234375, 0.06704521179199219, 0.07415771484375, 0.08127021789550781, 0.08838272094726562, 0.09549522399902344, 0.10260772705078125, 0.10972023010253906, 0.11683273315429688, 0.12394523620605469, 0.1310577392578125, 0.1381702423095703, 0.14528274536132812, 0.15239524841308594, 0.15950775146484375, 0.16662025451660156, 0.17373275756835938, 0.1808452606201172, 0.187957763671875, 0.1950702667236328, 0.20218276977539062, 0.20929527282714844, 0.21640777587890625, 0.22352027893066406, 0.23063278198242188, 0.2377452850341797, 0.2448577880859375, 0.2519702911376953, 0.2590827941894531, 0.26619529724121094, 0.27330780029296875, 0.28042030334472656, 0.2875328063964844, 0.2946453094482422, 0.3017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 12.0, 37.0, 76.0, 108.0, 170.0, 216.0, 152.0, 95.0, 48.0, 36.0, 14.0, 15.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3474003076553345, -1.3131623268127441, -1.2789243459701538, -1.2446863651275635, -1.2104483842849731, -1.1762104034423828, -1.1419724225997925, -1.1077344417572021, -1.0734963417053223, -1.039258360862732, -1.0050203800201416, -0.9707823991775513, -0.9365444183349609, -0.9023064374923706, -0.8680683970451355, -0.8338304162025452, -0.7995924949645996, -0.7653545141220093, -0.731116533279419, -0.6968785524368286, -0.6626405715942383, -0.628402590751648, -0.5941645503044128, -0.5599265694618225, -0.5256885886192322, -0.49145060777664185, -0.4572126269340515, -0.4229746162891388, -0.38873663544654846, -0.35449865460395813, -0.3202606439590454, -0.2860226631164551, -0.2517847418785095, -0.2175467610359192, -0.18330876529216766, -0.14907076954841614, -0.1148327887058258, -0.08059480786323547, -0.04635681211948395, -0.012118816375732422, 0.02211916446685791, 0.05635715276002884, 0.09059514105319977, 0.1248331293463707, 0.15907111763954163, 0.19330909848213196, 0.22754709422588348, 0.261785089969635, 0.29602307081222534, 0.3302610516548157, 0.364499032497406, 0.3987370431423187, 0.43297502398490906, 0.4672130048274994, 0.5014510154724121, 0.5356889963150024, 0.5699269771575928, 0.6041649580001831, 0.6384029388427734, 0.6726409196853638, 0.7068789005279541, 0.7411168813705444, 0.7753549218177795, 0.8095929026603699, 0.8438308835029602]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 12.0, 17.0, 12.0, 11.0, 26.0, 20.0, 22.0, 27.0, 26.0, 28.0, 33.0, 38.0, 44.0, 33.0, 43.0, 51.0, 39.0, 52.0, 44.0, 42.0, 51.0, 30.0, 32.0, 45.0, 45.0, 25.0, 20.0, 23.0, 21.0, 20.0, 14.0, 14.0, 5.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3229515254497528, -0.31225916743278503, -0.3015667796134949, -0.2908744215965271, -0.2801820635795593, -0.26948967576026917, -0.2587973177433014, -0.24810494482517242, -0.23741257190704346, -0.2267201989889145, -0.21602782607078552, -0.20533546805381775, -0.19464309513568878, -0.18395072221755981, -0.17325836420059204, -0.16256599128246307, -0.1518736183643341, -0.14118124544620514, -0.13048887252807617, -0.1197965145111084, -0.10910414159297943, -0.09841176867485046, -0.0877194032073021, -0.07702703773975372, -0.06633466482162476, -0.05564229562878609, -0.04494992643594742, -0.03425755724310875, -0.02356518805027008, -0.012872818857431412, -0.002180449664592743, 0.008511915802955627, 0.019204288721084595, 0.029896657913923264, 0.04058902710676193, 0.0512813962996006, 0.06197376549243927, 0.07266613841056824, 0.08335850387811661, 0.09405086934566498, 0.10474324226379395, 0.11543561518192291, 0.12612798810005188, 0.13682034611701965, 0.14751271903514862, 0.1582050919532776, 0.16889744997024536, 0.17958982288837433, 0.1902821958065033, 0.20097456872463226, 0.21166694164276123, 0.222359299659729, 0.23305167257785797, 0.24374404549598694, 0.2544364035129547, 0.2651287913322449, 0.27582114934921265, 0.2865135073661804, 0.2972058951854706, 0.30789825320243835, 0.3185906410217285, 0.3292829990386963, 0.33997535705566406, 0.35066771507263184, 0.361360102891922]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 9.0, 9.0, 19.0, 21.0, 25.0, 34.0, 57.0, 116.0, 186.0, 384.0, 750.0, 1617.0, 3582.0, 9799.0, 36458.0, 391295.0, 539358.0, 45711.0, 11466.0, 4125.0, 1749.0, 838.0, 388.0, 217.0, 139.0, 69.0, 39.0, 33.0, 19.0, 14.0, 9.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.25806427001953125, -0.2502593994140625, -0.24245452880859375, -0.234649658203125, -0.22684478759765625, -0.2190399169921875, -0.21123504638671875, -0.20343017578125, -0.19562530517578125, -0.1878204345703125, -0.18001556396484375, -0.172210693359375, -0.16440582275390625, -0.1566009521484375, -0.14879608154296875, -0.1409912109375, -0.13318634033203125, -0.1253814697265625, -0.11757659912109375, -0.109771728515625, -0.10196685791015625, -0.0941619873046875, -0.08635711669921875, -0.07855224609375, -0.07074737548828125, -0.0629425048828125, -0.05513763427734375, -0.047332763671875, -0.03952789306640625, -0.0317230224609375, -0.02391815185546875, -0.01611328125, -0.00830841064453125, -0.0005035400390625, 0.00730133056640625, 0.015106201171875, 0.02291107177734375, 0.0307159423828125, 0.03852081298828125, 0.04632568359375, 0.05413055419921875, 0.0619354248046875, 0.06974029541015625, 0.077545166015625, 0.08535003662109375, 0.0931549072265625, 0.10095977783203125, 0.1087646484375, 0.11656951904296875, 0.1243743896484375, 0.13217926025390625, 0.139984130859375, 0.14778900146484375, 0.1555938720703125, 0.16339874267578125, 0.17120361328125, 0.17900848388671875, 0.1868133544921875, 0.19461822509765625, 0.202423095703125, 0.21022796630859375, 0.2180328369140625, 0.22583770751953125, 0.233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 5.0, 12.0, 22.0, 18.0, 20.0, 20.0, 19.0, 31.0, 34.0, 39.0, 32.0, 46.0, 37.0, 42.0, 52.0, 41.0, 46.0, 53.0, 50.0, 31.0, 29.0, 45.0, 35.0, 39.0, 37.0, 15.0, 22.0, 23.0, 15.0, 17.0, 13.0, 15.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22100448608398438, -0.21361541748046875, -0.20622634887695312, -0.1988372802734375, -0.19144821166992188, -0.18405914306640625, -0.17667007446289062, -0.169281005859375, -0.16189193725585938, -0.15450286865234375, -0.14711380004882812, -0.1397247314453125, -0.13233566284179688, -0.12494659423828125, -0.11755752563476562, -0.11016845703125, -0.10277938842773438, -0.09539031982421875, -0.08800125122070312, -0.0806121826171875, -0.07322311401367188, -0.06583404541015625, -0.058444976806640625, -0.051055908203125, -0.043666839599609375, -0.03627777099609375, -0.028888702392578125, -0.0214996337890625, -0.014110565185546875, -0.00672149658203125, 0.000667572021484375, 0.008056640625, 0.015445709228515625, 0.02283477783203125, 0.030223846435546875, 0.0376129150390625, 0.045001983642578125, 0.05239105224609375, 0.059780120849609375, 0.067169189453125, 0.07455825805664062, 0.08194732666015625, 0.08933639526367188, 0.0967254638671875, 0.10411453247070312, 0.11150360107421875, 0.11889266967773438, 0.12628173828125, 0.13367080688476562, 0.14105987548828125, 0.14844894409179688, 0.1558380126953125, 0.16322708129882812, 0.17061614990234375, 0.17800521850585938, 0.185394287109375, 0.19278335571289062, 0.20017242431640625, 0.20756149291992188, 0.2149505615234375, 0.22233963012695312, 0.22972869873046875, 0.23711776733398438, 0.2445068359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 20.0, 28.0, 37.0, 68.0, 85.0, 120.0, 170.0, 279.0, 448.0, 691.0, 1181.0, 1945.0, 3568.0, 6779.0, 14572.0, 35874.0, 114657.0, 422093.0, 312213.0, 81087.0, 27549.0, 11791.0, 5752.0, 3030.0, 1722.0, 1043.0, 618.0, 391.0, 225.0, 150.0, 128.0, 75.0, 53.0, 30.0, 16.0, 14.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09893798828125, -0.09583282470703125, -0.0927276611328125, -0.08962249755859375, -0.086517333984375, -0.08341217041015625, -0.0803070068359375, -0.07720184326171875, -0.0740966796875, -0.07099151611328125, -0.0678863525390625, -0.06478118896484375, -0.061676025390625, -0.05857086181640625, -0.0554656982421875, -0.05236053466796875, -0.04925537109375, -0.04615020751953125, -0.0430450439453125, -0.03993988037109375, -0.036834716796875, -0.03372955322265625, -0.0306243896484375, -0.02751922607421875, -0.0244140625, -0.02130889892578125, -0.0182037353515625, -0.01509857177734375, -0.011993408203125, -0.00888824462890625, -0.0057830810546875, -0.00267791748046875, 0.00042724609375, 0.00353240966796875, 0.0066375732421875, 0.00974273681640625, 0.012847900390625, 0.01595306396484375, 0.0190582275390625, 0.02216339111328125, 0.0252685546875, 0.02837371826171875, 0.0314788818359375, 0.03458404541015625, 0.037689208984375, 0.04079437255859375, 0.0438995361328125, 0.04700469970703125, 0.05010986328125, 0.05321502685546875, 0.0563201904296875, 0.05942535400390625, 0.062530517578125, 0.06563568115234375, 0.0687408447265625, 0.07184600830078125, 0.074951171875, 0.07805633544921875, 0.0811614990234375, 0.08426666259765625, 0.087371826171875, 0.09047698974609375, 0.0935821533203125, 0.09668731689453125, 0.09979248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 5.0, 5.0, 13.0, 22.0, 14.0, 29.0, 25.0, 31.0, 25.0, 28.0, 41.0, 46.0, 59.0, 49.0, 62.0, 52.0, 55.0, 48.0, 55.0, 41.0, 34.0, 32.0, 32.0, 32.0, 37.0, 23.0, 12.0, 15.0, 9.0, 13.0, 9.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5111312866210938, -0.4944305419921875, -0.47772979736328125, -0.461029052734375, -0.44432830810546875, -0.4276275634765625, -0.41092681884765625, -0.39422607421875, -0.37752532958984375, -0.3608245849609375, -0.34412384033203125, -0.327423095703125, -0.31072235107421875, -0.2940216064453125, -0.27732086181640625, -0.2606201171875, -0.24391937255859375, -0.2272186279296875, -0.21051788330078125, -0.193817138671875, -0.17711639404296875, -0.1604156494140625, -0.14371490478515625, -0.12701416015625, -0.11031341552734375, -0.0936126708984375, -0.07691192626953125, -0.060211181640625, -0.04351043701171875, -0.0268096923828125, -0.01010894775390625, 0.006591796875, 0.02329254150390625, 0.0399932861328125, 0.05669403076171875, 0.073394775390625, 0.09009552001953125, 0.1067962646484375, 0.12349700927734375, 0.14019775390625, 0.15689849853515625, 0.1735992431640625, 0.19029998779296875, 0.207000732421875, 0.22370147705078125, 0.2404022216796875, 0.25710296630859375, 0.2738037109375, 0.29050445556640625, 0.3072052001953125, 0.32390594482421875, 0.340606689453125, 0.35730743408203125, 0.3740081787109375, 0.39070892333984375, 0.40740966796875, 0.42411041259765625, 0.4408111572265625, 0.45751190185546875, 0.474212646484375, 0.49091339111328125, 0.5076141357421875, 0.5243148803710938, 0.541015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 5.0, 12.0, 10.0, 25.0, 27.0, 75.0, 99.0, 182.0, 334.0, 607.0, 1370.0, 3362.0, 9684.0, 35866.0, 181399.0, 567005.0, 194186.0, 37909.0, 10132.0, 3474.0, 1347.0, 643.0, 345.0, 188.0, 100.0, 53.0, 42.0, 22.0, 19.0, 12.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.023247480392456055, -0.02237081527709961, -0.021494150161743164, -0.02061748504638672, -0.019740819931030273, -0.018864154815673828, -0.017987489700317383, -0.017110824584960938, -0.016234159469604492, -0.015357494354248047, -0.014480829238891602, -0.013604164123535156, -0.012727499008178711, -0.011850833892822266, -0.01097416877746582, -0.010097503662109375, -0.00922083854675293, -0.008344173431396484, -0.007467508316040039, -0.006590843200683594, -0.0057141780853271484, -0.004837512969970703, -0.003960847854614258, -0.0030841827392578125, -0.002207517623901367, -0.0013308525085449219, -0.00045418739318847656, 0.00042247772216796875, 0.001299142837524414, 0.0021758079528808594, 0.0030524730682373047, 0.00392913818359375, 0.004805803298950195, 0.005682468414306641, 0.006559133529663086, 0.007435798645019531, 0.008312463760375977, 0.009189128875732422, 0.010065793991088867, 0.010942459106445312, 0.011819124221801758, 0.012695789337158203, 0.013572454452514648, 0.014449119567871094, 0.015325784683227539, 0.016202449798583984, 0.01707911491394043, 0.017955780029296875, 0.01883244514465332, 0.019709110260009766, 0.02058577537536621, 0.021462440490722656, 0.0223391056060791, 0.023215770721435547, 0.024092435836791992, 0.024969100952148438, 0.025845766067504883, 0.026722431182861328, 0.027599096298217773, 0.02847576141357422, 0.029352426528930664, 0.03022909164428711, 0.031105756759643555, 0.031982421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 10.0, 9.0, 16.0, 11.0, 27.0, 29.0, 36.0, 61.0, 42.0, 83.0, 82.0, 107.0, 83.0, 84.0, 67.0, 66.0, 41.0, 38.0, 21.0, 22.0, 18.0, 6.0, 8.0, 3.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0398216545581818e-05, -1.0007992386817932e-05, -9.617768228054047e-06, -9.227544069290161e-06, -8.837319910526276e-06, -8.44709575176239e-06, -8.056871592998505e-06, -7.666647434234619e-06, -7.276423275470734e-06, -6.886199116706848e-06, -6.495974957942963e-06, -6.105750799179077e-06, -5.715526640415192e-06, -5.325302481651306e-06, -4.935078322887421e-06, -4.544854164123535e-06, -4.15463000535965e-06, -3.764405846595764e-06, -3.3741816878318787e-06, -2.983957529067993e-06, -2.5937333703041077e-06, -2.203509211540222e-06, -1.8132850527763367e-06, -1.4230608940124512e-06, -1.0328367352485657e-06, -6.426125764846802e-07, -2.523884177207947e-07, 1.3783574104309082e-07, 5.280598998069763e-07, 9.182840585708618e-07, 1.3085082173347473e-06, 1.6987323760986328e-06, 2.0889565348625183e-06, 2.479180693626404e-06, 2.8694048523902893e-06, 3.259629011154175e-06, 3.6498531699180603e-06, 4.040077328681946e-06, 4.430301487445831e-06, 4.820525646209717e-06, 5.210749804973602e-06, 5.600973963737488e-06, 5.991198122501373e-06, 6.381422281265259e-06, 6.771646440029144e-06, 7.16187059879303e-06, 7.552094757556915e-06, 7.9423189163208e-06, 8.332543075084686e-06, 8.722767233848572e-06, 9.112991392612457e-06, 9.503215551376343e-06, 9.893439710140228e-06, 1.0283663868904114e-05, 1.0673888027668e-05, 1.1064112186431885e-05, 1.145433634519577e-05, 1.1844560503959656e-05, 1.2234784662723541e-05, 1.2625008821487427e-05, 1.3015232980251312e-05, 1.3405457139015198e-05, 1.3795681297779083e-05, 1.4185905456542969e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 9.0, 19.0, 29.0, 38.0, 62.0, 78.0, 104.0, 197.0, 279.0, 495.0, 903.0, 1738.0, 3275.0, 7195.0, 16942.0, 45026.0, 129020.0, 318710.0, 319082.0, 128580.0, 45373.0, 16915.0, 7134.0, 3276.0, 1751.0, 878.0, 533.0, 297.0, 205.0, 120.0, 83.0, 57.0, 41.0, 20.0, 26.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204010009765625, -0.019763469696044922, -0.019125938415527344, -0.018488407135009766, -0.017850875854492188, -0.01721334457397461, -0.01657581329345703, -0.015938282012939453, -0.015300750732421875, -0.014663219451904297, -0.014025688171386719, -0.01338815689086914, -0.012750625610351562, -0.012113094329833984, -0.011475563049316406, -0.010838031768798828, -0.01020050048828125, -0.009562969207763672, -0.008925437927246094, -0.008287906646728516, -0.0076503753662109375, -0.007012844085693359, -0.006375312805175781, -0.005737781524658203, -0.005100250244140625, -0.004462718963623047, -0.0038251876831054688, -0.0031876564025878906, -0.0025501251220703125, -0.0019125938415527344, -0.0012750625610351562, -0.0006375312805175781, 0.0, 0.0006375312805175781, 0.0012750625610351562, 0.0019125938415527344, 0.0025501251220703125, 0.0031876564025878906, 0.0038251876831054688, 0.004462718963623047, 0.005100250244140625, 0.005737781524658203, 0.006375312805175781, 0.007012844085693359, 0.0076503753662109375, 0.008287906646728516, 0.008925437927246094, 0.009562969207763672, 0.01020050048828125, 0.010838031768798828, 0.011475563049316406, 0.012113094329833984, 0.012750625610351562, 0.01338815689086914, 0.014025688171386719, 0.014663219451904297, 0.015300750732421875, 0.015938282012939453, 0.01657581329345703, 0.01721334457397461, 0.017850875854492188, 0.018488407135009766, 0.019125938415527344, 0.019763469696044922, 0.0204010009765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 4.0, 7.0, 8.0, 12.0, 18.0, 13.0, 18.0, 23.0, 13.0, 29.0, 31.0, 42.0, 44.0, 39.0, 55.0, 47.0, 53.0, 60.0, 49.0, 59.0, 27.0, 56.0, 39.0, 38.0, 23.0, 24.0, 31.0, 18.0, 16.0, 23.0, 15.0, 15.0, 7.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005664825439453125, -0.005479335784912109, -0.005293846130371094, -0.005108356475830078, -0.0049228668212890625, -0.004737377166748047, -0.004551887512207031, -0.004366397857666016, -0.004180908203125, -0.003995418548583984, -0.0038099288940429688, -0.003624439239501953, -0.0034389495849609375, -0.003253459930419922, -0.0030679702758789062, -0.0028824806213378906, -0.002696990966796875, -0.0025115013122558594, -0.0023260116577148438, -0.002140522003173828, -0.0019550323486328125, -0.0017695426940917969, -0.0015840530395507812, -0.0013985633850097656, -0.00121307373046875, -0.0010275840759277344, -0.0008420944213867188, -0.0006566047668457031, -0.0004711151123046875, -0.0002856254577636719, -0.00010013580322265625, 8.535385131835938e-05, 0.000270843505859375, 0.0004563331604003906, 0.0006418228149414062, 0.0008273124694824219, 0.0010128021240234375, 0.0011982917785644531, 0.0013837814331054688, 0.0015692710876464844, 0.0017547607421875, 0.0019402503967285156, 0.0021257400512695312, 0.002311229705810547, 0.0024967193603515625, 0.002682209014892578, 0.0028676986694335938, 0.0030531883239746094, 0.003238677978515625, 0.0034241676330566406, 0.0036096572875976562, 0.003795146942138672, 0.0039806365966796875, 0.004166126251220703, 0.004351615905761719, 0.004537105560302734, 0.00472259521484375, 0.004908084869384766, 0.005093574523925781, 0.005279064178466797, 0.0054645538330078125, 0.005650043487548828, 0.005835533142089844, 0.006021022796630859, 0.006206512451171875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 8.0, 13.0, 29.0, 49.0, 80.0, 137.0, 202.0, 185.0, 124.0, 74.0, 37.0, 16.0, 19.0, 11.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7547540664672852, -0.7331125736236572, -0.7114710807800293, -0.6898295879364014, -0.6681880950927734, -0.6465466022491455, -0.6249051094055176, -0.6032635569572449, -0.5816220641136169, -0.559980571269989, -0.5383390784263611, -0.5166975855827332, -0.49505606293678284, -0.4734145700931549, -0.451773077249527, -0.43013155460357666, -0.4084900915622711, -0.3868485987186432, -0.36520710587501526, -0.34356558322906494, -0.321924090385437, -0.3002825975418091, -0.27864110469818115, -0.2569996118545532, -0.2353581041097641, -0.21371661126613617, -0.19207510352134705, -0.17043361067771912, -0.1487921178340912, -0.12715061008930206, -0.10550911724567413, -0.08386760950088501, -0.06222611665725708, -0.04058461636304855, -0.018943119794130325, 0.002698376774787903, 0.02433987706899643, 0.045981377363204956, 0.06762287020683289, 0.08926437795162201, 0.11090587079524994, 0.13254736363887787, 0.154188871383667, 0.17583036422729492, 0.19747185707092285, 0.21911336481571198, 0.2407548576593399, 0.26239636540412903, 0.28403785824775696, 0.3056793510913849, 0.3273208439350128, 0.34896236658096313, 0.37060385942459106, 0.392245352268219, 0.4138868451118469, 0.43552833795547485, 0.4571698307991028, 0.4788113236427307, 0.5004528164863586, 0.5220943093299866, 0.5437358021736145, 0.5653773546218872, 0.5870188474655151, 0.6086603403091431, 0.630301833152771]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 13.0, 13.0, 10.0, 13.0, 16.0, 23.0, 20.0, 26.0, 21.0, 28.0, 41.0, 39.0, 40.0, 36.0, 38.0, 48.0, 36.0, 49.0, 45.0, 56.0, 44.0, 32.0, 43.0, 37.0, 47.0, 24.0, 20.0, 31.0, 21.0, 21.0, 14.0, 15.0, 8.0, 6.0, 5.0, 2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22479639947414398, -0.21756847202777863, -0.21034054458141327, -0.2031126171350479, -0.19588468968868256, -0.1886567622423172, -0.18142881989479065, -0.1742008924484253, -0.16697296500205994, -0.15974503755569458, -0.15251711010932922, -0.14528918266296387, -0.1380612552165985, -0.13083332777023315, -0.1236053928732872, -0.11637746542692184, -0.10914954543113708, -0.10192161798477173, -0.09469369053840637, -0.08746576309204102, -0.08023783564567566, -0.0730099081993103, -0.06578197330236435, -0.05855404585599899, -0.051326118409633636, -0.04409819096326828, -0.036870263516902924, -0.02964233234524727, -0.022414404898881912, -0.015186477452516556, -0.007958546280860901, -0.0007306188344955444, 0.006497308611869812, 0.013725236989557743, 0.020953165367245674, 0.02818109467625618, 0.035409022122621536, 0.04263694956898689, 0.04986488074064255, 0.057092808187007904, 0.06432073563337326, 0.07154866307973862, 0.07877659052610397, 0.08600452542304993, 0.09323245286941528, 0.10046038031578064, 0.107688307762146, 0.11491623520851135, 0.12214416265487671, 0.12937209010124207, 0.13660001754760742, 0.14382794499397278, 0.15105587244033813, 0.1582837998867035, 0.16551172733306885, 0.1727396547794342, 0.17996758222579956, 0.18719550967216492, 0.19442343711853027, 0.20165136456489563, 0.208879292011261, 0.21610721945762634, 0.2233351469039917, 0.23056307435035706, 0.2377910166978836]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 18.0, 8.0, 20.0, 31.0, 31.0, 45.0, 80.0, 112.0, 152.0, 240.0, 400.0, 767.0, 1277.0, 2590.0, 7216.0, 26726.0, 163875.0, 704753.0, 109247.0, 19914.0, 5934.0, 2303.0, 1104.0, 628.0, 356.0, 244.0, 157.0, 96.0, 50.0, 48.0, 35.0, 27.0, 19.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29833984375, -0.28745269775390625, -0.2765655517578125, -0.26567840576171875, -0.254791259765625, -0.24390411376953125, -0.2330169677734375, -0.22212982177734375, -0.21124267578125, -0.20035552978515625, -0.1894683837890625, -0.17858123779296875, -0.167694091796875, -0.15680694580078125, -0.1459197998046875, -0.13503265380859375, -0.1241455078125, -0.11325836181640625, -0.1023712158203125, -0.09148406982421875, -0.080596923828125, -0.06970977783203125, -0.0588226318359375, -0.04793548583984375, -0.03704833984375, -0.02616119384765625, -0.0152740478515625, -0.00438690185546875, 0.006500244140625, 0.01738739013671875, 0.0282745361328125, 0.03916168212890625, 0.050048828125, 0.06093597412109375, 0.0718231201171875, 0.08271026611328125, 0.093597412109375, 0.10448455810546875, 0.1153717041015625, 0.12625885009765625, 0.13714599609375, 0.14803314208984375, 0.1589202880859375, 0.16980743408203125, 0.180694580078125, 0.19158172607421875, 0.2024688720703125, 0.21335601806640625, 0.2242431640625, 0.23513031005859375, 0.2460174560546875, 0.25690460205078125, 0.267791748046875, 0.27867889404296875, 0.2895660400390625, 0.30045318603515625, 0.31134033203125, 0.32222747802734375, 0.3331146240234375, 0.34400177001953125, 0.354888916015625, 0.36577606201171875, 0.3766632080078125, 0.38755035400390625, 0.3984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 10.0, 14.0, 9.0, 16.0, 12.0, 29.0, 20.0, 38.0, 33.0, 52.0, 38.0, 50.0, 53.0, 51.0, 53.0, 40.0, 47.0, 58.0, 56.0, 48.0, 43.0, 37.0, 26.0, 35.0, 26.0, 21.0, 14.0, 17.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43991851806640625, -0.4242706298828125, -0.40862274169921875, -0.392974853515625, -0.37732696533203125, -0.3616790771484375, -0.34603118896484375, -0.33038330078125, -0.31473541259765625, -0.2990875244140625, -0.28343963623046875, -0.267791748046875, -0.25214385986328125, -0.2364959716796875, -0.22084808349609375, -0.2052001953125, -0.18955230712890625, -0.1739044189453125, -0.15825653076171875, -0.142608642578125, -0.12696075439453125, -0.1113128662109375, -0.09566497802734375, -0.08001708984375, -0.06436920166015625, -0.0487213134765625, -0.03307342529296875, -0.017425537109375, -0.00177764892578125, 0.0138702392578125, 0.02951812744140625, 0.045166015625, 0.06081390380859375, 0.0764617919921875, 0.09210968017578125, 0.107757568359375, 0.12340545654296875, 0.1390533447265625, 0.15470123291015625, 0.17034912109375, 0.18599700927734375, 0.2016448974609375, 0.21729278564453125, 0.232940673828125, 0.24858856201171875, 0.2642364501953125, 0.27988433837890625, 0.2955322265625, 0.31118011474609375, 0.3268280029296875, 0.34247589111328125, 0.358123779296875, 0.37377166748046875, 0.3894195556640625, 0.40506744384765625, 0.42071533203125, 0.43636322021484375, 0.4520111083984375, 0.46765899658203125, 0.483306884765625, 0.49895477294921875, 0.5146026611328125, 0.5302505493164062, 0.5458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 6.0, 15.0, 9.0, 11.0, 17.0, 29.0, 30.0, 43.0, 50.0, 112.0, 236.0, 646.0, 3289.0, 110254.0, 923446.0, 8400.0, 1210.0, 341.0, 138.0, 72.0, 39.0, 33.0, 26.0, 28.0, 13.0, 14.0, 9.0, 8.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3251953125, -1.2895736694335938, -1.2539520263671875, -1.2183303833007812, -1.182708740234375, -1.1470870971679688, -1.1114654541015625, -1.0758438110351562, -1.04022216796875, -1.0046005249023438, -0.9689788818359375, -0.9333572387695312, -0.897735595703125, -0.8621139526367188, -0.8264923095703125, -0.7908706665039062, -0.7552490234375, -0.7196273803710938, -0.6840057373046875, -0.6483840942382812, -0.612762451171875, -0.5771408081054688, -0.5415191650390625, -0.5058975219726562, -0.47027587890625, -0.43465423583984375, -0.3990325927734375, -0.36341094970703125, -0.327789306640625, -0.29216766357421875, -0.2565460205078125, -0.22092437744140625, -0.185302734375, -0.14968109130859375, -0.1140594482421875, -0.07843780517578125, -0.042816162109375, -0.00719451904296875, 0.0284271240234375, 0.06404876708984375, 0.09967041015625, 0.13529205322265625, 0.1709136962890625, 0.20653533935546875, 0.242156982421875, 0.27777862548828125, 0.3134002685546875, 0.34902191162109375, 0.3846435546875, 0.42026519775390625, 0.4558868408203125, 0.49150848388671875, 0.527130126953125, 0.5627517700195312, 0.5983734130859375, 0.6339950561523438, 0.66961669921875, 0.7052383422851562, 0.7408599853515625, 0.7764816284179688, 0.812103271484375, 0.8477249145507812, 0.8833465576171875, 0.9189682006835938, 0.95458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 30.0, 31.0, 35.0, 30.0, 56.0, 54.0, 42.0, 52.0, 58.0, 63.0, 68.0, 63.0, 61.0, 55.0, 43.0, 24.0, 30.0, 27.0, 26.0, 18.0, 12.0, 11.0, 10.0, 11.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73046875, -0.7108688354492188, -0.6912689208984375, -0.6716690063476562, -0.652069091796875, -0.6324691772460938, -0.6128692626953125, -0.5932693481445312, -0.57366943359375, -0.5540695190429688, -0.5344696044921875, -0.5148696899414062, -0.495269775390625, -0.47566986083984375, -0.4560699462890625, -0.43647003173828125, -0.4168701171875, -0.39727020263671875, -0.3776702880859375, -0.35807037353515625, -0.338470458984375, -0.31887054443359375, -0.2992706298828125, -0.27967071533203125, -0.26007080078125, -0.24047088623046875, -0.2208709716796875, -0.20127105712890625, -0.181671142578125, -0.16207122802734375, -0.1424713134765625, -0.12287139892578125, -0.103271484375, -0.08367156982421875, -0.0640716552734375, -0.04447174072265625, -0.024871826171875, -0.00527191162109375, 0.0143280029296875, 0.03392791748046875, 0.05352783203125, 0.07312774658203125, 0.0927276611328125, 0.11232757568359375, 0.131927490234375, 0.15152740478515625, 0.1711273193359375, 0.19072723388671875, 0.2103271484375, 0.22992706298828125, 0.2495269775390625, 0.26912689208984375, 0.288726806640625, 0.30832672119140625, 0.3279266357421875, 0.34752655029296875, 0.36712646484375, 0.38672637939453125, 0.4063262939453125, 0.42592620849609375, 0.445526123046875, 0.46512603759765625, 0.4847259521484375, 0.5043258666992188, 0.52392578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 23.0, 21.0, 46.0, 63.0, 100.0, 177.0, 366.0, 776.0, 2459.0, 9830.0, 60643.0, 791727.0, 158488.0, 17575.0, 3980.0, 1181.0, 472.0, 204.0, 117.0, 71.0, 47.0, 29.0, 25.0, 14.0, 19.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1466064453125, -0.14225387573242188, -0.13790130615234375, -0.13354873657226562, -0.1291961669921875, -0.12484359741210938, -0.12049102783203125, -0.11613845825195312, -0.111785888671875, -0.10743331909179688, -0.10308074951171875, -0.09872817993164062, -0.0943756103515625, -0.09002304077148438, -0.08567047119140625, -0.08131790161132812, -0.07696533203125, -0.07261276245117188, -0.06826019287109375, -0.06390762329101562, -0.0595550537109375, -0.055202484130859375, -0.05084991455078125, -0.046497344970703125, -0.042144775390625, -0.037792205810546875, -0.03343963623046875, -0.029087066650390625, -0.0247344970703125, -0.020381927490234375, -0.01602935791015625, -0.011676788330078125, -0.00732421875, -0.002971649169921875, 0.00138092041015625, 0.005733489990234375, 0.0100860595703125, 0.014438629150390625, 0.01879119873046875, 0.023143768310546875, 0.027496337890625, 0.031848907470703125, 0.03620147705078125, 0.040554046630859375, 0.0449066162109375, 0.049259185791015625, 0.05361175537109375, 0.057964324951171875, 0.06231689453125, 0.06666946411132812, 0.07102203369140625, 0.07537460327148438, 0.0797271728515625, 0.08407974243164062, 0.08843231201171875, 0.09278488159179688, 0.097137451171875, 0.10149002075195312, 0.10584259033203125, 0.11019515991210938, 0.1145477294921875, 0.11890029907226562, 0.12325286865234375, 0.12760543823242188, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 10.0, 12.0, 23.0, 31.0, 41.0, 54.0, 72.0, 127.0, 144.0, 127.0, 100.0, 68.0, 46.0, 35.0, 23.0, 15.0, 18.0, 7.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7202459275722504e-05, -1.66427344083786e-05, -1.60830095410347e-05, -1.5523284673690796e-05, -1.4963559806346893e-05, -1.440383493900299e-05, -1.3844110071659088e-05, -1.3284385204315186e-05, -1.2724660336971283e-05, -1.216493546962738e-05, -1.1605210602283478e-05, -1.1045485734939575e-05, -1.0485760867595673e-05, -9.92603600025177e-06, -9.366311132907867e-06, -8.806586265563965e-06, -8.246861398220062e-06, -7.68713653087616e-06, -7.127411663532257e-06, -6.5676867961883545e-06, -6.007961928844452e-06, -5.448237061500549e-06, -4.888512194156647e-06, -4.328787326812744e-06, -3.7690624594688416e-06, -3.209337592124939e-06, -2.6496127247810364e-06, -2.089887857437134e-06, -1.5301629900932312e-06, -9.704381227493286e-07, -4.10713255405426e-07, 1.4901161193847656e-07, 7.087364792823792e-07, 1.2684613466262817e-06, 1.8281862139701843e-06, 2.387911081314087e-06, 2.9476359486579895e-06, 3.507360816001892e-06, 4.067085683345795e-06, 4.626810550689697e-06, 5.1865354180336e-06, 5.7462602853775024e-06, 6.305985152721405e-06, 6.865710020065308e-06, 7.42543488740921e-06, 7.985159754753113e-06, 8.544884622097015e-06, 9.104609489440918e-06, 9.66433435678482e-06, 1.0224059224128723e-05, 1.0783784091472626e-05, 1.1343508958816528e-05, 1.1903233826160431e-05, 1.2462958693504333e-05, 1.3022683560848236e-05, 1.3582408428192139e-05, 1.4142133295536041e-05, 1.4701858162879944e-05, 1.5261583030223846e-05, 1.582130789756775e-05, 1.638103276491165e-05, 1.6940757632255554e-05, 1.7500482499599457e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 16.0, 27.0, 44.0, 47.0, 63.0, 114.0, 168.0, 267.0, 492.0, 1093.0, 3180.0, 16029.0, 311102.0, 684747.0, 24267.0, 4068.0, 1328.0, 590.0, 329.0, 219.0, 134.0, 78.0, 58.0, 34.0, 12.0, 12.0, 4.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.224609375, -0.21871376037597656, -0.21281814575195312, -0.2069225311279297, -0.20102691650390625, -0.1951313018798828, -0.18923568725585938, -0.18334007263183594, -0.1774444580078125, -0.17154884338378906, -0.16565322875976562, -0.1597576141357422, -0.15386199951171875, -0.1479663848876953, -0.14207077026367188, -0.13617515563964844, -0.130279541015625, -0.12438392639160156, -0.11848831176757812, -0.11259269714355469, -0.10669708251953125, -0.10080146789550781, -0.09490585327148438, -0.08901023864746094, -0.0831146240234375, -0.07721900939941406, -0.07132339477539062, -0.06542778015136719, -0.05953216552734375, -0.05363655090332031, -0.047740936279296875, -0.04184532165527344, -0.03594970703125, -0.030054092407226562, -0.024158477783203125, -0.018262863159179688, -0.01236724853515625, -0.0064716339111328125, -0.000576019287109375, 0.0053195953369140625, 0.0112152099609375, 0.017110824584960938, 0.023006439208984375, 0.028902053833007812, 0.03479766845703125, 0.04069328308105469, 0.046588897705078125, 0.05248451232910156, 0.058380126953125, 0.06427574157714844, 0.07017135620117188, 0.07606697082519531, 0.08196258544921875, 0.08785820007324219, 0.09375381469726562, 0.09964942932128906, 0.1055450439453125, 0.11144065856933594, 0.11733627319335938, 0.12323188781738281, 0.12912750244140625, 0.1350231170654297, 0.14091873168945312, 0.14681434631347656, 0.1527099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 17.0, 19.0, 16.0, 22.0, 53.0, 72.0, 121.0, 192.0, 161.0, 110.0, 67.0, 51.0, 24.0, 19.0, 13.0, 16.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.051023006439208984, -0.04897594451904297, -0.04692888259887695, -0.04488182067871094, -0.04283475875854492, -0.040787696838378906, -0.03874063491821289, -0.036693572998046875, -0.03464651107788086, -0.032599449157714844, -0.030552387237548828, -0.028505325317382812, -0.026458263397216797, -0.02441120147705078, -0.022364139556884766, -0.02031707763671875, -0.018270015716552734, -0.01622295379638672, -0.014175891876220703, -0.012128829956054688, -0.010081768035888672, -0.008034706115722656, -0.005987644195556641, -0.003940582275390625, -0.0018935203552246094, 0.00015354156494140625, 0.002200603485107422, 0.0042476654052734375, 0.006294727325439453, 0.008341789245605469, 0.010388851165771484, 0.0124359130859375, 0.014482975006103516, 0.01653003692626953, 0.018577098846435547, 0.020624160766601562, 0.022671222686767578, 0.024718284606933594, 0.02676534652709961, 0.028812408447265625, 0.03085947036743164, 0.032906532287597656, 0.03495359420776367, 0.03700065612792969, 0.0390477180480957, 0.04109477996826172, 0.043141841888427734, 0.04518890380859375, 0.047235965728759766, 0.04928302764892578, 0.0513300895690918, 0.05337715148925781, 0.05542421340942383, 0.057471275329589844, 0.05951833724975586, 0.061565399169921875, 0.06361246109008789, 0.0656595230102539, 0.06770658493041992, 0.06975364685058594, 0.07180070877075195, 0.07384777069091797, 0.07589483261108398, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 14.0, 28.0, 24.0, 63.0, 90.0, 151.0, 158.0, 169.0, 114.0, 77.0, 36.0, 28.0, 15.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4249154329299927, -1.3880575895309448, -1.351199746131897, -1.3143419027328491, -1.2774841785430908, -1.240626335144043, -1.2037684917449951, -1.1669106483459473, -1.1300528049468994, -1.0931949615478516, -1.0563371181488037, -1.0194792747497559, -0.9826214909553528, -0.9457636475563049, -0.9089058637619019, -0.872048020362854, -0.8351901769638062, -0.7983323335647583, -0.7614744901657104, -0.7246167063713074, -0.6877588629722595, -0.6509010195732117, -0.6140432357788086, -0.5771853923797607, -0.5403275489807129, -0.503469705581665, -0.4666118919849396, -0.4297540783882141, -0.39289623498916626, -0.3560383915901184, -0.31918057799339294, -0.2823227643966675, -0.24546504020690918, -0.20860721170902252, -0.17174938321113586, -0.1348915547132492, -0.09803372621536255, -0.06117589771747589, -0.024318069219589233, 0.01253974437713623, 0.04939758777618408, 0.08625541627407074, 0.1231132447719574, 0.15997107326984406, 0.1968289017677307, 0.23368673026561737, 0.27054455876350403, 0.3074023723602295, 0.34426021575927734, 0.3811180591583252, 0.41797587275505066, 0.4548336863517761, 0.491691529750824, 0.5285493731498718, 0.5654071569442749, 0.6022650003433228, 0.6391228437423706, 0.6759806871414185, 0.7128385305404663, 0.7496963143348694, 0.7865541577339172, 0.8234120011329651, 0.8602697849273682, 0.897127628326416, 0.9339854717254639]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 13.0, 20.0, 12.0, 15.0, 13.0, 14.0, 21.0, 35.0, 37.0, 23.0, 30.0, 29.0, 38.0, 39.0, 41.0, 41.0, 42.0, 36.0, 36.0, 43.0, 34.0, 35.0, 44.0, 37.0, 30.0, 26.0, 32.0, 33.0, 19.0, 13.0, 18.0, 15.0, 21.0, 6.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8621527552604675, -0.8366901874542236, -0.8112276196479797, -0.7857650518417358, -0.7603024840354919, -0.734839916229248, -0.7093773484230042, -0.6839147806167603, -0.6584522128105164, -0.6329896450042725, -0.6075270771980286, -0.5820645093917847, -0.5566019415855408, -0.5311393737792969, -0.505676805973053, -0.4802142381668091, -0.4547517001628876, -0.4292891323566437, -0.4038265645503998, -0.3783639967441559, -0.352901428937912, -0.3274388909339905, -0.3019763231277466, -0.2765137553215027, -0.2510511875152588, -0.2255886197090149, -0.200126051902771, -0.1746634840965271, -0.1492009162902832, -0.1237383633852005, -0.0982757955789566, -0.07281322777271271, -0.04735064506530762, -0.02188807912170887, 0.0035744868218898773, 0.029037050902843475, 0.05449961870908737, 0.07996217906475067, 0.10542474687099457, 0.13088731467723846, 0.15634988248348236, 0.18181245028972626, 0.20727501809597015, 0.23273757100105286, 0.25820013880729675, 0.28366270661354065, 0.30912527441978455, 0.33458784222602844, 0.36005041003227234, 0.38551297783851624, 0.41097554564476013, 0.43643811345100403, 0.4619006812572479, 0.48736321926116943, 0.5128257870674133, 0.5382883548736572, 0.5637509226799011, 0.589213490486145, 0.6146760582923889, 0.6401386260986328, 0.6656011939048767, 0.6910637617111206, 0.7165263295173645, 0.7419888973236084, 0.7674514651298523]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 3.0, 5.0, 8.0, 8.0, 13.0, 23.0, 35.0, 34.0, 42.0, 85.0, 127.0, 216.0, 316.0, 538.0, 1035.0, 2078.0, 5484.0, 34678.0, 1549681.0, 2533678.0, 53223.0, 7802.0, 2492.0, 1086.0, 581.0, 345.0, 229.0, 131.0, 93.0, 61.0, 49.0, 22.0, 24.0, 13.0, 11.0, 10.0, 11.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.890625, -0.8666000366210938, -0.8425750732421875, -0.8185501098632812, -0.794525146484375, -0.7705001831054688, -0.7464752197265625, -0.7224502563476562, -0.69842529296875, -0.6744003295898438, -0.6503753662109375, -0.6263504028320312, -0.602325439453125, -0.5783004760742188, -0.5542755126953125, -0.5302505493164062, -0.5062255859375, -0.48220062255859375, -0.4581756591796875, -0.43415069580078125, -0.410125732421875, -0.38610076904296875, -0.3620758056640625, -0.33805084228515625, -0.31402587890625, -0.29000091552734375, -0.2659759521484375, -0.24195098876953125, -0.217926025390625, -0.19390106201171875, -0.1698760986328125, -0.14585113525390625, -0.121826171875, -0.09780120849609375, -0.0737762451171875, -0.04975128173828125, -0.025726318359375, -0.00170135498046875, 0.0223236083984375, 0.04634857177734375, 0.07037353515625, 0.09439849853515625, 0.1184234619140625, 0.14244842529296875, 0.166473388671875, 0.19049835205078125, 0.2145233154296875, 0.23854827880859375, 0.2625732421875, 0.28659820556640625, 0.3106231689453125, 0.33464813232421875, 0.358673095703125, 0.38269805908203125, 0.4067230224609375, 0.43074798583984375, 0.45477294921875, 0.47879791259765625, 0.5028228759765625, 0.5268478393554688, 0.550872802734375, 0.5748977661132812, 0.5989227294921875, 0.6229476928710938, 0.64697265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 11.0, 14.0, 18.0, 18.0, 27.0, 17.0, 26.0, 35.0, 43.0, 41.0, 46.0, 35.0, 64.0, 69.0, 60.0, 53.0, 51.0, 66.0, 34.0, 50.0, 33.0, 33.0, 28.0, 28.0, 21.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.413330078125, -0.4033489227294922, -0.3933677673339844, -0.38338661193847656, -0.37340545654296875, -0.36342430114746094, -0.3534431457519531, -0.3434619903564453, -0.3334808349609375, -0.3234996795654297, -0.3135185241699219, -0.30353736877441406, -0.29355621337890625, -0.28357505798339844, -0.2735939025878906, -0.2636127471923828, -0.253631591796875, -0.2436504364013672, -0.23366928100585938, -0.22368812561035156, -0.21370697021484375, -0.20372581481933594, -0.19374465942382812, -0.1837635040283203, -0.1737823486328125, -0.1638011932373047, -0.15382003784179688, -0.14383888244628906, -0.13385772705078125, -0.12387657165527344, -0.11389541625976562, -0.10391426086425781, -0.09393310546875, -0.08395195007324219, -0.07397079467773438, -0.06398963928222656, -0.05400848388671875, -0.04402732849121094, -0.034046173095703125, -0.024065017700195312, -0.0140838623046875, -0.0041027069091796875, 0.005878448486328125, 0.015859603881835938, 0.02584075927734375, 0.03582191467285156, 0.045803070068359375, 0.05578422546386719, 0.065765380859375, 0.07574653625488281, 0.08572769165039062, 0.09570884704589844, 0.10569000244140625, 0.11567115783691406, 0.12565231323242188, 0.1356334686279297, 0.1456146240234375, 0.1555957794189453, 0.16557693481445312, 0.17555809020996094, 0.18553924560546875, 0.19552040100097656, 0.20550155639648438, 0.2154827117919922, 0.2254638671875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 13.0, 16.0, 21.0, 42.0, 54.0, 138.0, 259.0, 469.0, 1027.0, 2764.0, 9440.0, 67206.0, 3656740.0, 426244.0, 22098.0, 4744.0, 1601.0, 619.0, 330.0, 178.0, 98.0, 63.0, 30.0, 19.0, 19.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8544921875, -0.8299026489257812, -0.8053131103515625, -0.7807235717773438, -0.756134033203125, -0.7315444946289062, -0.7069549560546875, -0.6823654174804688, -0.65777587890625, -0.6331863403320312, -0.6085968017578125, -0.5840072631835938, -0.559417724609375, -0.5348281860351562, -0.5102386474609375, -0.48564910888671875, -0.4610595703125, -0.43647003173828125, -0.4118804931640625, -0.38729095458984375, -0.362701416015625, -0.33811187744140625, -0.3135223388671875, -0.28893280029296875, -0.26434326171875, -0.23975372314453125, -0.2151641845703125, -0.19057464599609375, -0.165985107421875, -0.14139556884765625, -0.1168060302734375, -0.09221649169921875, -0.067626953125, -0.04303741455078125, -0.0184478759765625, 0.00614166259765625, 0.030731201171875, 0.05532073974609375, 0.0799102783203125, 0.10449981689453125, 0.12908935546875, 0.15367889404296875, 0.1782684326171875, 0.20285797119140625, 0.227447509765625, 0.25203704833984375, 0.2766265869140625, 0.30121612548828125, 0.3258056640625, 0.35039520263671875, 0.3749847412109375, 0.39957427978515625, 0.424163818359375, 0.44875335693359375, 0.4733428955078125, 0.49793243408203125, 0.52252197265625, 0.5471115112304688, 0.5717010498046875, 0.5962905883789062, 0.620880126953125, 0.6454696655273438, 0.6700592041015625, 0.6946487426757812, 0.71923828125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 8.0, 6.0, 3.0, 11.0, 12.0, 15.0, 33.0, 22.0, 44.0, 94.0, 142.0, 341.0, 593.0, 906.0, 779.0, 498.0, 239.0, 128.0, 72.0, 42.0, 24.0, 14.0, 15.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1684112548828125, -0.162750244140625, -0.1570892333984375, -0.15142822265625, -0.1457672119140625, -0.140106201171875, -0.1344451904296875, -0.1287841796875, -0.1231231689453125, -0.117462158203125, -0.1118011474609375, -0.10614013671875, -0.1004791259765625, -0.094818115234375, -0.0891571044921875, -0.08349609375, -0.0778350830078125, -0.072174072265625, -0.0665130615234375, -0.06085205078125, -0.0551910400390625, -0.049530029296875, -0.0438690185546875, -0.0382080078125, -0.0325469970703125, -0.026885986328125, -0.0212249755859375, -0.01556396484375, -0.0099029541015625, -0.004241943359375, 0.0014190673828125, 0.007080078125, 0.0127410888671875, 0.018402099609375, 0.0240631103515625, 0.02972412109375, 0.0353851318359375, 0.041046142578125, 0.0467071533203125, 0.0523681640625, 0.0580291748046875, 0.063690185546875, 0.0693511962890625, 0.07501220703125, 0.0806732177734375, 0.086334228515625, 0.0919952392578125, 0.09765625, 0.1033172607421875, 0.108978271484375, 0.1146392822265625, 0.12030029296875, 0.1259613037109375, 0.131622314453125, 0.1372833251953125, 0.1429443359375, 0.1486053466796875, 0.154266357421875, 0.1599273681640625, 0.16558837890625, 0.1712493896484375, 0.176910400390625, 0.1825714111328125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 13.0, 13.0, 23.0, 22.0, 35.0, 43.0, 62.0, 81.0, 117.0, 100.0, 107.0, 87.0, 86.0, 65.0, 35.0, 34.0, 21.0, 11.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6039164662361145, -0.5869348645210266, -0.5699533224105835, -0.5529717206954956, -0.5359901785850525, -0.5190085768699646, -0.5020270347595215, -0.4850454330444336, -0.4680638313293457, -0.4510822594165802, -0.4341006875038147, -0.4171190857887268, -0.4001375138759613, -0.3831559419631958, -0.3661743700504303, -0.3491927981376648, -0.3322112262248993, -0.3152296543121338, -0.2982480823993683, -0.2812665104866028, -0.2642849087715149, -0.2473033368587494, -0.2303217649459839, -0.21334019303321838, -0.1963586062192917, -0.17937703430652618, -0.1623954474925995, -0.14541387557983398, -0.12843230366706848, -0.11145071685314178, -0.09446914494037628, -0.07748756557703018, -0.06050598621368408, -0.04352440685033798, -0.02654283121228218, -0.00956125557422638, 0.0074203237891197205, 0.02440190315246582, 0.04138347506523132, 0.05836505442857742, 0.07534663379192352, 0.09232821315526962, 0.10930979251861572, 0.12629136443138123, 0.14327293634414673, 0.16025452315807343, 0.17723609507083893, 0.19421768188476562, 0.21119925379753113, 0.22818082571029663, 0.24516241252422333, 0.26214396953582764, 0.2791255712509155, 0.29610714316368103, 0.31308871507644653, 0.33007028698921204, 0.34705185890197754, 0.36403343081474304, 0.38101500272750854, 0.39799660444259644, 0.41497817635536194, 0.43195974826812744, 0.44894132018089294, 0.46592289209365845, 0.48290449380874634]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 5.0, 13.0, 11.0, 22.0, 20.0, 23.0, 26.0, 31.0, 33.0, 32.0, 26.0, 34.0, 24.0, 38.0, 49.0, 40.0, 41.0, 48.0, 37.0, 44.0, 36.0, 35.0, 40.0, 24.0, 22.0, 28.0, 28.0, 28.0, 20.0, 18.0, 15.0, 14.0, 12.0, 19.0, 6.0, 8.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23238198459148407, -0.22363820672035217, -0.21489444375038147, -0.20615066587924957, -0.19740688800811768, -0.18866312503814697, -0.17991934716701508, -0.17117556929588318, -0.16243180632591248, -0.15368802845478058, -0.14494426548480988, -0.13620048761367798, -0.12745672464370728, -0.11871294677257538, -0.10996916890144348, -0.10122539848089218, -0.09248162806034088, -0.08373785763978958, -0.07499408721923828, -0.06625030934810638, -0.057506538927555084, -0.048762768507003784, -0.040018994361162186, -0.03127522021532059, -0.022531449794769287, -0.013787677511572838, -0.0050439052283763885, 0.0036998670548200607, 0.01244363933801651, 0.02118740975856781, 0.02993118390440941, 0.03867495805025101, 0.04741871356964111, 0.05616248399019241, 0.06490625441074371, 0.07365003228187561, 0.08239380270242691, 0.09113757312297821, 0.09988135099411011, 0.10862512141466141, 0.11736889183521271, 0.1261126697063446, 0.1348564326763153, 0.1436002105474472, 0.1523439884185791, 0.1610877513885498, 0.1698315292596817, 0.1785753071308136, 0.1873190701007843, 0.1960628479719162, 0.2048066109418869, 0.2135503888130188, 0.2222941517829895, 0.2310379296541214, 0.2397817075252533, 0.248525470495224, 0.2572692632675171, 0.2660130262374878, 0.2747568190097809, 0.2835005819797516, 0.2922443449497223, 0.3009881377220154, 0.3097319006919861, 0.3184756636619568, 0.3272194266319275]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 13.0, 20.0, 27.0, 39.0, 73.0, 84.0, 118.0, 214.0, 312.0, 460.0, 759.0, 1270.0, 2170.0, 4156.0, 9171.0, 24218.0, 98379.0, 586832.0, 248921.0, 43965.0, 14166.0, 5990.0, 2918.0, 1600.0, 933.0, 591.0, 389.0, 262.0, 170.0, 106.0, 62.0, 45.0, 36.0, 20.0, 15.0, 9.0, 5.0, 12.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.13955307006835938, -0.13469696044921875, -0.12984085083007812, -0.1249847412109375, -0.12012863159179688, -0.11527252197265625, -0.11041641235351562, -0.105560302734375, -0.10070419311523438, -0.09584808349609375, -0.09099197387695312, -0.0861358642578125, -0.08127975463867188, -0.07642364501953125, -0.07156753540039062, -0.06671142578125, -0.061855316162109375, -0.05699920654296875, -0.052143096923828125, -0.0472869873046875, -0.042430877685546875, -0.03757476806640625, -0.032718658447265625, -0.027862548828125, -0.023006439208984375, -0.01815032958984375, -0.013294219970703125, -0.0084381103515625, -0.003582000732421875, 0.00127410888671875, 0.006130218505859375, 0.010986328125, 0.015842437744140625, 0.02069854736328125, 0.025554656982421875, 0.0304107666015625, 0.035266876220703125, 0.04012298583984375, 0.044979095458984375, 0.049835205078125, 0.054691314697265625, 0.05954742431640625, 0.06440353393554688, 0.0692596435546875, 0.07411575317382812, 0.07897186279296875, 0.08382797241210938, 0.08868408203125, 0.09354019165039062, 0.09839630126953125, 0.10325241088867188, 0.1081085205078125, 0.11296463012695312, 0.11782073974609375, 0.12267684936523438, 0.127532958984375, 0.13238906860351562, 0.13724517822265625, 0.14210128784179688, 0.1469573974609375, 0.15181350708007812, 0.15666961669921875, 0.16152572631835938, 0.1663818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 10.0, 13.0, 16.0, 15.0, 23.0, 27.0, 22.0, 37.0, 26.0, 33.0, 33.0, 37.0, 40.0, 42.0, 50.0, 47.0, 46.0, 47.0, 54.0, 46.0, 35.0, 41.0, 31.0, 33.0, 25.0, 32.0, 17.0, 19.0, 13.0, 17.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163330078125, -0.15766334533691406, -0.15199661254882812, -0.1463298797607422, -0.14066314697265625, -0.1349964141845703, -0.12932968139648438, -0.12366294860839844, -0.1179962158203125, -0.11232948303222656, -0.10666275024414062, -0.10099601745605469, -0.09532928466796875, -0.08966255187988281, -0.08399581909179688, -0.07832908630371094, -0.072662353515625, -0.06699562072753906, -0.061328887939453125, -0.05566215515136719, -0.04999542236328125, -0.04432868957519531, -0.038661956787109375, -0.03299522399902344, -0.0273284912109375, -0.021661758422851562, -0.015995025634765625, -0.010328292846679688, -0.00466156005859375, 0.0010051727294921875, 0.006671905517578125, 0.012338638305664062, 0.01800537109375, 0.023672103881835938, 0.029338836669921875, 0.03500556945800781, 0.04067230224609375, 0.04633903503417969, 0.052005767822265625, 0.05767250061035156, 0.0633392333984375, 0.06900596618652344, 0.07467269897460938, 0.08033943176269531, 0.08600616455078125, 0.09167289733886719, 0.09733963012695312, 0.10300636291503906, 0.108673095703125, 0.11433982849121094, 0.12000656127929688, 0.1256732940673828, 0.13134002685546875, 0.1370067596435547, 0.14267349243164062, 0.14834022521972656, 0.1540069580078125, 0.15967369079589844, 0.16534042358398438, 0.1710071563720703, 0.17667388916015625, 0.1823406219482422, 0.18800735473632812, 0.19367408752441406, 0.1993408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 18.0, 29.0, 36.0, 57.0, 64.0, 122.0, 171.0, 243.0, 386.0, 551.0, 914.0, 1617.0, 2973.0, 5527.0, 11247.0, 24351.0, 59996.0, 167231.0, 394070.0, 235657.0, 81571.0, 32087.0, 14017.0, 6841.0, 3598.0, 2021.0, 1147.0, 668.0, 437.0, 303.0, 168.0, 112.0, 85.0, 61.0, 52.0, 35.0, 17.0, 9.0, 9.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0687255859375, -0.06668376922607422, -0.06464195251464844, -0.06260013580322266, -0.060558319091796875, -0.058516502380371094, -0.05647468566894531, -0.05443286895751953, -0.05239105224609375, -0.05034923553466797, -0.04830741882324219, -0.046265602111816406, -0.044223785400390625, -0.042181968688964844, -0.04014015197753906, -0.03809833526611328, -0.0360565185546875, -0.03401470184326172, -0.03197288513183594, -0.029931068420410156, -0.027889251708984375, -0.025847434997558594, -0.023805618286132812, -0.02176380157470703, -0.01972198486328125, -0.01768016815185547, -0.015638351440429688, -0.013596534729003906, -0.011554718017578125, -0.009512901306152344, -0.0074710845947265625, -0.005429267883300781, -0.003387451171875, -0.0013456344604492188, 0.0006961822509765625, 0.0027379989624023438, 0.004779815673828125, 0.006821632385253906, 0.008863449096679688, 0.010905265808105469, 0.01294708251953125, 0.014988899230957031, 0.017030715942382812, 0.019072532653808594, 0.021114349365234375, 0.023156166076660156, 0.025197982788085938, 0.02723979949951172, 0.0292816162109375, 0.03132343292236328, 0.03336524963378906, 0.035407066345214844, 0.037448883056640625, 0.039490699768066406, 0.04153251647949219, 0.04357433319091797, 0.04561614990234375, 0.04765796661376953, 0.04969978332519531, 0.051741600036621094, 0.053783416748046875, 0.055825233459472656, 0.05786705017089844, 0.05990886688232422, 0.06195068359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 9.0, 28.0, 8.0, 17.0, 22.0, 27.0, 15.0, 25.0, 37.0, 37.0, 35.0, 45.0, 40.0, 44.0, 39.0, 34.0, 64.0, 46.0, 37.0, 41.0, 29.0, 45.0, 36.0, 35.0, 21.0, 21.0, 14.0, 18.0, 17.0, 18.0, 16.0, 11.0, 13.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.3994140625, -0.387939453125, -0.37646484375, -0.364990234375, -0.353515625, -0.342041015625, -0.33056640625, -0.319091796875, -0.3076171875, -0.296142578125, -0.28466796875, -0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 8.0, 13.0, 12.0, 20.0, 25.0, 43.0, 74.0, 108.0, 191.0, 301.0, 527.0, 1107.0, 2395.0, 6390.0, 21525.0, 109799.0, 570345.0, 273751.0, 44278.0, 10650.0, 3658.0, 1579.0, 773.0, 376.0, 214.0, 126.0, 88.0, 59.0, 31.0, 32.0, 15.0, 8.0, 10.0, 2.0, 6.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.030818462371826172, -0.029746055603027344, -0.028673648834228516, -0.027601242065429688, -0.02652883529663086, -0.02545642852783203, -0.024384021759033203, -0.023311614990234375, -0.022239208221435547, -0.02116680145263672, -0.02009439468383789, -0.019021987915039062, -0.017949581146240234, -0.016877174377441406, -0.015804767608642578, -0.01473236083984375, -0.013659954071044922, -0.012587547302246094, -0.011515140533447266, -0.010442733764648438, -0.00937032699584961, -0.008297920227050781, -0.007225513458251953, -0.006153106689453125, -0.005080699920654297, -0.004008293151855469, -0.0029358863830566406, -0.0018634796142578125, -0.0007910728454589844, 0.00028133392333984375, 0.0013537406921386719, 0.0024261474609375, 0.003498554229736328, 0.004570960998535156, 0.005643367767333984, 0.0067157745361328125, 0.007788181304931641, 0.008860588073730469, 0.009932994842529297, 0.011005401611328125, 0.012077808380126953, 0.013150215148925781, 0.01422262191772461, 0.015295028686523438, 0.016367435455322266, 0.017439842224121094, 0.018512248992919922, 0.01958465576171875, 0.020657062530517578, 0.021729469299316406, 0.022801876068115234, 0.023874282836914062, 0.02494668960571289, 0.02601909637451172, 0.027091503143310547, 0.028163909912109375, 0.029236316680908203, 0.03030872344970703, 0.03138113021850586, 0.03245353698730469, 0.033525943756103516, 0.034598350524902344, 0.03567075729370117, 0.0367431640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 16.0, 25.0, 27.0, 31.0, 53.0, 65.0, 77.0, 99.0, 91.0, 105.0, 85.0, 56.0, 60.0, 40.0, 24.0, 27.0, 11.0, 16.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0347925126552582e-05, -9.90740954875946e-06, -9.466893970966339e-06, -9.026378393173218e-06, -8.585862815380096e-06, -8.145347237586975e-06, -7.704831659793854e-06, -7.264316082000732e-06, -6.823800504207611e-06, -6.38328492641449e-06, -5.942769348621368e-06, -5.502253770828247e-06, -5.061738193035126e-06, -4.621222615242004e-06, -4.180707037448883e-06, -3.7401914596557617e-06, -3.2996758818626404e-06, -2.859160304069519e-06, -2.4186447262763977e-06, -1.9781291484832764e-06, -1.537613570690155e-06, -1.0970979928970337e-06, -6.565824151039124e-07, -2.1606683731079102e-07, 2.2444874048233032e-07, 6.649643182754517e-07, 1.105479896068573e-06, 1.5459954738616943e-06, 1.9865110516548157e-06, 2.427026629447937e-06, 2.8675422072410583e-06, 3.3080577850341797e-06, 3.748573362827301e-06, 4.189088940620422e-06, 4.629604518413544e-06, 5.070120096206665e-06, 5.510635673999786e-06, 5.951151251792908e-06, 6.391666829586029e-06, 6.83218240737915e-06, 7.272697985172272e-06, 7.713213562965393e-06, 8.153729140758514e-06, 8.594244718551636e-06, 9.034760296344757e-06, 9.475275874137878e-06, 9.915791451931e-06, 1.0356307029724121e-05, 1.0796822607517242e-05, 1.1237338185310364e-05, 1.1677853763103485e-05, 1.2118369340896606e-05, 1.2558884918689728e-05, 1.2999400496482849e-05, 1.343991607427597e-05, 1.3880431652069092e-05, 1.4320947229862213e-05, 1.4761462807655334e-05, 1.5201978385448456e-05, 1.5642493963241577e-05, 1.60830095410347e-05, 1.652352511882782e-05, 1.696404069662094e-05, 1.7404556274414062e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 11.0, 13.0, 24.0, 24.0, 52.0, 77.0, 129.0, 216.0, 391.0, 614.0, 1201.0, 2307.0, 4991.0, 11319.0, 27877.0, 75350.0, 209710.0, 380238.0, 209781.0, 75007.0, 27908.0, 11228.0, 4973.0, 2362.0, 1213.0, 630.0, 358.0, 215.0, 124.0, 79.0, 47.0, 20.0, 24.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0277862548828125, -0.02700352668762207, -0.02622079849243164, -0.02543807029724121, -0.02465534210205078, -0.02387261390686035, -0.023089885711669922, -0.022307157516479492, -0.021524429321289062, -0.020741701126098633, -0.019958972930908203, -0.019176244735717773, -0.018393516540527344, -0.017610788345336914, -0.016828060150146484, -0.016045331954956055, -0.015262603759765625, -0.014479875564575195, -0.013697147369384766, -0.012914419174194336, -0.012131690979003906, -0.011348962783813477, -0.010566234588623047, -0.009783506393432617, -0.009000778198242188, -0.008218050003051758, -0.007435321807861328, -0.0066525936126708984, -0.005869865417480469, -0.005087137222290039, -0.004304409027099609, -0.0035216808319091797, -0.00273895263671875, -0.0019562244415283203, -0.0011734962463378906, -0.00039076805114746094, 0.00039196014404296875, 0.0011746883392333984, 0.001957416534423828, 0.002740144729614258, 0.0035228729248046875, 0.004305601119995117, 0.005088329315185547, 0.0058710575103759766, 0.006653785705566406, 0.007436513900756836, 0.008219242095947266, 0.009001970291137695, 0.009784698486328125, 0.010567426681518555, 0.011350154876708984, 0.012132883071899414, 0.012915611267089844, 0.013698339462280273, 0.014481067657470703, 0.015263795852661133, 0.016046524047851562, 0.016829252243041992, 0.017611980438232422, 0.01839470863342285, 0.01917743682861328, 0.01996016502380371, 0.02074289321899414, 0.02152562141418457, 0.022308349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 9.0, 15.0, 14.0, 25.0, 21.0, 22.0, 26.0, 38.0, 33.0, 61.0, 58.0, 56.0, 59.0, 56.0, 66.0, 63.0, 48.0, 54.0, 44.0, 35.0, 32.0, 40.0, 33.0, 10.0, 9.0, 12.0, 12.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005947113037109375, -0.005723774433135986, -0.005500435829162598, -0.005277097225189209, -0.00505375862121582, -0.004830420017242432, -0.004607081413269043, -0.004383742809295654, -0.004160404205322266, -0.003937065601348877, -0.0037137269973754883, -0.0034903883934020996, -0.003267049789428711, -0.0030437111854553223, -0.0028203725814819336, -0.002597033977508545, -0.0023736953735351562, -0.0021503567695617676, -0.001927018165588379, -0.0017036795616149902, -0.0014803409576416016, -0.0012570023536682129, -0.0010336637496948242, -0.0008103251457214355, -0.0005869865417480469, -0.0003636479377746582, -0.00014030933380126953, 8.302927017211914e-05, 0.0003063678741455078, 0.0005297064781188965, 0.0007530450820922852, 0.0009763836860656738, 0.0011997222900390625, 0.0014230608940124512, 0.0016463994979858398, 0.0018697381019592285, 0.002093076705932617, 0.002316415309906006, 0.0025397539138793945, 0.002763092517852783, 0.002986431121826172, 0.0032097697257995605, 0.0034331083297729492, 0.003656446933746338, 0.0038797855377197266, 0.004103124141693115, 0.004326462745666504, 0.004549801349639893, 0.004773139953613281, 0.00499647855758667, 0.005219817161560059, 0.005443155765533447, 0.005666494369506836, 0.005889832973480225, 0.006113171577453613, 0.006336510181427002, 0.006559848785400391, 0.006783187389373779, 0.007006525993347168, 0.007229864597320557, 0.007453203201293945, 0.007676541805267334, 0.007899880409240723, 0.008123219013214111, 0.0083465576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 14.0, 14.0, 23.0, 36.0, 61.0, 63.0, 98.0, 109.0, 145.0, 129.0, 78.0, 75.0, 42.0, 45.0, 18.0, 14.0, 11.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.373170405626297, -0.3620213270187378, -0.3508722484111786, -0.3397231698036194, -0.32857412099838257, -0.31742504239082336, -0.30627596378326416, -0.29512688517570496, -0.28397780656814575, -0.27282872796058655, -0.26167964935302734, -0.2505306005477905, -0.23938152194023132, -0.22823244333267212, -0.21708336472511292, -0.2059342861175537, -0.1947852373123169, -0.1836361587047577, -0.17248709499835968, -0.16133801639080048, -0.15018895268440247, -0.13903987407684326, -0.12789079546928406, -0.11674172431230545, -0.10559265315532684, -0.09444358199834824, -0.08329451084136963, -0.07214543223381042, -0.06099636107683182, -0.04984728991985321, -0.038698211312294006, -0.0275491401553154, -0.016400068998336792, -0.005250995978713036, 0.005898077040910721, 0.017047151923179626, 0.028196223080158234, 0.03934529423713684, 0.050494372844696045, 0.06164344400167465, 0.07279251515865326, 0.08394158631563187, 0.09509065747261047, 0.10623973608016968, 0.11738880723714828, 0.1285378783941269, 0.1396869570016861, 0.1508360207080841, 0.1619850993156433, 0.17313417792320251, 0.18428324162960052, 0.19543232023715973, 0.20658138394355774, 0.21773046255111694, 0.22887954115867615, 0.24002861976623535, 0.25117766857147217, 0.26232674717903137, 0.2734758257865906, 0.2846248745918274, 0.2957739531993866, 0.3069230318069458, 0.318072110414505, 0.3292211890220642, 0.3403702676296234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 13.0, 9.0, 14.0, 22.0, 21.0, 35.0, 31.0, 42.0, 33.0, 42.0, 42.0, 48.0, 54.0, 54.0, 62.0, 52.0, 48.0, 49.0, 44.0, 38.0, 35.0, 40.0, 30.0, 33.0, 17.0, 14.0, 12.0, 18.0, 15.0, 5.0, 5.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.22568418085575104, -0.21931801736354828, -0.2129518687725067, -0.20658570528030396, -0.2002195417881012, -0.19385339319705963, -0.18748722970485687, -0.1811210811138153, -0.17475491762161255, -0.1683887541294098, -0.16202260553836823, -0.15565644204616547, -0.1492902785539627, -0.14292412996292114, -0.13655796647071838, -0.13019180297851562, -0.12382564693689346, -0.1174594908952713, -0.11109332740306854, -0.10472717136144638, -0.09836101531982422, -0.09199485182762146, -0.0856286957859993, -0.07926253974437714, -0.07289637625217438, -0.06653022021055222, -0.060164060443639755, -0.053797900676727295, -0.04743174463510513, -0.04106558486819267, -0.03469942510128021, -0.02833326905965805, -0.02196711301803589, -0.015600955113768578, -0.009234796278178692, -0.002868637442588806, 0.003497520461678505, 0.009863678365945816, 0.016229838132858276, 0.022595994174480438, 0.0289621539413929, 0.03532831370830536, 0.04169446974992752, 0.04806062951683998, 0.05442678928375244, 0.0607929453253746, 0.06715910136699677, 0.07352526485919952, 0.07989142090082169, 0.08625757694244385, 0.0926237404346466, 0.09898989647626877, 0.10535605251789093, 0.11172221601009369, 0.11808837205171585, 0.12445452809333801, 0.13082069158554077, 0.13718685507774353, 0.1435530036687851, 0.14991916716098785, 0.1562853306531906, 0.16265147924423218, 0.16901764273643494, 0.1753838062286377, 0.18174995481967926]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 17.0, 14.0, 17.0, 21.0, 40.0, 68.0, 79.0, 135.0, 229.0, 315.0, 435.0, 766.0, 1268.0, 2184.0, 3842.0, 7524.0, 15444.0, 36895.0, 110461.0, 471382.0, 277656.0, 68769.0, 25994.0, 11590.0, 5701.0, 3065.0, 1735.0, 1045.0, 644.0, 411.0, 275.0, 170.0, 107.0, 85.0, 50.0, 31.0, 19.0, 19.0, 15.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27685546875, -0.2678680419921875, -0.258880615234375, -0.2498931884765625, -0.24090576171875, -0.2319183349609375, -0.222930908203125, -0.2139434814453125, -0.2049560546875, -0.1959686279296875, -0.186981201171875, -0.1779937744140625, -0.16900634765625, -0.1600189208984375, -0.151031494140625, -0.1420440673828125, -0.133056640625, -0.1240692138671875, -0.115081787109375, -0.1060943603515625, -0.09710693359375, -0.0881195068359375, -0.079132080078125, -0.0701446533203125, -0.0611572265625, -0.0521697998046875, -0.043182373046875, -0.0341949462890625, -0.02520751953125, -0.0162200927734375, -0.007232666015625, 0.0017547607421875, 0.0107421875, 0.0197296142578125, 0.028717041015625, 0.0377044677734375, 0.04669189453125, 0.0556793212890625, 0.064666748046875, 0.0736541748046875, 0.0826416015625, 0.0916290283203125, 0.100616455078125, 0.1096038818359375, 0.11859130859375, 0.1275787353515625, 0.136566162109375, 0.1455535888671875, 0.154541015625, 0.1635284423828125, 0.172515869140625, 0.1815032958984375, 0.19049072265625, 0.1994781494140625, 0.208465576171875, 0.2174530029296875, 0.2264404296875, 0.2354278564453125, 0.244415283203125, 0.2534027099609375, 0.26239013671875, 0.2713775634765625, 0.280364990234375, 0.2893524169921875, 0.29833984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 12.0, 8.0, 15.0, 21.0, 20.0, 24.0, 24.0, 23.0, 37.0, 41.0, 44.0, 44.0, 46.0, 44.0, 41.0, 52.0, 58.0, 64.0, 41.0, 52.0, 28.0, 43.0, 37.0, 25.0, 27.0, 22.0, 16.0, 18.0, 16.0, 8.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4253082275390625, -0.413360595703125, -0.4014129638671875, -0.38946533203125, -0.3775177001953125, -0.365570068359375, -0.3536224365234375, -0.3416748046875, -0.3297271728515625, -0.317779541015625, -0.3058319091796875, -0.29388427734375, -0.2819366455078125, -0.269989013671875, -0.2580413818359375, -0.24609375, -0.2341461181640625, -0.222198486328125, -0.2102508544921875, -0.19830322265625, -0.1863555908203125, -0.174407958984375, -0.1624603271484375, -0.1505126953125, -0.1385650634765625, -0.126617431640625, -0.1146697998046875, -0.10272216796875, -0.0907745361328125, -0.078826904296875, -0.0668792724609375, -0.054931640625, -0.0429840087890625, -0.031036376953125, -0.0190887451171875, -0.00714111328125, 0.0048065185546875, 0.016754150390625, 0.0287017822265625, 0.0406494140625, 0.0525970458984375, 0.064544677734375, 0.0764923095703125, 0.08843994140625, 0.1003875732421875, 0.112335205078125, 0.1242828369140625, 0.13623046875, 0.1481781005859375, 0.160125732421875, 0.1720733642578125, 0.18402099609375, 0.1959686279296875, 0.207916259765625, 0.2198638916015625, 0.2318115234375, 0.2437591552734375, 0.255706787109375, 0.2676544189453125, 0.27960205078125, 0.2915496826171875, 0.303497314453125, 0.3154449462890625, 0.327392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 15.0, 15.0, 18.0, 21.0, 27.0, 42.0, 76.0, 101.0, 161.0, 368.0, 782.0, 2165.0, 8315.0, 42808.0, 537312.0, 409296.0, 36514.0, 7090.0, 2018.0, 665.0, 300.0, 147.0, 113.0, 64.0, 33.0, 18.0, 20.0, 14.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489990234375, -0.4724617004394531, -0.45493316650390625, -0.4374046325683594, -0.4198760986328125, -0.4023475646972656, -0.38481903076171875, -0.3672904968261719, -0.349761962890625, -0.3322334289550781, -0.31470489501953125, -0.2971763610839844, -0.2796478271484375, -0.2621192932128906, -0.24459075927734375, -0.22706222534179688, -0.20953369140625, -0.19200515747070312, -0.17447662353515625, -0.15694808959960938, -0.1394195556640625, -0.12189102172851562, -0.10436248779296875, -0.08683395385742188, -0.069305419921875, -0.051776885986328125, -0.03424835205078125, -0.016719818115234375, 0.0008087158203125, 0.018337249755859375, 0.03586578369140625, 0.053394317626953125, 0.0709228515625, 0.08845138549804688, 0.10597991943359375, 0.12350845336914062, 0.1410369873046875, 0.15856552124023438, 0.17609405517578125, 0.19362258911132812, 0.211151123046875, 0.22867965698242188, 0.24620819091796875, 0.2637367248535156, 0.2812652587890625, 0.2987937927246094, 0.31632232666015625, 0.3338508605957031, 0.35137939453125, 0.3689079284667969, 0.38643646240234375, 0.4039649963378906, 0.4214935302734375, 0.4390220642089844, 0.45655059814453125, 0.4740791320800781, 0.491607666015625, 0.5091361999511719, 0.5266647338867188, 0.5441932678222656, 0.5617218017578125, 0.5792503356933594, 0.5967788696289062, 0.6143074035644531, 0.6318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 9.0, 12.0, 11.0, 12.0, 11.0, 22.0, 20.0, 26.0, 41.0, 36.0, 48.0, 48.0, 41.0, 50.0, 43.0, 65.0, 54.0, 51.0, 57.0, 48.0, 51.0, 35.0, 30.0, 29.0, 33.0, 23.0, 12.0, 15.0, 9.0, 13.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.4971504211425781, -0.48258209228515625, -0.4680137634277344, -0.4534454345703125, -0.4388771057128906, -0.42430877685546875, -0.4097404479980469, -0.395172119140625, -0.3806037902832031, -0.36603546142578125, -0.3514671325683594, -0.3368988037109375, -0.3223304748535156, -0.30776214599609375, -0.2931938171386719, -0.27862548828125, -0.2640571594238281, -0.24948883056640625, -0.23492050170898438, -0.2203521728515625, -0.20578384399414062, -0.19121551513671875, -0.17664718627929688, -0.162078857421875, -0.14751052856445312, -0.13294219970703125, -0.11837387084960938, -0.1038055419921875, -0.08923721313476562, -0.07466888427734375, -0.060100555419921875, -0.0455322265625, -0.030963897705078125, -0.01639556884765625, -0.001827239990234375, 0.0127410888671875, 0.027309417724609375, 0.04187774658203125, 0.056446075439453125, 0.071014404296875, 0.08558273315429688, 0.10015106201171875, 0.11471939086914062, 0.1292877197265625, 0.14385604858398438, 0.15842437744140625, 0.17299270629882812, 0.18756103515625, 0.20212936401367188, 0.21669769287109375, 0.23126602172851562, 0.2458343505859375, 0.2604026794433594, 0.27497100830078125, 0.2895393371582031, 0.304107666015625, 0.3186759948730469, 0.33324432373046875, 0.3478126525878906, 0.3623809814453125, 0.3769493103027344, 0.39151763916015625, 0.4060859680175781, 0.420654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 17.0, 33.0, 57.0, 155.0, 397.0, 1425.0, 8287.0, 141495.0, 853355.0, 38279.0, 3683.0, 804.0, 263.0, 119.0, 47.0, 41.0, 13.0, 7.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.17731857299804688, -0.17165374755859375, -0.16598892211914062, -0.1603240966796875, -0.15465927124023438, -0.14899444580078125, -0.14332962036132812, -0.137664794921875, -0.13199996948242188, -0.12633514404296875, -0.12067031860351562, -0.1150054931640625, -0.10934066772460938, -0.10367584228515625, -0.09801101684570312, -0.09234619140625, -0.08668136596679688, -0.08101654052734375, -0.07535171508789062, -0.0696868896484375, -0.06402206420898438, -0.05835723876953125, -0.052692413330078125, -0.047027587890625, -0.041362762451171875, -0.03569793701171875, -0.030033111572265625, -0.0243682861328125, -0.018703460693359375, -0.01303863525390625, -0.007373809814453125, -0.001708984375, 0.003955841064453125, 0.00962066650390625, 0.015285491943359375, 0.0209503173828125, 0.026615142822265625, 0.03227996826171875, 0.037944793701171875, 0.043609619140625, 0.049274444580078125, 0.05493927001953125, 0.060604095458984375, 0.0662689208984375, 0.07193374633789062, 0.07759857177734375, 0.08326339721679688, 0.08892822265625, 0.09459304809570312, 0.10025787353515625, 0.10592269897460938, 0.1115875244140625, 0.11725234985351562, 0.12291717529296875, 0.12858200073242188, 0.134246826171875, 0.13991165161132812, 0.14557647705078125, 0.15124130249023438, 0.1569061279296875, 0.16257095336914062, 0.16823577880859375, 0.17390060424804688, 0.1795654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 30.0, 27.0, 69.0, 79.0, 102.0, 191.0, 155.0, 88.0, 70.0, 39.0, 30.0, 19.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2024305760860443e-05, -1.1472031474113464e-05, -1.0919757187366486e-05, -1.0367482900619507e-05, -9.815208613872528e-06, -9.26293432712555e-06, -8.71066004037857e-06, -8.158385753631592e-06, -7.606111466884613e-06, -7.053837180137634e-06, -6.5015628933906555e-06, -5.949288606643677e-06, -5.397014319896698e-06, -4.844740033149719e-06, -4.2924657464027405e-06, -3.7401914596557617e-06, -3.187917172908783e-06, -2.635642886161804e-06, -2.0833685994148254e-06, -1.5310943126678467e-06, -9.78820025920868e-07, -4.2654573917388916e-07, 1.257285475730896e-07, 6.780028343200684e-07, 1.2302771210670471e-06, 1.7825514078140259e-06, 2.3348256945610046e-06, 2.8870999813079834e-06, 3.439374268054962e-06, 3.991648554801941e-06, 4.54392284154892e-06, 5.0961971282958984e-06, 5.648471415042877e-06, 6.200745701789856e-06, 6.753019988536835e-06, 7.3052942752838135e-06, 7.857568562030792e-06, 8.409842848777771e-06, 8.96211713552475e-06, 9.514391422271729e-06, 1.0066665709018707e-05, 1.0618939995765686e-05, 1.1171214282512665e-05, 1.1723488569259644e-05, 1.2275762856006622e-05, 1.2828037142753601e-05, 1.338031142950058e-05, 1.3932585716247559e-05, 1.4484860002994537e-05, 1.5037134289741516e-05, 1.5589408576488495e-05, 1.6141682863235474e-05, 1.6693957149982452e-05, 1.724623143672943e-05, 1.779850572347641e-05, 1.835078001022339e-05, 1.8903054296970367e-05, 1.9455328583717346e-05, 2.0007602870464325e-05, 2.0559877157211304e-05, 2.1112151443958282e-05, 2.166442573070526e-05, 2.221670001745224e-05, 2.276897430419922e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 21.0, 40.0, 60.0, 110.0, 210.0, 425.0, 826.0, 1726.0, 4588.0, 19135.0, 193150.0, 753078.0, 60098.0, 9558.0, 2974.0, 1238.0, 609.0, 338.0, 146.0, 75.0, 53.0, 29.0, 10.0, 15.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.151336669921875, -0.14678955078125, -0.142242431640625, -0.1376953125, -0.133148193359375, -0.12860107421875, -0.124053955078125, -0.1195068359375, -0.114959716796875, -0.11041259765625, -0.105865478515625, -0.101318359375, -0.096771240234375, -0.09222412109375, -0.087677001953125, -0.0831298828125, -0.078582763671875, -0.07403564453125, -0.069488525390625, -0.06494140625, -0.060394287109375, -0.05584716796875, -0.051300048828125, -0.0467529296875, -0.042205810546875, -0.03765869140625, -0.033111572265625, -0.028564453125, -0.024017333984375, -0.01947021484375, -0.014923095703125, -0.0103759765625, -0.005828857421875, -0.00128173828125, 0.003265380859375, 0.0078125, 0.012359619140625, 0.01690673828125, 0.021453857421875, 0.0260009765625, 0.030548095703125, 0.03509521484375, 0.039642333984375, 0.044189453125, 0.048736572265625, 0.05328369140625, 0.057830810546875, 0.0623779296875, 0.066925048828125, 0.07147216796875, 0.076019287109375, 0.08056640625, 0.085113525390625, 0.08966064453125, 0.094207763671875, 0.0987548828125, 0.103302001953125, 0.10784912109375, 0.112396240234375, 0.116943359375, 0.121490478515625, 0.12603759765625, 0.130584716796875, 0.1351318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 4.0, 10.0, 13.0, 10.0, 29.0, 51.0, 73.0, 104.0, 118.0, 178.0, 128.0, 95.0, 51.0, 41.0, 25.0, 18.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.062290191650390625, -0.06024932861328125, -0.058208465576171875, -0.0561676025390625, -0.054126739501953125, -0.05208587646484375, -0.050045013427734375, -0.048004150390625, -0.045963287353515625, -0.04392242431640625, -0.041881561279296875, -0.0398406982421875, -0.037799835205078125, -0.03575897216796875, -0.033718109130859375, -0.03167724609375, -0.029636383056640625, -0.02759552001953125, -0.025554656982421875, -0.0235137939453125, -0.021472930908203125, -0.01943206787109375, -0.017391204833984375, -0.015350341796875, -0.013309478759765625, -0.01126861572265625, -0.009227752685546875, -0.0071868896484375, -0.005146026611328125, -0.00310516357421875, -0.001064300537109375, 0.0009765625, 0.003017425537109375, 0.00505828857421875, 0.007099151611328125, 0.0091400146484375, 0.011180877685546875, 0.01322174072265625, 0.015262603759765625, 0.017303466796875, 0.019344329833984375, 0.02138519287109375, 0.023426055908203125, 0.0254669189453125, 0.027507781982421875, 0.02954864501953125, 0.031589508056640625, 0.03363037109375, 0.035671234130859375, 0.03771209716796875, 0.039752960205078125, 0.0417938232421875, 0.043834686279296875, 0.04587554931640625, 0.047916412353515625, 0.049957275390625, 0.051998138427734375, 0.05403900146484375, 0.056079864501953125, 0.0581207275390625, 0.060161590576171875, 0.06220245361328125, 0.06424331665039062, 0.0662841796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 112.0, 500.0, 333.0, 45.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33184677362442017, -0.2141825258731842, -0.09651826322078705, 0.021145999431610107, 0.13881024718284607, 0.25647449493408203, 0.3741387724876404, 0.49180299043655396, 0.6094672679901123, 0.7271315455436707, 0.8447957634925842, 0.9624600410461426, 1.0801242589950562, 1.1977884769439697, 1.3154528141021729, 1.4331170320510864, 1.55078125, 1.6684454679489136, 1.7861098051071167, 1.9037740230560303, 2.0214383602142334, 2.1391024589538574, 2.2567667961120605, 2.3744311332702637, 2.492095470428467, 2.60975980758667, 2.727423906326294, 2.845088243484497, 2.9627525806427, 3.080416679382324, 3.1980810165405273, 3.3157453536987305, 3.4334094524383545, 3.5510737895965576, 3.6687378883361816, 3.7864022254943848, 3.904066562652588, 4.021730899810791, 4.139394760131836, 4.257059097290039, 4.374723434448242, 4.492387771606445, 4.610052108764648, 4.727716445922852, 4.8453803062438965, 4.9630446434021, 5.080708980560303, 5.198373317718506, 5.316037654876709, 5.433701992034912, 5.551366329193115, 5.66903018951416, 5.786694526672363, 5.904358863830566, 6.0220232009887695, 6.139687538146973, 6.257351398468018, 6.375015735626221, 6.492680072784424, 6.610343933105469, 6.728008270263672, 6.845672607421875, 6.963336944580078, 7.081001281738281, 7.198665618896484]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 7.0, 2.0, 5.0, 9.0, 10.0, 24.0, 17.0, 14.0, 13.0, 21.0, 23.0, 26.0, 38.0, 26.0, 38.0, 33.0, 41.0, 48.0, 49.0, 40.0, 37.0, 36.0, 47.0, 42.0, 42.0, 37.0, 28.0, 25.0, 33.0, 34.0, 20.0, 24.0, 11.0, 18.0, 17.0, 13.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5970219373703003, -0.5782413482666016, -0.5594608187675476, -0.5406802296638489, -0.5218996405601501, -0.5031190514564514, -0.48433852195739746, -0.46555793285369873, -0.44677734375, -0.42799678444862366, -0.4092161953449249, -0.3904356360435486, -0.37165504693984985, -0.3528744876384735, -0.33409392833709717, -0.31531333923339844, -0.2965327799320221, -0.27775222063064575, -0.258971631526947, -0.24019107222557068, -0.22141048312187195, -0.2026299238204956, -0.18384934961795807, -0.16506877541542053, -0.146288201212883, -0.12750762701034546, -0.10872705280780792, -0.08994648605585098, -0.07116591185331345, -0.05238533765077591, -0.03360477089881897, -0.014824196696281433, 0.0039563775062561035, 0.02273694984614849, 0.04151752218604088, 0.060298092663288116, 0.07907866686582565, 0.09785924106836319, 0.11663980782032013, 0.13542038202285767, 0.1542009562253952, 0.17298153042793274, 0.19176210463047028, 0.2105426788330078, 0.22932323813438416, 0.24810382723808289, 0.26688438653945923, 0.28566497564315796, 0.3044455349445343, 0.32322609424591064, 0.3420066833496094, 0.3607872426509857, 0.37956783175468445, 0.3983483910560608, 0.4171289801597595, 0.43590953946113586, 0.4546900987625122, 0.47347065806388855, 0.4922512471675873, 0.5110318064689636, 0.5298123955726624, 0.5485929846763611, 0.567373514175415, 0.5861541032791138, 0.6049346923828125]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 7.0, 13.0, 16.0, 27.0, 31.0, 61.0, 100.0, 172.0, 319.0, 516.0, 973.0, 1792.0, 3760.0, 10696.0, 85813.0, 3086244.0, 961500.0, 29456.0, 6998.0, 2727.0, 1274.0, 713.0, 425.0, 251.0, 126.0, 90.0, 55.0, 50.0, 26.0, 21.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.4630126953125, -0.445068359375, -0.4271240234375, -0.4091796875, -0.3912353515625, -0.373291015625, -0.3553466796875, -0.33740234375, -0.3194580078125, -0.301513671875, -0.2835693359375, -0.265625, -0.2476806640625, -0.229736328125, -0.2117919921875, -0.19384765625, -0.1759033203125, -0.157958984375, -0.1400146484375, -0.1220703125, -0.1041259765625, -0.086181640625, -0.0682373046875, -0.05029296875, -0.0323486328125, -0.014404296875, 0.0035400390625, 0.021484375, 0.0394287109375, 0.057373046875, 0.0753173828125, 0.09326171875, 0.1112060546875, 0.129150390625, 0.1470947265625, 0.1650390625, 0.1829833984375, 0.200927734375, 0.2188720703125, 0.23681640625, 0.2547607421875, 0.272705078125, 0.2906494140625, 0.30859375, 0.3265380859375, 0.344482421875, 0.3624267578125, 0.38037109375, 0.3983154296875, 0.416259765625, 0.4342041015625, 0.4521484375, 0.4700927734375, 0.488037109375, 0.5059814453125, 0.52392578125, 0.5418701171875, 0.559814453125, 0.5777587890625, 0.595703125, 0.6136474609375, 0.631591796875, 0.6495361328125, 0.66748046875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 26.0, 30.0, 41.0, 34.0, 47.0, 61.0, 65.0, 68.0, 57.0, 67.0, 49.0, 47.0, 50.0, 50.0, 42.0, 37.0, 35.0, 32.0, 24.0, 16.0, 13.0, 8.0, 9.0, 15.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2706260681152344, -0.26317596435546875, -0.2557258605957031, -0.2482757568359375, -0.24082565307617188, -0.23337554931640625, -0.22592544555664062, -0.218475341796875, -0.21102523803710938, -0.20357513427734375, -0.19612503051757812, -0.1886749267578125, -0.18122482299804688, -0.17377471923828125, -0.16632461547851562, -0.15887451171875, -0.15142440795898438, -0.14397430419921875, -0.13652420043945312, -0.1290740966796875, -0.12162399291992188, -0.11417388916015625, -0.10672378540039062, -0.099273681640625, -0.09182357788085938, -0.08437347412109375, -0.07692337036132812, -0.0694732666015625, -0.062023162841796875, -0.05457305908203125, -0.047122955322265625, -0.0396728515625, -0.032222747802734375, -0.02477264404296875, -0.017322540283203125, -0.0098724365234375, -0.002422332763671875, 0.00502777099609375, 0.012477874755859375, 0.019927978515625, 0.027378082275390625, 0.03482818603515625, 0.042278289794921875, 0.0497283935546875, 0.057178497314453125, 0.06462860107421875, 0.07207870483398438, 0.07952880859375, 0.08697891235351562, 0.09442901611328125, 0.10187911987304688, 0.1093292236328125, 0.11677932739257812, 0.12422943115234375, 0.13167953491210938, 0.139129638671875, 0.14657974243164062, 0.15402984619140625, 0.16147994995117188, 0.1689300537109375, 0.17638015747070312, 0.18383026123046875, 0.19128036499023438, 0.19873046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 4.0, 6.0, 8.0, 6.0, 9.0, 8.0, 16.0, 23.0, 30.0, 38.0, 66.0, 92.0, 202.0, 407.0, 802.0, 1862.0, 4985.0, 17688.0, 124414.0, 3458518.0, 535635.0, 36028.0, 8119.0, 2907.0, 1196.0, 536.0, 270.0, 141.0, 79.0, 49.0, 38.0, 18.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.478515625, -0.4629364013671875, -0.447357177734375, -0.4317779541015625, -0.41619873046875, -0.4006195068359375, -0.385040283203125, -0.3694610595703125, -0.3538818359375, -0.3383026123046875, -0.322723388671875, -0.3071441650390625, -0.29156494140625, -0.2759857177734375, -0.260406494140625, -0.2448272705078125, -0.229248046875, -0.2136688232421875, -0.198089599609375, -0.1825103759765625, -0.16693115234375, -0.1513519287109375, -0.135772705078125, -0.1201934814453125, -0.1046142578125, -0.0890350341796875, -0.073455810546875, -0.0578765869140625, -0.04229736328125, -0.0267181396484375, -0.011138916015625, 0.0044403076171875, 0.02001953125, 0.0355987548828125, 0.051177978515625, 0.0667572021484375, 0.08233642578125, 0.0979156494140625, 0.113494873046875, 0.1290740966796875, 0.1446533203125, 0.1602325439453125, 0.175811767578125, 0.1913909912109375, 0.20697021484375, 0.2225494384765625, 0.238128662109375, 0.2537078857421875, 0.269287109375, 0.2848663330078125, 0.300445556640625, 0.3160247802734375, 0.33160400390625, 0.3471832275390625, 0.362762451171875, 0.3783416748046875, 0.3939208984375, 0.4095001220703125, 0.425079345703125, 0.4406585693359375, 0.45623779296875, 0.4718170166015625, 0.487396240234375, 0.5029754638671875, 0.5185546875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 12.0, 6.0, 19.0, 22.0, 38.0, 44.0, 69.0, 124.0, 188.0, 284.0, 484.0, 588.0, 653.0, 509.0, 355.0, 219.0, 131.0, 87.0, 56.0, 44.0, 26.0, 18.0, 14.0, 14.0, 7.0, 10.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.12042236328125, -0.11680030822753906, -0.11317825317382812, -0.10955619812011719, -0.10593414306640625, -0.10231208801269531, -0.09869003295898438, -0.09506797790527344, -0.0914459228515625, -0.08782386779785156, -0.08420181274414062, -0.08057975769042969, -0.07695770263671875, -0.07333564758300781, -0.06971359252929688, -0.06609153747558594, -0.062469482421875, -0.05884742736816406, -0.055225372314453125, -0.05160331726074219, -0.04798126220703125, -0.04435920715332031, -0.040737152099609375, -0.03711509704589844, -0.0334930419921875, -0.029870986938476562, -0.026248931884765625, -0.022626876831054688, -0.01900482177734375, -0.015382766723632812, -0.011760711669921875, -0.008138656616210938, -0.0045166015625, -0.0008945465087890625, 0.002727508544921875, 0.0063495635986328125, 0.00997161865234375, 0.013593673706054688, 0.017215728759765625, 0.020837783813476562, 0.0244598388671875, 0.028081893920898438, 0.031703948974609375, 0.03532600402832031, 0.03894805908203125, 0.04257011413574219, 0.046192169189453125, 0.04981422424316406, 0.053436279296875, 0.05705833435058594, 0.060680389404296875, 0.06430244445800781, 0.06792449951171875, 0.07154655456542969, 0.07516860961914062, 0.07879066467285156, 0.0824127197265625, 0.08603477478027344, 0.08965682983398438, 0.09327888488769531, 0.09690093994140625, 0.10052299499511719, 0.10414505004882812, 0.10776710510253906, 0.11138916015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 12.0, 3.0, 12.0, 13.0, 20.0, 21.0, 17.0, 23.0, 42.0, 36.0, 60.0, 67.0, 66.0, 67.0, 87.0, 72.0, 73.0, 50.0, 62.0, 43.0, 30.0, 25.0, 25.0, 21.0, 13.0, 4.0, 5.0, 7.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20238716900348663, -0.19300851225852966, -0.1836298406124115, -0.17425118386745453, -0.16487252712249756, -0.1554938554763794, -0.14611519873142242, -0.13673654198646545, -0.1273578703403473, -0.11797920614480972, -0.10860054939985275, -0.09922188520431519, -0.08984322845935822, -0.08046456426382065, -0.07108590006828308, -0.06170724332332611, -0.05232858657836914, -0.04294992610812187, -0.0335712656378746, -0.024192601442337036, -0.014813940972089767, -0.005435280501842499, 0.003943383693695068, 0.013322040438652039, 0.022700704634189606, 0.032079365104436874, 0.04145802557468414, 0.05083668977022171, 0.06021535024046898, 0.06959401071071625, 0.07897267490625381, 0.08835133165121078, 0.09773001074790955, 0.10710867494344711, 0.11648733168840408, 0.12586599588394165, 0.13524465262889862, 0.1446233093738556, 0.15400198101997375, 0.16338063776493073, 0.1727592945098877, 0.18213795125484467, 0.19151662290096283, 0.2008952796459198, 0.21027393639087677, 0.21965259313583374, 0.2290312647819519, 0.23840992152690887, 0.24778859317302704, 0.257167249917984, 0.2665459215641022, 0.27592456340789795, 0.2853032350540161, 0.2946819067001343, 0.30406057834625244, 0.3134392201900482, 0.3228178918361664, 0.33219656348228455, 0.3415752053260803, 0.3509538769721985, 0.36033254861831665, 0.3697111904621124, 0.3790898621082306, 0.38846850395202637, 0.39784717559814453]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 9.0, 9.0, 4.0, 12.0, 10.0, 18.0, 18.0, 19.0, 25.0, 30.0, 36.0, 30.0, 36.0, 33.0, 35.0, 34.0, 44.0, 40.0, 33.0, 41.0, 44.0, 51.0, 37.0, 32.0, 33.0, 37.0, 39.0, 39.0, 18.0, 19.0, 17.0, 19.0, 18.0, 25.0, 12.0, 13.0, 5.0, 8.0, 11.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2659854292869568, -0.25872915983200073, -0.2514728903770447, -0.24421659111976624, -0.23696032166481018, -0.22970405220985413, -0.22244776785373688, -0.21519148349761963, -0.20793521404266357, -0.20067894458770752, -0.19342266023159027, -0.18616637587547302, -0.17891010642051697, -0.1716538369655609, -0.16439755260944366, -0.15714126825332642, -0.14988499879837036, -0.1426287293434143, -0.13537244498729706, -0.1281161606311798, -0.12085989117622375, -0.1136036142706871, -0.10634733736515045, -0.0990910604596138, -0.09183478355407715, -0.0845785066485405, -0.07732222974300385, -0.0700659528374672, -0.06280967593193054, -0.05555339902639389, -0.04829712212085724, -0.04104084521532059, -0.033784568309783936, -0.026528291404247284, -0.019272014498710632, -0.01201573759317398, -0.004759460687637329, 0.0024968162178993225, 0.009753093123435974, 0.017009370028972626, 0.024265646934509277, 0.03152192384004593, 0.03877820074558258, 0.04603447765111923, 0.053290754556655884, 0.060547031462192535, 0.06780330836772919, 0.07505958527326584, 0.08231586217880249, 0.08957213908433914, 0.0968284159898758, 0.10408469289541245, 0.1113409698009491, 0.11859724670648575, 0.1258535236120224, 0.13310980796813965, 0.1403660774230957, 0.14762234687805176, 0.154878631234169, 0.16213491559028625, 0.1693911850452423, 0.17664745450019836, 0.1839037388563156, 0.19116002321243286, 0.19841629266738892]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 19.0, 18.0, 34.0, 52.0, 90.0, 129.0, 179.0, 304.0, 418.0, 773.0, 1115.0, 1853.0, 3273.0, 5801.0, 11487.0, 28428.0, 114740.0, 574439.0, 229119.0, 43601.0, 15247.0, 7480.0, 3943.0, 2185.0, 1382.0, 866.0, 543.0, 365.0, 225.0, 121.0, 95.0, 71.0, 51.0, 29.0, 20.0, 17.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08251953125, -0.07953834533691406, -0.07655715942382812, -0.07357597351074219, -0.07059478759765625, -0.06761360168457031, -0.06463241577148438, -0.06165122985839844, -0.0586700439453125, -0.05568885803222656, -0.052707672119140625, -0.04972648620605469, -0.04674530029296875, -0.04376411437988281, -0.040782928466796875, -0.03780174255371094, -0.034820556640625, -0.03183937072753906, -0.028858184814453125, -0.025876998901367188, -0.02289581298828125, -0.019914627075195312, -0.016933441162109375, -0.013952255249023438, -0.0109710693359375, -0.007989883422851562, -0.005008697509765625, -0.0020275115966796875, 0.00095367431640625, 0.0039348602294921875, 0.006916046142578125, 0.009897232055664062, 0.01287841796875, 0.015859603881835938, 0.018840789794921875, 0.021821975708007812, 0.02480316162109375, 0.027784347534179688, 0.030765533447265625, 0.03374671936035156, 0.0367279052734375, 0.03970909118652344, 0.042690277099609375, 0.04567146301269531, 0.04865264892578125, 0.05163383483886719, 0.054615020751953125, 0.05759620666503906, 0.060577392578125, 0.06355857849121094, 0.06653976440429688, 0.06952095031738281, 0.07250213623046875, 0.07548332214355469, 0.07846450805664062, 0.08144569396972656, 0.0844268798828125, 0.08740806579589844, 0.09038925170898438, 0.09337043762207031, 0.09635162353515625, 0.09933280944824219, 0.10231399536132812, 0.10529518127441406, 0.1082763671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 14.0, 15.0, 5.0, 5.0, 19.0, 21.0, 22.0, 26.0, 30.0, 35.0, 32.0, 46.0, 43.0, 41.0, 45.0, 41.0, 46.0, 35.0, 40.0, 41.0, 49.0, 41.0, 29.0, 28.0, 43.0, 44.0, 15.0, 22.0, 19.0, 17.0, 19.0, 18.0, 9.0, 13.0, 9.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.19140625, -0.1866168975830078, -0.18182754516601562, -0.17703819274902344, -0.17224884033203125, -0.16745948791503906, -0.16267013549804688, -0.1578807830810547, -0.1530914306640625, -0.1483020782470703, -0.14351272583007812, -0.13872337341308594, -0.13393402099609375, -0.12914466857910156, -0.12435531616210938, -0.11956596374511719, -0.114776611328125, -0.10998725891113281, -0.10519790649414062, -0.10040855407714844, -0.09561920166015625, -0.09082984924316406, -0.08604049682617188, -0.08125114440917969, -0.0764617919921875, -0.07167243957519531, -0.06688308715820312, -0.06209373474121094, -0.05730438232421875, -0.05251502990722656, -0.047725677490234375, -0.04293632507324219, -0.03814697265625, -0.03335762023925781, -0.028568267822265625, -0.023778915405273438, -0.01898956298828125, -0.014200210571289062, -0.009410858154296875, -0.0046215057373046875, 0.0001678466796875, 0.0049571990966796875, 0.009746551513671875, 0.014535903930664062, 0.01932525634765625, 0.024114608764648438, 0.028903961181640625, 0.03369331359863281, 0.038482666015625, 0.04327201843261719, 0.048061370849609375, 0.05285072326660156, 0.05764007568359375, 0.06242942810058594, 0.06721878051757812, 0.07200813293457031, 0.0767974853515625, 0.08158683776855469, 0.08637619018554688, 0.09116554260253906, 0.09595489501953125, 0.10074424743652344, 0.10553359985351562, 0.11032295227050781, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 13.0, 21.0, 22.0, 24.0, 57.0, 99.0, 171.0, 328.0, 565.0, 1197.0, 2599.0, 5967.0, 15438.0, 49752.0, 223505.0, 546030.0, 145001.0, 36168.0, 12377.0, 4911.0, 2184.0, 985.0, 497.0, 262.0, 161.0, 87.0, 47.0, 30.0, 25.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08016490936279297, -0.07768821716308594, -0.0752115249633789, -0.07273483276367188, -0.07025814056396484, -0.06778144836425781, -0.06530475616455078, -0.06282806396484375, -0.06035137176513672, -0.05787467956542969, -0.055397987365722656, -0.052921295166015625, -0.050444602966308594, -0.04796791076660156, -0.04549121856689453, -0.0430145263671875, -0.04053783416748047, -0.03806114196777344, -0.035584449768066406, -0.033107757568359375, -0.030631065368652344, -0.028154373168945312, -0.02567768096923828, -0.02320098876953125, -0.02072429656982422, -0.018247604370117188, -0.015770912170410156, -0.013294219970703125, -0.010817527770996094, -0.008340835571289062, -0.005864143371582031, -0.003387451171875, -0.0009107589721679688, 0.0015659332275390625, 0.004042625427246094, 0.006519317626953125, 0.008996009826660156, 0.011472702026367188, 0.013949394226074219, 0.01642608642578125, 0.01890277862548828, 0.021379470825195312, 0.023856163024902344, 0.026332855224609375, 0.028809547424316406, 0.03128623962402344, 0.03376293182373047, 0.0362396240234375, 0.03871631622314453, 0.04119300842285156, 0.043669700622558594, 0.046146392822265625, 0.048623085021972656, 0.05109977722167969, 0.05357646942138672, 0.05605316162109375, 0.05852985382080078, 0.06100654602050781, 0.06348323822021484, 0.06595993041992188, 0.0684366226196289, 0.07091331481933594, 0.07339000701904297, 0.07586669921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 10.0, 20.0, 22.0, 15.0, 32.0, 45.0, 30.0, 37.0, 35.0, 47.0, 44.0, 48.0, 56.0, 42.0, 54.0, 44.0, 35.0, 47.0, 34.0, 40.0, 31.0, 34.0, 31.0, 19.0, 24.0, 29.0, 10.0, 18.0, 4.0, 7.0, 4.0, 3.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3443489074707031, -0.33225250244140625, -0.3201560974121094, -0.3080596923828125, -0.2959632873535156, -0.28386688232421875, -0.2717704772949219, -0.259674072265625, -0.24757766723632812, -0.23548126220703125, -0.22338485717773438, -0.2112884521484375, -0.19919204711914062, -0.18709564208984375, -0.17499923706054688, -0.16290283203125, -0.15080642700195312, -0.13871002197265625, -0.12661361694335938, -0.1145172119140625, -0.10242080688476562, -0.09032440185546875, -0.07822799682617188, -0.066131591796875, -0.054035186767578125, -0.04193878173828125, -0.029842376708984375, -0.0177459716796875, -0.005649566650390625, 0.00644683837890625, 0.018543243408203125, 0.0306396484375, 0.042736053466796875, 0.05483245849609375, 0.06692886352539062, 0.0790252685546875, 0.09112167358398438, 0.10321807861328125, 0.11531448364257812, 0.127410888671875, 0.13950729370117188, 0.15160369873046875, 0.16370010375976562, 0.1757965087890625, 0.18789291381835938, 0.19998931884765625, 0.21208572387695312, 0.22418212890625, 0.23627853393554688, 0.24837493896484375, 0.2604713439941406, 0.2725677490234375, 0.2846641540527344, 0.29676055908203125, 0.3088569641113281, 0.320953369140625, 0.3330497741699219, 0.34514617919921875, 0.3572425842285156, 0.3693389892578125, 0.3814353942871094, 0.39353179931640625, 0.4056282043457031, 0.417724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 13.0, 16.0, 22.0, 22.0, 30.0, 38.0, 68.0, 129.0, 193.0, 344.0, 568.0, 1093.0, 2389.0, 5629.0, 16717.0, 75272.0, 487436.0, 380813.0, 54924.0, 13451.0, 4867.0, 2117.0, 1002.0, 567.0, 292.0, 180.0, 132.0, 63.0, 54.0, 33.0, 23.0, 13.0, 13.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035400390625, -0.03435659408569336, -0.03331279754638672, -0.03226900100708008, -0.031225204467773438, -0.030181407928466797, -0.029137611389160156, -0.028093814849853516, -0.027050018310546875, -0.026006221771240234, -0.024962425231933594, -0.023918628692626953, -0.022874832153320312, -0.021831035614013672, -0.02078723907470703, -0.01974344253540039, -0.01869964599609375, -0.01765584945678711, -0.01661205291748047, -0.015568256378173828, -0.014524459838867188, -0.013480663299560547, -0.012436866760253906, -0.011393070220947266, -0.010349273681640625, -0.009305477142333984, -0.008261680603027344, -0.007217884063720703, -0.0061740875244140625, -0.005130290985107422, -0.004086494445800781, -0.0030426979064941406, -0.0019989013671875, -0.0009551048278808594, 8.869171142578125e-05, 0.0011324882507324219, 0.0021762847900390625, 0.003220081329345703, 0.004263877868652344, 0.005307674407958984, 0.006351470947265625, 0.007395267486572266, 0.008439064025878906, 0.009482860565185547, 0.010526657104492188, 0.011570453643798828, 0.012614250183105469, 0.01365804672241211, 0.01470184326171875, 0.01574563980102539, 0.01678943634033203, 0.017833232879638672, 0.018877029418945312, 0.019920825958251953, 0.020964622497558594, 0.022008419036865234, 0.023052215576171875, 0.024096012115478516, 0.025139808654785156, 0.026183605194091797, 0.027227401733398438, 0.028271198272705078, 0.02931499481201172, 0.03035879135131836, 0.031402587890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 20.0, 22.0, 35.0, 46.0, 54.0, 106.0, 107.0, 117.0, 113.0, 92.0, 100.0, 53.0, 46.0, 19.0, 11.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1427327990531921e-05, -1.0814517736434937e-05, -1.0201707482337952e-05, -9.588897228240967e-06, -8.976086974143982e-06, -8.363276720046997e-06, -7.750466465950012e-06, -7.137656211853027e-06, -6.5248459577560425e-06, -5.912035703659058e-06, -5.299225449562073e-06, -4.686415195465088e-06, -4.073604941368103e-06, -3.460794687271118e-06, -2.8479844331741333e-06, -2.2351741790771484e-06, -1.6223639249801636e-06, -1.0095536708831787e-06, -3.9674341678619385e-07, 2.1606683731079102e-07, 8.288770914077759e-07, 1.4416873455047607e-06, 2.0544975996017456e-06, 2.6673078536987305e-06, 3.2801181077957153e-06, 3.8929283618927e-06, 4.505738615989685e-06, 5.11854887008667e-06, 5.731359124183655e-06, 6.34416937828064e-06, 6.9569796323776245e-06, 7.569789886474609e-06, 8.182600140571594e-06, 8.795410394668579e-06, 9.408220648765564e-06, 1.0021030902862549e-05, 1.0633841156959534e-05, 1.1246651411056519e-05, 1.1859461665153503e-05, 1.2472271919250488e-05, 1.3085082173347473e-05, 1.3697892427444458e-05, 1.4310702681541443e-05, 1.4923512935638428e-05, 1.5536323189735413e-05, 1.6149133443832397e-05, 1.6761943697929382e-05, 1.7374753952026367e-05, 1.7987564206123352e-05, 1.8600374460220337e-05, 1.9213184714317322e-05, 1.9825994968414307e-05, 2.043880522251129e-05, 2.1051615476608276e-05, 2.166442573070526e-05, 2.2277235984802246e-05, 2.289004623889923e-05, 2.3502856492996216e-05, 2.41156667470932e-05, 2.4728477001190186e-05, 2.534128725528717e-05, 2.5954097509384155e-05, 2.656690776348114e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 19.0, 19.0, 43.0, 44.0, 60.0, 89.0, 105.0, 199.0, 282.0, 348.0, 500.0, 744.0, 1144.0, 1693.0, 2571.0, 4011.0, 6581.0, 11892.0, 22024.0, 45239.0, 98604.0, 201733.0, 274090.0, 190721.0, 92569.0, 42840.0, 21263.0, 11322.0, 6342.0, 3860.0, 2412.0, 1595.0, 1064.0, 667.0, 478.0, 357.0, 262.0, 177.0, 137.0, 109.0, 86.0, 66.0, 38.0, 35.0, 31.0, 17.0, 15.0, 9.0, 6.0, 8.0, 7.0, 1.0, 0.0, 1.0], "bins": [-0.0149078369140625, -0.014448404312133789, -0.013988971710205078, -0.013529539108276367, -0.013070106506347656, -0.012610673904418945, -0.012151241302490234, -0.011691808700561523, -0.011232376098632812, -0.010772943496704102, -0.01031351089477539, -0.00985407829284668, -0.009394645690917969, -0.008935213088989258, -0.008475780487060547, -0.008016347885131836, -0.007556915283203125, -0.007097482681274414, -0.006638050079345703, -0.006178617477416992, -0.005719184875488281, -0.00525975227355957, -0.004800319671630859, -0.0043408870697021484, -0.0038814544677734375, -0.0034220218658447266, -0.0029625892639160156, -0.0025031566619873047, -0.0020437240600585938, -0.0015842914581298828, -0.0011248588562011719, -0.0006654262542724609, -0.00020599365234375, 0.00025343894958496094, 0.0007128715515136719, 0.0011723041534423828, 0.0016317367553710938, 0.0020911693572998047, 0.0025506019592285156, 0.0030100345611572266, 0.0034694671630859375, 0.0039288997650146484, 0.004388332366943359, 0.00484776496887207, 0.005307197570800781, 0.005766630172729492, 0.006226062774658203, 0.006685495376586914, 0.007144927978515625, 0.007604360580444336, 0.008063793182373047, 0.008523225784301758, 0.008982658386230469, 0.00944209098815918, 0.00990152359008789, 0.010360956192016602, 0.010820388793945312, 0.011279821395874023, 0.011739253997802734, 0.012198686599731445, 0.012658119201660156, 0.013117551803588867, 0.013576984405517578, 0.014036417007446289, 0.014495849609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 13.0, 16.0, 16.0, 23.0, 22.0, 39.0, 43.0, 59.0, 57.0, 67.0, 66.0, 67.0, 56.0, 65.0, 64.0, 41.0, 46.0, 35.0, 28.0, 29.0, 20.0, 19.0, 12.0, 9.0, 9.0, 12.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006160736083984375, -0.005951225757598877, -0.005741715431213379, -0.005532205104827881, -0.005322694778442383, -0.005113184452056885, -0.004903674125671387, -0.004694163799285889, -0.004484653472900391, -0.004275143146514893, -0.0040656328201293945, -0.0038561224937438965, -0.0036466121673583984, -0.0034371018409729004, -0.0032275915145874023, -0.0030180811882019043, -0.0028085708618164062, -0.002599060535430908, -0.00238955020904541, -0.002180039882659912, -0.001970529556274414, -0.001761019229888916, -0.001551508903503418, -0.00134199857711792, -0.0011324882507324219, -0.0009229779243469238, -0.0007134675979614258, -0.0005039572715759277, -0.0002944469451904297, -8.493661880493164e-05, 0.0001245737075805664, 0.00033408403396606445, 0.0005435943603515625, 0.0007531046867370605, 0.0009626150131225586, 0.0011721253395080566, 0.0013816356658935547, 0.0015911459922790527, 0.0018006563186645508, 0.002010166645050049, 0.002219676971435547, 0.002429187297821045, 0.002638697624206543, 0.002848207950592041, 0.003057718276977539, 0.003267228603363037, 0.003476738929748535, 0.003686249256134033, 0.0038957595825195312, 0.004105269908905029, 0.004314780235290527, 0.004524290561676025, 0.0047338008880615234, 0.0049433112144470215, 0.0051528215408325195, 0.005362331867218018, 0.005571842193603516, 0.005781352519989014, 0.005990862846374512, 0.00620037317276001, 0.006409883499145508, 0.006619393825531006, 0.006828904151916504, 0.007038414478302002, 0.0072479248046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 15.0, 39.0, 38.0, 34.0, 70.0, 73.0, 80.0, 93.0, 78.0, 96.0, 72.0, 75.0, 50.0, 34.0, 34.0, 20.0, 12.0, 13.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22945018112659454, -0.2225847691297531, -0.21571935713291168, -0.20885394513607025, -0.20198851823806763, -0.1951231062412262, -0.18825769424438477, -0.18139228224754333, -0.1745268702507019, -0.16766145825386047, -0.16079604625701904, -0.1539306342601776, -0.14706522226333618, -0.14019981026649475, -0.13333438336849213, -0.1264689713716507, -0.11960355937480927, -0.11273814737796783, -0.1058727353811264, -0.09900731593370438, -0.09214190393686295, -0.08527649194002151, -0.07841107249259949, -0.07154566049575806, -0.06468024849891663, -0.057814836502075195, -0.050949420779943466, -0.04408400505781174, -0.037218593060970306, -0.030353181064128876, -0.023487765341997147, -0.016622349619865417, -0.00975695252418518, -0.0028915386646986008, 0.003973875194787979, 0.010839289054274559, 0.01770470291376114, 0.02457011491060257, 0.0314355306327343, 0.03830094635486603, 0.04516635835170746, 0.05203177034854889, 0.05889718607068062, 0.06576260179281235, 0.07262801378965378, 0.07949342578649521, 0.08635884523391724, 0.09322425723075867, 0.1000896692276001, 0.10695508122444153, 0.11382049322128296, 0.12068591266870499, 0.12755131721496582, 0.13441672921180725, 0.14128215610980988, 0.1481475681066513, 0.15501298010349274, 0.16187839210033417, 0.1687438040971756, 0.17560921609401703, 0.18247464299201965, 0.18934005498886108, 0.19620546698570251, 0.20307087898254395, 0.20993629097938538]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 18.0, 9.0, 10.0, 10.0, 10.0, 30.0, 34.0, 25.0, 29.0, 36.0, 32.0, 36.0, 36.0, 36.0, 42.0, 37.0, 36.0, 40.0, 47.0, 36.0, 44.0, 36.0, 46.0, 35.0, 38.0, 31.0, 21.0, 17.0, 18.0, 17.0, 28.0, 15.0, 15.0, 8.0, 11.0, 6.0, 3.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16031111776828766, -0.15586137771606445, -0.15141162276268005, -0.14696188271045685, -0.14251214265823364, -0.13806240260601044, -0.13361266255378723, -0.12916290760040283, -0.12471316754817963, -0.12026342749595642, -0.11581367999315262, -0.11136393249034882, -0.10691419243812561, -0.1024644523859024, -0.0980147048830986, -0.0935649573802948, -0.0891152173280716, -0.08466547727584839, -0.08021572977304459, -0.07576598227024078, -0.07131624221801758, -0.06686650216579437, -0.06241675466299057, -0.057967010885477066, -0.05351726710796356, -0.04906752333045006, -0.044617779552936554, -0.04016803577542305, -0.035718291997909546, -0.03126854822039604, -0.026818804442882538, -0.022369060665369034, -0.017919331789016724, -0.01346958801150322, -0.009019844233989716, -0.0045701004564762115, -0.00012035667896270752, 0.0043293870985507965, 0.0087791308760643, 0.013228874653577805, 0.01767861843109131, 0.022128362208604813, 0.026578105986118317, 0.03102784976363182, 0.035477593541145325, 0.03992733731865883, 0.04437708109617233, 0.04882682487368584, 0.05327656865119934, 0.057726312428712845, 0.06217605620622635, 0.06662580370903015, 0.07107554376125336, 0.07552528381347656, 0.07997503131628036, 0.08442477881908417, 0.08887451887130737, 0.09332425892353058, 0.09777400642633438, 0.10222375392913818, 0.10667349398136139, 0.1111232340335846, 0.1155729815363884, 0.1200227290391922, 0.1244724690914154]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 14.0, 14.0, 17.0, 30.0, 37.0, 62.0, 100.0, 154.0, 268.0, 411.0, 744.0, 1389.0, 2810.0, 6139.0, 14752.0, 38698.0, 118393.0, 378727.0, 329570.0, 99067.0, 33253.0, 12937.0, 5363.0, 2515.0, 1335.0, 715.0, 382.0, 244.0, 135.0, 79.0, 50.0, 37.0, 32.0, 25.0, 12.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28386878967285156, -0.2755012512207031, -0.2671337127685547, -0.25876617431640625, -0.2503986358642578, -0.24203109741210938, -0.23366355895996094, -0.2252960205078125, -0.21692848205566406, -0.20856094360351562, -0.2001934051513672, -0.19182586669921875, -0.1834583282470703, -0.17509078979492188, -0.16672325134277344, -0.158355712890625, -0.14998817443847656, -0.14162063598632812, -0.1332530975341797, -0.12488555908203125, -0.11651802062988281, -0.10815048217773438, -0.09978294372558594, -0.0914154052734375, -0.08304786682128906, -0.07468032836914062, -0.06631278991699219, -0.05794525146484375, -0.04957771301269531, -0.041210174560546875, -0.03284263610839844, -0.02447509765625, -0.016107559204101562, -0.007740020751953125, 0.0006275177001953125, 0.00899505615234375, 0.017362594604492188, 0.025730133056640625, 0.03409767150878906, 0.0424652099609375, 0.05083274841308594, 0.059200286865234375, 0.06756782531738281, 0.07593536376953125, 0.08430290222167969, 0.09267044067382812, 0.10103797912597656, 0.109405517578125, 0.11777305603027344, 0.12614059448242188, 0.1345081329345703, 0.14287567138671875, 0.1512432098388672, 0.15961074829101562, 0.16797828674316406, 0.1763458251953125, 0.18471336364746094, 0.19308090209960938, 0.2014484405517578, 0.20981597900390625, 0.2181835174560547, 0.22655105590820312, 0.23491859436035156, 0.2432861328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 12.0, 3.0, 7.0, 13.0, 21.0, 13.0, 21.0, 27.0, 29.0, 27.0, 38.0, 23.0, 32.0, 38.0, 44.0, 40.0, 45.0, 37.0, 39.0, 51.0, 47.0, 37.0, 40.0, 41.0, 39.0, 33.0, 26.0, 32.0, 15.0, 13.0, 17.0, 19.0, 17.0, 10.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2841796875, -0.27631568908691406, -0.2684516906738281, -0.2605876922607422, -0.25272369384765625, -0.2448596954345703, -0.23699569702148438, -0.22913169860839844, -0.2212677001953125, -0.21340370178222656, -0.20553970336914062, -0.1976757049560547, -0.18981170654296875, -0.1819477081298828, -0.17408370971679688, -0.16621971130371094, -0.158355712890625, -0.15049171447753906, -0.14262771606445312, -0.1347637176513672, -0.12689971923828125, -0.11903572082519531, -0.11117172241210938, -0.10330772399902344, -0.0954437255859375, -0.08757972717285156, -0.07971572875976562, -0.07185173034667969, -0.06398773193359375, -0.05612373352050781, -0.048259735107421875, -0.04039573669433594, -0.03253173828125, -0.024667739868164062, -0.016803741455078125, -0.008939743041992188, -0.00107574462890625, 0.0067882537841796875, 0.014652252197265625, 0.022516250610351562, 0.0303802490234375, 0.03824424743652344, 0.046108245849609375, 0.05397224426269531, 0.06183624267578125, 0.06970024108886719, 0.07756423950195312, 0.08542823791503906, 0.093292236328125, 0.10115623474121094, 0.10902023315429688, 0.11688423156738281, 0.12474822998046875, 0.1326122283935547, 0.14047622680664062, 0.14834022521972656, 0.1562042236328125, 0.16406822204589844, 0.17193222045898438, 0.1797962188720703, 0.18766021728515625, 0.1955242156982422, 0.20338821411132812, 0.21125221252441406, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 22.0, 19.0, 31.0, 45.0, 56.0, 82.0, 112.0, 156.0, 246.0, 466.0, 871.0, 1654.0, 3908.0, 10491.0, 30112.0, 97532.0, 342546.0, 389966.0, 114590.0, 35145.0, 11808.0, 4508.0, 1867.0, 879.0, 480.0, 286.0, 173.0, 120.0, 86.0, 68.0, 43.0, 27.0, 31.0, 19.0, 13.0, 18.0, 6.0, 5.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.35302734375, -0.34323883056640625, -0.3334503173828125, -0.32366180419921875, -0.313873291015625, -0.30408477783203125, -0.2942962646484375, -0.28450775146484375, -0.27471923828125, -0.26493072509765625, -0.2551422119140625, -0.24535369873046875, -0.235565185546875, -0.22577667236328125, -0.2159881591796875, -0.20619964599609375, -0.1964111328125, -0.18662261962890625, -0.1768341064453125, -0.16704559326171875, -0.157257080078125, -0.14746856689453125, -0.1376800537109375, -0.12789154052734375, -0.11810302734375, -0.10831451416015625, -0.0985260009765625, -0.08873748779296875, -0.078948974609375, -0.06916046142578125, -0.0593719482421875, -0.04958343505859375, -0.039794921875, -0.03000640869140625, -0.0202178955078125, -0.01042938232421875, -0.000640869140625, 0.00914764404296875, 0.0189361572265625, 0.02872467041015625, 0.03851318359375, 0.04830169677734375, 0.0580902099609375, 0.06787872314453125, 0.077667236328125, 0.08745574951171875, 0.0972442626953125, 0.10703277587890625, 0.1168212890625, 0.12660980224609375, 0.1363983154296875, 0.14618682861328125, 0.155975341796875, 0.16576385498046875, 0.1755523681640625, 0.18534088134765625, 0.19512939453125, 0.20491790771484375, 0.2147064208984375, 0.22449493408203125, 0.234283447265625, 0.24407196044921875, 0.2538604736328125, 0.26364898681640625, 0.2734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 8.0, 7.0, 11.0, 17.0, 15.0, 21.0, 23.0, 23.0, 31.0, 43.0, 37.0, 35.0, 42.0, 49.0, 41.0, 53.0, 41.0, 46.0, 49.0, 40.0, 49.0, 40.0, 38.0, 28.0, 27.0, 24.0, 19.0, 28.0, 19.0, 16.0, 10.0, 10.0, 11.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3027076721191406, -0.29389190673828125, -0.2850761413574219, -0.2762603759765625, -0.2674446105957031, -0.25862884521484375, -0.24981307983398438, -0.240997314453125, -0.23218154907226562, -0.22336578369140625, -0.21455001831054688, -0.2057342529296875, -0.19691848754882812, -0.18810272216796875, -0.17928695678710938, -0.17047119140625, -0.16165542602539062, -0.15283966064453125, -0.14402389526367188, -0.1352081298828125, -0.12639236450195312, -0.11757659912109375, -0.10876083374023438, -0.099945068359375, -0.09112930297851562, -0.08231353759765625, -0.07349777221679688, -0.0646820068359375, -0.055866241455078125, -0.04705047607421875, -0.038234710693359375, -0.0294189453125, -0.020603179931640625, -0.01178741455078125, -0.002971649169921875, 0.0058441162109375, 0.014659881591796875, 0.02347564697265625, 0.032291412353515625, 0.041107177734375, 0.049922943115234375, 0.05873870849609375, 0.06755447387695312, 0.0763702392578125, 0.08518600463867188, 0.09400177001953125, 0.10281753540039062, 0.11163330078125, 0.12044906616210938, 0.12926483154296875, 0.13808059692382812, 0.1468963623046875, 0.15571212768554688, 0.16452789306640625, 0.17334365844726562, 0.182159423828125, 0.19097518920898438, 0.19979095458984375, 0.20860671997070312, 0.2174224853515625, 0.22623825073242188, 0.23505401611328125, 0.24386978149414062, 0.252685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 7.0, 10.0, 22.0, 46.0, 65.0, 127.0, 245.0, 622.0, 1580.0, 5052.0, 24667.0, 224744.0, 690497.0, 83476.0, 12304.0, 3158.0, 1045.0, 445.0, 181.0, 106.0, 51.0, 36.0, 17.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0909423828125, -0.08803653717041016, -0.08513069152832031, -0.08222484588623047, -0.07931900024414062, -0.07641315460205078, -0.07350730895996094, -0.0706014633178711, -0.06769561767578125, -0.0647897720336914, -0.06188392639160156, -0.05897808074951172, -0.056072235107421875, -0.05316638946533203, -0.05026054382324219, -0.047354698181152344, -0.0444488525390625, -0.041543006896972656, -0.03863716125488281, -0.03573131561279297, -0.032825469970703125, -0.02991962432861328, -0.027013778686523438, -0.024107933044433594, -0.02120208740234375, -0.018296241760253906, -0.015390396118164062, -0.012484550476074219, -0.009578704833984375, -0.006672859191894531, -0.0037670135498046875, -0.0008611679077148438, 0.002044677734375, 0.004950523376464844, 0.007856369018554688, 0.010762214660644531, 0.013668060302734375, 0.01657390594482422, 0.019479751586914062, 0.022385597229003906, 0.02529144287109375, 0.028197288513183594, 0.031103134155273438, 0.03400897979736328, 0.036914825439453125, 0.03982067108154297, 0.04272651672363281, 0.045632362365722656, 0.0485382080078125, 0.051444053649902344, 0.05434989929199219, 0.05725574493408203, 0.060161590576171875, 0.06306743621826172, 0.06597328186035156, 0.0688791275024414, 0.07178497314453125, 0.0746908187866211, 0.07759666442871094, 0.08050251007080078, 0.08340835571289062, 0.08631420135498047, 0.08922004699707031, 0.09212589263916016, 0.09503173828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 9.0, 16.0, 12.0, 31.0, 37.0, 54.0, 55.0, 89.0, 84.0, 128.0, 132.0, 79.0, 69.0, 39.0, 45.0, 36.0, 18.0, 16.0, 6.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.404254913330078e-06, -8.063390851020813e-06, -7.722526788711548e-06, -7.381662726402283e-06, -7.040798664093018e-06, -6.6999346017837524e-06, -6.359070539474487e-06, -6.018206477165222e-06, -5.677342414855957e-06, -5.336478352546692e-06, -4.995614290237427e-06, -4.654750227928162e-06, -4.3138861656188965e-06, -3.973022103309631e-06, -3.632158041000366e-06, -3.291293978691101e-06, -2.950429916381836e-06, -2.609565854072571e-06, -2.2687017917633057e-06, -1.9278377294540405e-06, -1.5869736671447754e-06, -1.2461096048355103e-06, -9.052455425262451e-07, -5.6438148021698e-07, -2.2351741790771484e-07, 1.1734664440155029e-07, 4.5821070671081543e-07, 7.990747690200806e-07, 1.1399388313293457e-06, 1.4808028936386108e-06, 1.821666955947876e-06, 2.162531018257141e-06, 2.5033950805664062e-06, 2.8442591428756714e-06, 3.1851232051849365e-06, 3.5259872674942017e-06, 3.866851329803467e-06, 4.207715392112732e-06, 4.548579454421997e-06, 4.889443516731262e-06, 5.230307579040527e-06, 5.5711716413497925e-06, 5.912035703659058e-06, 6.252899765968323e-06, 6.593763828277588e-06, 6.934627890586853e-06, 7.275491952896118e-06, 7.616356015205383e-06, 7.957220077514648e-06, 8.298084139823914e-06, 8.638948202133179e-06, 8.979812264442444e-06, 9.320676326751709e-06, 9.661540389060974e-06, 1.000240445137024e-05, 1.0343268513679504e-05, 1.068413257598877e-05, 1.1024996638298035e-05, 1.13658607006073e-05, 1.1706724762916565e-05, 1.204758882522583e-05, 1.2388452887535095e-05, 1.272931694984436e-05, 1.3070181012153625e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 18.0, 14.0, 27.0, 33.0, 56.0, 61.0, 97.0, 135.0, 191.0, 328.0, 480.0, 814.0, 1340.0, 2402.0, 4478.0, 8968.0, 21609.0, 67303.0, 276748.0, 486810.0, 117863.0, 32819.0, 12601.0, 5998.0, 3001.0, 1646.0, 915.0, 610.0, 382.0, 257.0, 162.0, 109.0, 83.0, 53.0, 36.0, 21.0, 23.0, 12.0, 3.0, 15.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.058563232421875, -0.0566864013671875, -0.0548095703125, -0.0529327392578125, -0.051055908203125, -0.0491790771484375, -0.04730224609375, -0.0454254150390625, -0.043548583984375, -0.0416717529296875, -0.039794921875, -0.0379180908203125, -0.036041259765625, -0.0341644287109375, -0.03228759765625, -0.0304107666015625, -0.028533935546875, -0.0266571044921875, -0.0247802734375, -0.0229034423828125, -0.021026611328125, -0.0191497802734375, -0.01727294921875, -0.0153961181640625, -0.013519287109375, -0.0116424560546875, -0.009765625, -0.0078887939453125, -0.006011962890625, -0.0041351318359375, -0.00225830078125, -0.0003814697265625, 0.001495361328125, 0.0033721923828125, 0.0052490234375, 0.0071258544921875, 0.009002685546875, 0.0108795166015625, 0.01275634765625, 0.0146331787109375, 0.016510009765625, 0.0183868408203125, 0.020263671875, 0.0221405029296875, 0.024017333984375, 0.0258941650390625, 0.02777099609375, 0.0296478271484375, 0.031524658203125, 0.0334014892578125, 0.0352783203125, 0.0371551513671875, 0.039031982421875, 0.0409088134765625, 0.04278564453125, 0.0446624755859375, 0.046539306640625, 0.0484161376953125, 0.05029296875, 0.0521697998046875, 0.054046630859375, 0.0559234619140625, 0.05780029296875, 0.0596771240234375, 0.061553955078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 7.0, 6.0, 4.0, 13.0, 21.0, 18.0, 16.0, 40.0, 65.0, 87.0, 98.0, 186.0, 118.0, 91.0, 77.0, 44.0, 35.0, 20.0, 14.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04608154296875, -0.04462718963623047, -0.04317283630371094, -0.041718482971191406, -0.040264129638671875, -0.038809776306152344, -0.03735542297363281, -0.03590106964111328, -0.03444671630859375, -0.03299236297607422, -0.03153800964355469, -0.030083656311035156, -0.028629302978515625, -0.027174949645996094, -0.025720596313476562, -0.02426624298095703, -0.0228118896484375, -0.02135753631591797, -0.019903182983398438, -0.018448829650878906, -0.016994476318359375, -0.015540122985839844, -0.014085769653320312, -0.012631416320800781, -0.01117706298828125, -0.009722709655761719, -0.008268356323242188, -0.006814002990722656, -0.005359649658203125, -0.0039052963256835938, -0.0024509429931640625, -0.0009965896606445312, 0.000457763671875, 0.0019121170043945312, 0.0033664703369140625, 0.004820823669433594, 0.006275177001953125, 0.007729530334472656, 0.009183883666992188, 0.010638236999511719, 0.01209259033203125, 0.013546943664550781, 0.015001296997070312, 0.016455650329589844, 0.017910003662109375, 0.019364356994628906, 0.020818710327148438, 0.02227306365966797, 0.0237274169921875, 0.02518177032470703, 0.026636123657226562, 0.028090476989746094, 0.029544830322265625, 0.030999183654785156, 0.03245353698730469, 0.03390789031982422, 0.03536224365234375, 0.03681659698486328, 0.03827095031738281, 0.039725303649902344, 0.041179656982421875, 0.042634010314941406, 0.04408836364746094, 0.04554271697998047, 0.0469970703125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 30.0, 44.0, 76.0, 147.0, 185.0, 146.0, 118.0, 82.0, 49.0, 38.0, 25.0, 8.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316740989685059, -0.8072460889816284, -0.7828181385993958, -0.7583901286125183, -0.7339621782302856, -0.7095341682434082, -0.6851061582565308, -0.6606782078742981, -0.6362502574920654, -0.611822247505188, -0.5873942971229553, -0.5629662871360779, -0.5385383367538452, -0.5141103267669678, -0.4896823465824127, -0.46525436639785767, -0.4408263564109802, -0.41639837622642517, -0.3919703960418701, -0.3675423860549927, -0.34311443567276, -0.31868642568588257, -0.2942584455013275, -0.26983046531677246, -0.2454024851322174, -0.22097450494766235, -0.1965465247631073, -0.17211852967739105, -0.147690549492836, -0.12326256930828094, -0.0988345742225647, -0.07440659403800964, -0.049978673458099365, -0.025550689548254013, -0.0011227056384086609, 0.02330528199672699, 0.04773326218128204, 0.0721612423658371, 0.09658923745155334, 0.1210172176361084, 0.14544519782066345, 0.1698731780052185, 0.19430115818977356, 0.2187291532754898, 0.24315713346004486, 0.2675850987434387, 0.29201310873031616, 0.3164410889148712, 0.34086906909942627, 0.3652970492839813, 0.3897250294685364, 0.4141530394554138, 0.4385809898376465, 0.4630089998245239, 0.487436980009079, 0.511864960193634, 0.5362929105758667, 0.5607209205627441, 0.5851488709449768, 0.6095768809318542, 0.6340048313140869, 0.6584328413009644, 0.6828608512878418, 0.7072888016700745, 0.7317168116569519]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 10.0, 19.0, 15.0, 21.0, 13.0, 27.0, 35.0, 34.0, 33.0, 34.0, 48.0, 26.0, 37.0, 30.0, 38.0, 46.0, 35.0, 45.0, 33.0, 35.0, 52.0, 34.0, 37.0, 29.0, 35.0, 27.0, 23.0, 21.0, 16.0, 19.0, 13.0, 15.0, 8.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5037117600440979, -0.4893195927143097, -0.4749274253845215, -0.4605352282524109, -0.4461430609226227, -0.4317508935928345, -0.4173586964607239, -0.40296652913093567, -0.38857436180114746, -0.37418219447135925, -0.35979002714157104, -0.34539783000946045, -0.33100566267967224, -0.31661349534988403, -0.30222129821777344, -0.28782913088798523, -0.273436963558197, -0.2590447962284088, -0.2446526139974594, -0.23026043176651, -0.2158682644367218, -0.2014760971069336, -0.1870839148759842, -0.1726917326450348, -0.15829956531524658, -0.14390739798545837, -0.12951521575450897, -0.11512304097414017, -0.10073086619377136, -0.08633869141340256, -0.07194651663303375, -0.05755434185266495, -0.043162137269973755, -0.02876996248960495, -0.014377787709236145, 1.4387071132659912e-05, 0.014406561851501465, 0.02879873663187027, 0.043190911412239075, 0.05758308619260788, 0.07197526097297668, 0.08636743575334549, 0.1007596105337143, 0.1151517853140831, 0.1295439600944519, 0.1439361274242401, 0.15832830965518951, 0.17272049188613892, 0.18711265921592712, 0.20150482654571533, 0.21589700877666473, 0.23028919100761414, 0.24468135833740234, 0.25907352566719055, 0.27346569299697876, 0.28785789012908936, 0.30225005745887756, 0.31664222478866577, 0.33103442192077637, 0.3454265892505646, 0.3598187565803528, 0.374210923910141, 0.3886030912399292, 0.4029952883720398, 0.417387455701828]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 3.0, 5.0, 9.0, 4.0, 9.0, 5.0, 15.0, 7.0, 17.0, 20.0, 40.0, 39.0, 59.0, 77.0, 118.0, 200.0, 285.0, 493.0, 818.0, 1713.0, 3983.0, 1035941.0, 3355.0, 1388.0, 705.0, 449.0, 257.0, 155.0, 115.0, 72.0, 59.0, 31.0, 32.0, 22.0, 16.0, 15.0, 8.0, 11.0, 11.0, 8.0, 7.0, 5.0, 1.0, 4.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7920936942100525, -0.7683619856834412, -0.7446303367614746, -0.7208986282348633, -0.6971669793128967, -0.6734352707862854, -0.6497036218643188, -0.6259719133377075, -0.6022402048110962, -0.5785084962844849, -0.5547768473625183, -0.531045138835907, -0.5073134899139404, -0.4835817813873291, -0.45985010266304016, -0.4361184239387512, -0.41238677501678467, -0.3886550962924957, -0.3649234175682068, -0.34119170904159546, -0.3174600601196289, -0.2937283515930176, -0.26999667286872864, -0.2462649941444397, -0.22253331542015076, -0.19880163669586182, -0.17506995797157288, -0.15133826434612274, -0.1276065856218338, -0.10387490689754486, -0.08014321327209473, -0.056411534547805786, -0.032679855823516846, -0.008948173373937607, 0.014783509075641632, 0.03851519525051117, 0.06224687397480011, 0.08597855269908905, 0.10971024632453918, 0.13344192504882812, 0.15717360377311707, 0.180905282497406, 0.20463696122169495, 0.22836865484714508, 0.2521003484725952, 0.27583199739456177, 0.2995637059211731, 0.32329538464546204, 0.347027063369751, 0.3707587420940399, 0.39449042081832886, 0.4182221293449402, 0.44195377826690674, 0.46568548679351807, 0.489417165517807, 0.513148844242096, 0.5368804931640625, 0.5606122016906738, 0.5843438506126404, 0.6080755591392517, 0.6318072080612183, 0.6555389165878296, 0.6792706251144409, 0.7030022740364075, 0.7267339825630188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 19.0, 20.0, 31.0, 38.0, 56.0, 93.0, 117.0, 178.0, 259.0, 468.0, 1034.0, 3502.0, 51455756.0, 5920.0, 1232.0, 577.0, 328.0, 216.0, 135.0, 101.0, 62.0, 50.0, 32.0, 28.0, 23.0, 12.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.387202262878418, -10.047842025756836, -9.70848274230957, -9.369122505187988, -9.029762268066406, -8.69040298461914, -8.351042747497559, -8.011682510375977, -7.6723222732543945, -7.332962512969971, -6.993602752685547, -6.654242515563965, -6.314882278442383, -5.975522518157959, -5.636162757873535, -5.296802520751953, -4.957442283630371, -4.618082523345947, -4.278722763061523, -3.9393625259399414, -3.6000025272369385, -3.2606425285339355, -2.9212825298309326, -2.5819225311279297, -2.2425625324249268, -1.9032025337219238, -1.563842535018921, -1.224482536315918, -0.885122537612915, -0.5457625389099121, -0.20640254020690918, 0.13295841217041016, 0.4723184108734131, 0.811678409576416, 1.151038408279419, 1.4903984069824219, 1.8297584056854248, 2.1691184043884277, 2.5084784030914307, 2.8478384017944336, 3.1871984004974365, 3.5265583992004395, 3.8659183979034424, 4.205278396606445, 4.544638633728027, 4.883998394012451, 5.223358154296875, 5.562718391418457, 5.902078628540039, 6.241438388824463, 6.580798149108887, 6.920158386230469, 7.259518623352051, 7.598878383636475, 7.938238143920898, 8.27759838104248, 8.616958618164062, 8.956317901611328, 9.29567813873291, 9.635038375854492, 9.974398612976074, 10.313758850097656, 10.653118133544922, 10.992478370666504]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 16.0, 18.0, 28.0, 42.0, 72.0, 64.0, 115.0, 163.0, 307.0, 431.0, 645.0, 1056.0, 1752.0, 2719.0, 4801.0, 7860.0, 13485.0, 24120.0, 43756.0, 79521.0, 146907.0, 264780.0, 444811.0, 2621232.0, 1655880.0, 421060.0, 248093.0, 137278.0, 74274.0, 40961.0, 22810.0, 12994.0, 7433.0, 4491.0, 2764.0, 1676.0, 1115.0, 692.0, 387.0, 288.0, 184.0, 129.0, 73.0, 54.0, 27.0, 19.0, 18.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7482833862304688, -0.7255706787109375, -0.7028579711914062, -0.680145263671875, -0.6574325561523438, -0.6347198486328125, -0.6120071411132812, -0.58929443359375, -0.5665817260742188, -0.5438690185546875, -0.5211563110351562, -0.498443603515625, -0.47573089599609375, -0.4530181884765625, -0.43030548095703125, -0.4075927734375, -0.38488006591796875, -0.3621673583984375, -0.33945465087890625, -0.316741943359375, -0.29402923583984375, -0.2713165283203125, -0.24860382080078125, -0.22589111328125, -0.20317840576171875, -0.1804656982421875, -0.15775299072265625, -0.135040283203125, -0.11232757568359375, -0.0896148681640625, -0.06690216064453125, -0.044189453125, -0.02147674560546875, 0.0012359619140625, 0.02394866943359375, 0.046661376953125, 0.06937408447265625, 0.0920867919921875, 0.11479949951171875, 0.13751220703125, 0.16022491455078125, 0.1829376220703125, 0.20565032958984375, 0.228363037109375, 0.25107574462890625, 0.2737884521484375, 0.29650115966796875, 0.3192138671875, 0.34192657470703125, 0.3646392822265625, 0.38735198974609375, 0.410064697265625, 0.43277740478515625, 0.4554901123046875, 0.47820281982421875, 0.50091552734375, 0.5236282348632812, 0.5463409423828125, 0.5690536499023438, 0.591766357421875, 0.6144790649414062, 0.6371917724609375, 0.6599044799804688, 0.6826171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 8.0, 12.0, 11.0, 20.0, 14.0, 23.0, 20.0, 15.0, 27.0, 37.0, 49.0, 45.0, 45.0, 50.0, 65.0, 240.0, 805.0, 115.0, 55.0, 46.0, 52.0, 42.0, 36.0, 33.0, 24.0, 22.0, 20.0, 22.0, 14.0, 14.0, 11.0, 5.0, 10.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.4049072265625, -5.247314453125, -5.0897216796875, -4.93212890625, -4.7745361328125, -4.616943359375, -4.4593505859375, -4.3017578125, -4.1441650390625, -3.986572265625, -3.8289794921875, -3.67138671875, -3.5137939453125, -3.356201171875, -3.1986083984375, -3.041015625, -2.8834228515625, -2.725830078125, -2.5682373046875, -2.41064453125, -2.2530517578125, -2.095458984375, -1.9378662109375, -1.7802734375, -1.6226806640625, -1.465087890625, -1.3074951171875, -1.14990234375, -0.9923095703125, -0.834716796875, -0.6771240234375, -0.51953125, -0.3619384765625, -0.204345703125, -0.0467529296875, 0.11083984375, 0.2684326171875, 0.426025390625, 0.5836181640625, 0.7412109375, 0.8988037109375, 1.056396484375, 1.2139892578125, 1.37158203125, 1.5291748046875, 1.686767578125, 1.8443603515625, 2.001953125, 2.1595458984375, 2.317138671875, 2.4747314453125, 2.63232421875, 2.7899169921875, 2.947509765625, 3.1051025390625, 3.2626953125, 3.4202880859375, 3.577880859375, 3.7354736328125, 3.89306640625, 4.0506591796875, 4.208251953125, 4.3658447265625, 4.5234375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 21.0, 41.0, 86.0, 91.0, 174.0, 285.0, 427.0, 683.0, 1020.0, 1738.0, 2672.0, 4442.0, 7084.0, 11442.0, 18563.0, 29475.0, 47676.0, 74988.0, 116299.0, 173113.0, 245073.0, 323822.0, 595413.0, 3293874.0, 398791.0, 297153.0, 220176.0, 152391.0, 100788.0, 64954.0, 41074.0, 25781.0, 15952.0, 9668.0, 6165.0, 3815.0, 2423.0, 1390.0, 916.0, 560.0, 354.0, 225.0, 112.0, 86.0, 47.0, 32.0, 16.0, 12.0, 10.0, 12.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.405517578125, -0.392578125, -0.379638671875, -0.36669921875, -0.353759765625, -0.3408203125, -0.327880859375, -0.31494140625, -0.302001953125, -0.2890625, -0.276123046875, -0.26318359375, -0.250244140625, -0.2373046875, -0.224365234375, -0.21142578125, -0.198486328125, -0.185546875, -0.172607421875, -0.15966796875, -0.146728515625, -0.1337890625, -0.120849609375, -0.10791015625, -0.094970703125, -0.08203125, -0.069091796875, -0.05615234375, -0.043212890625, -0.0302734375, -0.017333984375, -0.00439453125, 0.008544921875, 0.021484375, 0.034423828125, 0.04736328125, 0.060302734375, 0.0732421875, 0.086181640625, 0.09912109375, 0.112060546875, 0.125, 0.137939453125, 0.15087890625, 0.163818359375, 0.1767578125, 0.189697265625, 0.20263671875, 0.215576171875, 0.228515625, 0.241455078125, 0.25439453125, 0.267333984375, 0.2802734375, 0.293212890625, 0.30615234375, 0.319091796875, 0.33203125, 0.344970703125, 0.35791015625, 0.370849609375, 0.3837890625, 0.396728515625, 0.40966796875, 0.422607421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 13.0, 5.0, 14.0, 18.0, 13.0, 17.0, 20.0, 17.0, 20.0, 30.0, 30.0, 29.0, 37.0, 34.0, 41.0, 28.0, 40.0, 75.0, 438.0, 592.0, 73.0, 41.0, 28.0, 26.0, 33.0, 42.0, 20.0, 29.0, 26.0, 14.0, 17.0, 16.0, 23.0, 14.0, 10.0, 12.0, 14.0, 8.0, 4.0, 9.0, 9.0, 7.0, 4.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.076171875, -2.977264404296875, -2.87835693359375, -2.779449462890625, -2.6805419921875, -2.581634521484375, -2.48272705078125, -2.383819580078125, -2.284912109375, -2.186004638671875, -2.08709716796875, -1.988189697265625, -1.8892822265625, -1.790374755859375, -1.69146728515625, -1.592559814453125, -1.49365234375, -1.394744873046875, -1.29583740234375, -1.196929931640625, -1.0980224609375, -0.999114990234375, -0.90020751953125, -0.801300048828125, -0.702392578125, -0.603485107421875, -0.50457763671875, -0.405670166015625, -0.3067626953125, -0.207855224609375, -0.10894775390625, -0.010040283203125, 0.0888671875, 0.187774658203125, 0.28668212890625, 0.385589599609375, 0.4844970703125, 0.583404541015625, 0.68231201171875, 0.781219482421875, 0.880126953125, 0.979034423828125, 1.07794189453125, 1.176849365234375, 1.2757568359375, 1.374664306640625, 1.47357177734375, 1.572479248046875, 1.67138671875, 1.770294189453125, 1.86920166015625, 1.968109130859375, 2.0670166015625, 2.165924072265625, 2.26483154296875, 2.363739013671875, 2.462646484375, 2.561553955078125, 2.66046142578125, 2.759368896484375, 2.8582763671875, 2.957183837890625, 3.05609130859375, 3.154998779296875, 3.25390625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 18.0, 20.0, 25.0, 26.0, 34.0, 47.0, 71.0, 94.0, 113.0, 148.0, 213.0, 319.0, 486.0, 684.0, 931.0, 1494.0, 2473.0, 4143.0, 7615.0, 15149.0, 31358.0, 64539.0, 132790.0, 5544323.0, 298825.0, 93221.0, 45443.0, 21798.0, 10582.0, 5507.0, 3203.0, 1763.0, 1149.0, 774.0, 564.0, 422.0, 287.0, 251.0, 162.0, 114.0, 77.0, 50.0, 42.0, 22.0, 16.0, 12.0, 14.0, 4.0, 6.0, 6.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5313720703125, -1.484619140625, -1.4378662109375, -1.39111328125, -1.3443603515625, -1.297607421875, -1.2508544921875, -1.2041015625, -1.1573486328125, -1.110595703125, -1.0638427734375, -1.01708984375, -0.9703369140625, -0.923583984375, -0.8768310546875, -0.830078125, -0.7833251953125, -0.736572265625, -0.6898193359375, -0.64306640625, -0.5963134765625, -0.549560546875, -0.5028076171875, -0.4560546875, -0.4093017578125, -0.362548828125, -0.3157958984375, -0.26904296875, -0.2222900390625, -0.175537109375, -0.1287841796875, -0.08203125, -0.0352783203125, 0.011474609375, 0.0582275390625, 0.10498046875, 0.1517333984375, 0.198486328125, 0.2452392578125, 0.2919921875, 0.3387451171875, 0.385498046875, 0.4322509765625, 0.47900390625, 0.5257568359375, 0.572509765625, 0.6192626953125, 0.666015625, 0.7127685546875, 0.759521484375, 0.8062744140625, 0.85302734375, 0.8997802734375, 0.946533203125, 0.9932861328125, 1.0400390625, 1.0867919921875, 1.133544921875, 1.1802978515625, 1.22705078125, 1.2738037109375, 1.320556640625, 1.3673095703125, 1.4140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 16.0, 6.0, 8.0, 11.0, 26.0, 13.0, 36.0, 28.0, 25.0, 25.0, 30.0, 29.0, 49.0, 45.0, 49.0, 44.0, 340.0, 750.0, 69.0, 38.0, 40.0, 33.0, 47.0, 36.0, 31.0, 27.0, 24.0, 27.0, 18.0, 13.0, 15.0, 18.0, 9.0, 6.0, 6.0, 6.0, 4.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.06884765625, -3.9462890625, -3.82373046875, -3.701171875, -3.57861328125, -3.4560546875, -3.33349609375, -3.2109375, -3.08837890625, -2.9658203125, -2.84326171875, -2.720703125, -2.59814453125, -2.4755859375, -2.35302734375, -2.23046875, -2.10791015625, -1.9853515625, -1.86279296875, -1.740234375, -1.61767578125, -1.4951171875, -1.37255859375, -1.25, -1.12744140625, -1.0048828125, -0.88232421875, -0.759765625, -0.63720703125, -0.5146484375, -0.39208984375, -0.26953125, -0.14697265625, -0.0244140625, 0.09814453125, 0.220703125, 0.34326171875, 0.4658203125, 0.58837890625, 0.7109375, 0.83349609375, 0.9560546875, 1.07861328125, 1.201171875, 1.32373046875, 1.4462890625, 1.56884765625, 1.69140625, 1.81396484375, 1.9365234375, 2.05908203125, 2.181640625, 2.30419921875, 2.4267578125, 2.54931640625, 2.671875, 2.79443359375, 2.9169921875, 3.03955078125, 3.162109375, 3.28466796875, 3.4072265625, 3.52978515625, 3.65234375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 25.0, 35.0, 75.0, 162.0, 245.0, 216.0, 105.0, 47.0, 22.0, 21.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.026805877685547, -18.461204528808594, -17.89560317993164, -17.330001831054688, -16.764400482177734, -16.198801040649414, -15.633199691772461, -15.067598342895508, -14.501996994018555, -13.936395645141602, -13.370794296264648, -12.805193901062012, -12.239592552185059, -11.673991203308105, -11.108390808105469, -10.542789459228516, -9.977188110351562, -9.41158676147461, -8.845985412597656, -8.28038501739502, -7.714783668518066, -7.149182319641113, -6.583581447601318, -6.017980575561523, -5.45237922668457, -4.886777877807617, -4.321177005767822, -3.7555758953094482, -3.189974784851074, -2.6243736743927, -2.058772563934326, -1.4931714534759521, -0.9275722503662109, -0.3619711399078369, 0.2036299705505371, 0.7692310810089111, 1.3348321914672852, 1.9004333019256592, 2.466034412384033, 3.0316355228424072, 3.5972366333007812, 4.162837982177734, 4.728438854217529, 5.294039726257324, 5.859641075134277, 6.4252424240112305, 6.990843296051025, 7.55644416809082, 8.122045516967773, 8.687646865844727, 9.25324821472168, 9.818848609924316, 10.38444995880127, 10.950051307678223, 11.51565170288086, 12.081253051757812, 12.646854400634766, 13.212455749511719, 13.778057098388672, 14.343657493591309, 14.909258842468262, 15.474860191345215, 16.04046058654785, 16.606061935424805, 17.171663284301758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 10.0, 13.0, 9.0, 16.0, 17.0, 18.0, 33.0, 28.0, 29.0, 53.0, 51.0, 44.0, 55.0, 62.0, 67.0, 53.0, 53.0, 45.0, 44.0, 39.0, 42.0, 21.0, 37.0, 26.0, 18.0, 9.0, 14.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-12.745399475097656, -12.375323295593262, -12.005248069763184, -11.635171890258789, -11.265096664428711, -10.895020484924316, -10.524944305419922, -10.154869079589844, -9.784793853759766, -9.414717674255371, -9.044642448425293, -8.674566268920898, -8.30449104309082, -7.934414863586426, -7.5643391609191895, -7.194263458251953, -6.824187278747559, -6.454111576080322, -6.084035873413086, -5.713959693908691, -5.343884468078613, -4.973808288574219, -4.603732585906982, -4.233656883239746, -3.8635811805725098, -3.4935054779052734, -3.123429775238037, -2.7533538341522217, -2.3832781314849854, -2.013202428817749, -1.6431264877319336, -1.2730507850646973, -0.9029760360717773, -0.5329002737998962, -0.16282451152801514, 0.20725131034851074, 0.5773270130157471, 0.9474027156829834, 1.3174786567687988, 1.6875543594360352, 2.0576300621032715, 2.427705764770508, 2.797781467437744, 3.1678574085235596, 3.537933111190796, 3.9080088138580322, 4.278084754943848, 4.648160457611084, 5.01823616027832, 5.388311862945557, 5.758387565612793, 6.1284637451171875, 6.498538970947266, 6.86861515045166, 7.2386908531188965, 7.608766555786133, 7.978842258453369, 8.348917961120605, 8.718994140625, 9.089069366455078, 9.459145545959473, 9.82922077178955, 10.199296951293945, 10.569372177124023, 10.939448356628418]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 10.0, 8.0, 14.0, 37.0, 35.0, 52.0, 80.0, 90.0, 108.0, 193.0, 299.0, 434.0, 817.0, 1475.0, 2877.0, 6527.0, 16773.0, 73269.0, 3966963.0, 90873.0, 18738.0, 6967.0, 3383.0, 1743.0, 950.0, 543.0, 333.0, 199.0, 137.0, 94.0, 60.0, 43.0, 34.0, 23.0, 18.0, 12.0, 11.0, 9.0, 3.0, 9.0, 6.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15917396545410156, -0.15428543090820312, -0.1493968963623047, -0.14450836181640625, -0.1396198272705078, -0.13473129272460938, -0.12984275817871094, -0.1249542236328125, -0.12006568908691406, -0.11517715454101562, -0.11028861999511719, -0.10540008544921875, -0.10051155090332031, -0.09562301635742188, -0.09073448181152344, -0.085845947265625, -0.08095741271972656, -0.07606887817382812, -0.07118034362792969, -0.06629180908203125, -0.06140327453613281, -0.056514739990234375, -0.05162620544433594, -0.0467376708984375, -0.04184913635253906, -0.036960601806640625, -0.03207206726074219, -0.02718353271484375, -0.022294998168945312, -0.017406463623046875, -0.012517929077148438, -0.00762939453125, -0.0027408599853515625, 0.002147674560546875, 0.0070362091064453125, 0.01192474365234375, 0.016813278198242188, 0.021701812744140625, 0.026590347290039062, 0.0314788818359375, 0.03636741638183594, 0.041255950927734375, 0.04614448547363281, 0.05103302001953125, 0.05592155456542969, 0.060810089111328125, 0.06569862365722656, 0.070587158203125, 0.07547569274902344, 0.08036422729492188, 0.08525276184082031, 0.09014129638671875, 0.09502983093261719, 0.09991836547851562, 0.10480690002441406, 0.1096954345703125, 0.11458396911621094, 0.11947250366210938, 0.12436103820800781, 0.12924957275390625, 0.1341381072998047, 0.13902664184570312, 0.14391517639160156, 0.1488037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 31.0, 51.0, 182.0, 465.0, 56.0, 28.0, 14.0, 13.0, 10.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.046575069427490234, -0.04520702362060547, -0.0438389778137207, -0.04247093200683594, -0.04110288619995117, -0.039734840393066406, -0.03836679458618164, -0.036998748779296875, -0.03563070297241211, -0.034262657165527344, -0.03289461135864258, -0.03152656555175781, -0.030158519744873047, -0.02879047393798828, -0.027422428131103516, -0.02605438232421875, -0.024686336517333984, -0.02331829071044922, -0.021950244903564453, -0.020582199096679688, -0.019214153289794922, -0.017846107482910156, -0.01647806167602539, -0.015110015869140625, -0.01374197006225586, -0.012373924255371094, -0.011005878448486328, -0.009637832641601562, -0.008269786834716797, -0.006901741027832031, -0.005533695220947266, -0.0041656494140625, -0.0027976036071777344, -0.0014295578002929688, -6.151199340820312e-05, 0.0013065338134765625, 0.002674579620361328, 0.004042625427246094, 0.005410671234130859, 0.006778717041015625, 0.00814676284790039, 0.009514808654785156, 0.010882854461669922, 0.012250900268554688, 0.013618946075439453, 0.014986991882324219, 0.016355037689208984, 0.01772308349609375, 0.019091129302978516, 0.02045917510986328, 0.021827220916748047, 0.023195266723632812, 0.024563312530517578, 0.025931358337402344, 0.02729940414428711, 0.028667449951171875, 0.03003549575805664, 0.031403541564941406, 0.03277158737182617, 0.03413963317871094, 0.0355076789855957, 0.03687572479248047, 0.038243770599365234, 0.03961181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 3.0, 12.0, 14.0, 20.0, 34.0, 40.0, 54.0, 96.0, 156.0, 345.0, 787.0, 1811.0, 4880.0, 14697.0, 54042.0, 287101.0, 3206417.0, 514418.0, 78126.0, 20336.0, 6503.0, 2361.0, 973.0, 435.0, 228.0, 136.0, 65.0, 51.0, 31.0, 29.0, 16.0, 12.0, 8.0, 10.0, 6.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09147453308105469, -0.08803939819335938, -0.08460426330566406, -0.08116912841796875, -0.07773399353027344, -0.07429885864257812, -0.07086372375488281, -0.0674285888671875, -0.06399345397949219, -0.060558319091796875, -0.05712318420410156, -0.05368804931640625, -0.05025291442871094, -0.046817779541015625, -0.04338264465332031, -0.039947509765625, -0.03651237487792969, -0.033077239990234375, -0.029642105102539062, -0.02620697021484375, -0.022771835327148438, -0.019336700439453125, -0.015901565551757812, -0.0124664306640625, -0.009031295776367188, -0.005596160888671875, -0.0021610260009765625, 0.00127410888671875, 0.0047092437744140625, 0.008144378662109375, 0.011579513549804688, 0.0150146484375, 0.018449783325195312, 0.021884918212890625, 0.025320053100585938, 0.02875518798828125, 0.03219032287597656, 0.035625457763671875, 0.03906059265136719, 0.0424957275390625, 0.04593086242675781, 0.049365997314453125, 0.05280113220214844, 0.05623626708984375, 0.05967140197753906, 0.06310653686523438, 0.06654167175292969, 0.069976806640625, 0.07341194152832031, 0.07684707641601562, 0.08028221130371094, 0.08371734619140625, 0.08715248107910156, 0.09058761596679688, 0.09402275085449219, 0.0974578857421875, 0.10089302062988281, 0.10432815551757812, 0.10776329040527344, 0.11119842529296875, 0.11463356018066406, 0.11806869506835938, 0.12150382995605469, 0.12493896484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 13.0, 13.0, 11.0, 17.0, 16.0, 23.0, 34.0, 43.0, 50.0, 65.0, 81.0, 110.0, 183.0, 265.0, 599.0, 1066.0, 551.0, 281.0, 174.0, 111.0, 80.0, 55.0, 48.0, 36.0, 20.0, 25.0, 24.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030140399932861328, -0.029000282287597656, -0.027860164642333984, -0.026720046997070312, -0.02557992935180664, -0.02443981170654297, -0.023299694061279297, -0.022159576416015625, -0.021019458770751953, -0.01987934112548828, -0.01873922348022461, -0.017599105834960938, -0.016458988189697266, -0.015318870544433594, -0.014178752899169922, -0.01303863525390625, -0.011898517608642578, -0.010758399963378906, -0.009618282318115234, -0.008478164672851562, -0.007338047027587891, -0.006197929382324219, -0.005057811737060547, -0.003917694091796875, -0.002777576446533203, -0.0016374588012695312, -0.0004973411560058594, 0.0006427764892578125, 0.0017828941345214844, 0.0029230117797851562, 0.004063129425048828, 0.0052032470703125, 0.006343364715576172, 0.007483482360839844, 0.008623600006103516, 0.009763717651367188, 0.01090383529663086, 0.012043952941894531, 0.013184070587158203, 0.014324188232421875, 0.015464305877685547, 0.01660442352294922, 0.01774454116821289, 0.018884658813476562, 0.020024776458740234, 0.021164894104003906, 0.022305011749267578, 0.02344512939453125, 0.024585247039794922, 0.025725364685058594, 0.026865482330322266, 0.028005599975585938, 0.02914571762084961, 0.03028583526611328, 0.03142595291137695, 0.032566070556640625, 0.0337061882019043, 0.03484630584716797, 0.03598642349243164, 0.03712654113769531, 0.038266658782958984, 0.039406776428222656, 0.04054689407348633, 0.04168701171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 12.0, 28.0, 64.0, 149.0, 243.0, 254.0, 140.0, 60.0, 23.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22374887764453888, -0.21200014650821686, -0.20025141537189484, -0.18850268423557281, -0.1767539530992508, -0.16500522196292877, -0.15325647592544556, -0.14150774478912354, -0.1297590136528015, -0.11801028251647949, -0.10626155138015747, -0.09451282024383545, -0.08276408910751343, -0.0710153579711914, -0.05926661938428879, -0.047517888247966766, -0.03576916456222534, -0.02402043342590332, -0.01227170042693615, -0.0005229674279689789, 0.011225763708353043, 0.022974494844675064, 0.034723229706287384, 0.046471960842609406, 0.05822069197893143, 0.06996942311525345, 0.08171815425157547, 0.09346689283847809, 0.10521562397480011, 0.11696435511112213, 0.12871308624744415, 0.14046181738376617, 0.1522105634212494, 0.1639592945575714, 0.17570802569389343, 0.18745675683021545, 0.19920548796653748, 0.2109542191028595, 0.22270295023918152, 0.23445168137550354, 0.24620041251182556, 0.2579491436481476, 0.2696978747844696, 0.2814466059207916, 0.29319533705711365, 0.30494406819343567, 0.3166927993297577, 0.3284415304660797, 0.3401902914047241, 0.35193902254104614, 0.36368775367736816, 0.3754364848136902, 0.3871852159500122, 0.39893394708633423, 0.41068267822265625, 0.42243140935897827, 0.4341801404953003, 0.4459288716316223, 0.45767760276794434, 0.46942633390426636, 0.4811750650405884, 0.4929237961769104, 0.5046725273132324, 0.5164212584495544, 0.5281699895858765]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 9.0, 12.0, 14.0, 15.0, 20.0, 25.0, 35.0, 44.0, 39.0, 51.0, 51.0, 74.0, 64.0, 71.0, 71.0, 71.0, 56.0, 62.0, 32.0, 32.0, 22.0, 29.0, 19.0, 24.0, 9.0, 8.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17424196004867554, -0.16807514429092407, -0.1619083285331726, -0.15574151277542114, -0.14957469701766968, -0.14340786635875702, -0.13724105060100555, -0.1310742348432541, -0.12490741908550262, -0.11874060332775116, -0.1125737875699997, -0.10640696436166763, -0.10024014860391617, -0.0940733328461647, -0.08790650963783264, -0.08173969388008118, -0.07557287812232971, -0.06940606236457825, -0.06323924660682678, -0.05707242339849472, -0.050905607640743256, -0.04473879188299179, -0.03857197239995003, -0.032405152916908264, -0.0262383371591568, -0.020071519538760185, -0.013904701918363571, -0.007737884297966957, -0.001571066677570343, 0.004595750942826271, 0.010762568563222885, 0.01692938804626465, 0.023096203804016113, 0.029263021424412727, 0.03542983904480934, 0.041596658527851105, 0.04776347428560257, 0.053930290043354034, 0.0600971095263958, 0.06626392900943756, 0.07243074476718903, 0.07859756052494049, 0.08476437628269196, 0.09093119949102402, 0.09709801524877548, 0.10326483100652695, 0.10943165421485901, 0.11559846997261047, 0.12176528573036194, 0.1279321014881134, 0.13409891724586487, 0.14026573300361633, 0.1464325487613678, 0.15259937942028046, 0.15876619517803192, 0.1649330109357834, 0.17109982669353485, 0.17726664245128632, 0.18343345820903778, 0.18960027396678925, 0.1957671046257019, 0.20193392038345337, 0.20810073614120483, 0.2142675518989563, 0.22043436765670776]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 1.0, 6.0, 6.0, 13.0, 19.0, 34.0, 39.0, 54.0, 84.0, 128.0, 168.0, 206.0, 307.0, 426.0, 551.0, 837.0, 1209.0, 1629.0, 2324.0, 3583.0, 5382.0, 8550.0, 14316.0, 26646.0, 71387.0, 762478.0, 79506.0, 28038.0, 14664.0, 8820.0, 5510.0, 3593.0, 2429.0, 1660.0, 1107.0, 795.0, 551.0, 393.0, 308.0, 244.0, 167.0, 118.0, 90.0, 66.0, 28.0, 30.0, 24.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.10035037994384766, -0.09706306457519531, -0.09377574920654297, -0.09048843383789062, -0.08720111846923828, -0.08391380310058594, -0.0806264877319336, -0.07733917236328125, -0.0740518569946289, -0.07076454162597656, -0.06747722625732422, -0.06418991088867188, -0.06090259552001953, -0.05761528015136719, -0.054327964782714844, -0.0510406494140625, -0.047753334045410156, -0.04446601867675781, -0.04117870330810547, -0.037891387939453125, -0.03460407257080078, -0.03131675720214844, -0.028029441833496094, -0.02474212646484375, -0.021454811096191406, -0.018167495727539062, -0.014880180358886719, -0.011592864990234375, -0.008305549621582031, -0.0050182342529296875, -0.0017309188842773438, 0.001556396484375, 0.004843711853027344, 0.008131027221679688, 0.011418342590332031, 0.014705657958984375, 0.01799297332763672, 0.021280288696289062, 0.024567604064941406, 0.02785491943359375, 0.031142234802246094, 0.03442955017089844, 0.03771686553955078, 0.041004180908203125, 0.04429149627685547, 0.04757881164550781, 0.050866127014160156, 0.0541534423828125, 0.057440757751464844, 0.06072807312011719, 0.06401538848876953, 0.06730270385742188, 0.07059001922607422, 0.07387733459472656, 0.0771646499633789, 0.08045196533203125, 0.0837392807006836, 0.08702659606933594, 0.09031391143798828, 0.09360122680664062, 0.09688854217529297, 0.10017585754394531, 0.10346317291259766, 0.10675048828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 5.0, 9.0, 9.0, 6.0, 6.0, 6.0, 7.0, 17.0, 24.0, 27.0, 80.0, 361.0, 249.0, 52.0, 32.0, 15.0, 14.0, 11.0, 7.0, 8.0, 9.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.044189453125, -0.04288339614868164, -0.04157733917236328, -0.04027128219604492, -0.03896522521972656, -0.0376591682434082, -0.036353111267089844, -0.035047054290771484, -0.033740997314453125, -0.032434940338134766, -0.031128883361816406, -0.029822826385498047, -0.028516769409179688, -0.027210712432861328, -0.02590465545654297, -0.02459859848022461, -0.02329254150390625, -0.02198648452758789, -0.02068042755126953, -0.019374370574951172, -0.018068313598632812, -0.016762256622314453, -0.015456199645996094, -0.014150142669677734, -0.012844085693359375, -0.011538028717041016, -0.010231971740722656, -0.008925914764404297, -0.0076198577880859375, -0.006313800811767578, -0.005007743835449219, -0.0037016868591308594, -0.0023956298828125, -0.0010895729064941406, 0.00021648406982421875, 0.0015225410461425781, 0.0028285980224609375, 0.004134654998779297, 0.005440711975097656, 0.006746768951416016, 0.008052825927734375, 0.009358882904052734, 0.010664939880371094, 0.011970996856689453, 0.013277053833007812, 0.014583110809326172, 0.01588916778564453, 0.01719522476196289, 0.01850128173828125, 0.01980733871459961, 0.02111339569091797, 0.022419452667236328, 0.023725509643554688, 0.025031566619873047, 0.026337623596191406, 0.027643680572509766, 0.028949737548828125, 0.030255794525146484, 0.031561851501464844, 0.0328679084777832, 0.03417396545410156, 0.03548002243041992, 0.03678607940673828, 0.03809213638305664, 0.039398193359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 12.0, 10.0, 13.0, 12.0, 19.0, 13.0, 30.0, 49.0, 70.0, 80.0, 127.0, 196.0, 349.0, 654.0, 1382.0, 3186.0, 8582.0, 26079.0, 99762.0, 436684.0, 356226.0, 79939.0, 22210.0, 7318.0, 2765.0, 1207.0, 621.0, 330.0, 175.0, 130.0, 83.0, 49.0, 41.0, 38.0, 18.0, 16.0, 24.0, 17.0, 7.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10247802734375, -0.09916400909423828, -0.09584999084472656, -0.09253597259521484, -0.08922195434570312, -0.0859079360961914, -0.08259391784667969, -0.07927989959716797, -0.07596588134765625, -0.07265186309814453, -0.06933784484863281, -0.0660238265991211, -0.06270980834960938, -0.059395790100097656, -0.05608177185058594, -0.05276775360107422, -0.0494537353515625, -0.04613971710205078, -0.04282569885253906, -0.039511680603027344, -0.036197662353515625, -0.032883644104003906, -0.029569625854492188, -0.02625560760498047, -0.02294158935546875, -0.01962757110595703, -0.016313552856445312, -0.012999534606933594, -0.009685516357421875, -0.006371498107910156, -0.0030574798583984375, 0.00025653839111328125, 0.003570556640625, 0.006884574890136719, 0.010198593139648438, 0.013512611389160156, 0.016826629638671875, 0.020140647888183594, 0.023454666137695312, 0.02676868438720703, 0.03008270263671875, 0.03339672088623047, 0.03671073913574219, 0.040024757385253906, 0.043338775634765625, 0.046652793884277344, 0.04996681213378906, 0.05328083038330078, 0.0565948486328125, 0.05990886688232422, 0.06322288513183594, 0.06653690338134766, 0.06985092163085938, 0.0731649398803711, 0.07647895812988281, 0.07979297637939453, 0.08310699462890625, 0.08642101287841797, 0.08973503112792969, 0.0930490493774414, 0.09636306762695312, 0.09967708587646484, 0.10299110412597656, 0.10630512237548828, 0.109619140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 10.0, 12.0, 9.0, 6.0, 9.0, 16.0, 16.0, 18.0, 24.0, 23.0, 26.0, 38.0, 36.0, 33.0, 39.0, 33.0, 31.0, 28.0, 56.0, 42.0, 38.0, 42.0, 35.0, 42.0, 32.0, 36.0, 40.0, 31.0, 25.0, 24.0, 32.0, 19.0, 13.0, 7.0, 9.0, 16.0, 17.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.123260498046875, -0.11920166015625, -0.115142822265625, -0.111083984375, -0.107025146484375, -0.10296630859375, -0.098907470703125, -0.0948486328125, -0.090789794921875, -0.08673095703125, -0.082672119140625, -0.07861328125, -0.074554443359375, -0.07049560546875, -0.066436767578125, -0.0623779296875, -0.058319091796875, -0.05426025390625, -0.050201416015625, -0.046142578125, -0.042083740234375, -0.03802490234375, -0.033966064453125, -0.0299072265625, -0.025848388671875, -0.02178955078125, -0.017730712890625, -0.013671875, -0.009613037109375, -0.00555419921875, -0.001495361328125, 0.0025634765625, 0.006622314453125, 0.01068115234375, 0.014739990234375, 0.018798828125, 0.022857666015625, 0.02691650390625, 0.030975341796875, 0.0350341796875, 0.039093017578125, 0.04315185546875, 0.047210693359375, 0.05126953125, 0.055328369140625, 0.05938720703125, 0.063446044921875, 0.0675048828125, 0.071563720703125, 0.07562255859375, 0.079681396484375, 0.083740234375, 0.087799072265625, 0.09185791015625, 0.095916748046875, 0.0999755859375, 0.104034423828125, 0.10809326171875, 0.112152099609375, 0.1162109375, 0.120269775390625, 0.12432861328125, 0.128387451171875, 0.1324462890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 15.0, 15.0, 31.0, 65.0, 98.0, 127.0, 259.0, 562.0, 1232.0, 3442.0, 12675.0, 82478.0, 732303.0, 185716.0, 21056.0, 5267.0, 1663.0, 717.0, 350.0, 187.0, 97.0, 62.0, 41.0, 22.0, 19.0, 7.0, 12.0, 5.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09105682373046875, -0.0881805419921875, -0.08530426025390625, -0.082427978515625, -0.07955169677734375, -0.0766754150390625, -0.07379913330078125, -0.0709228515625, -0.06804656982421875, -0.0651702880859375, -0.06229400634765625, -0.059417724609375, -0.05654144287109375, -0.0536651611328125, -0.05078887939453125, -0.04791259765625, -0.04503631591796875, -0.0421600341796875, -0.03928375244140625, -0.036407470703125, -0.03353118896484375, -0.0306549072265625, -0.02777862548828125, -0.02490234375, -0.02202606201171875, -0.0191497802734375, -0.01627349853515625, -0.013397216796875, -0.01052093505859375, -0.0076446533203125, -0.00476837158203125, -0.00189208984375, 0.00098419189453125, 0.0038604736328125, 0.00673675537109375, 0.009613037109375, 0.01248931884765625, 0.0153656005859375, 0.01824188232421875, 0.0211181640625, 0.02399444580078125, 0.0268707275390625, 0.02974700927734375, 0.032623291015625, 0.03549957275390625, 0.0383758544921875, 0.04125213623046875, 0.04412841796875, 0.04700469970703125, 0.0498809814453125, 0.05275726318359375, 0.055633544921875, 0.05850982666015625, 0.0613861083984375, 0.06426239013671875, 0.067138671875, 0.07001495361328125, 0.0728912353515625, 0.07576751708984375, 0.078643798828125, 0.08152008056640625, 0.0843963623046875, 0.08727264404296875, 0.09014892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 5.0, 5.0, 5.0, 7.0, 10.0, 12.0, 16.0, 20.0, 34.0, 30.0, 28.0, 42.0, 59.0, 57.0, 83.0, 74.0, 58.0, 57.0, 49.0, 66.0, 38.0, 36.0, 41.0, 23.0, 38.0, 30.0, 15.0, 12.0, 9.0, 21.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2278556823730469e-05, -1.176539808511734e-05, -1.1252239346504211e-05, -1.0739080607891083e-05, -1.0225921869277954e-05, -9.712763130664825e-06, -9.199604392051697e-06, -8.686445653438568e-06, -8.17328691482544e-06, -7.66012817621231e-06, -7.146969437599182e-06, -6.6338106989860535e-06, -6.120651960372925e-06, -5.607493221759796e-06, -5.0943344831466675e-06, -4.581175744533539e-06, -4.06801700592041e-06, -3.5548582673072815e-06, -3.041699528694153e-06, -2.528540790081024e-06, -2.0153820514678955e-06, -1.5022233128547668e-06, -9.890645742416382e-07, -4.759058356285095e-07, 3.725290298461914e-08, 5.504116415977478e-07, 1.0635703802108765e-06, 1.5767291188240051e-06, 2.089887857437134e-06, 2.6030465960502625e-06, 3.116205334663391e-06, 3.6293640732765198e-06, 4.1425228118896484e-06, 4.655681550502777e-06, 5.168840289115906e-06, 5.6819990277290344e-06, 6.195157766342163e-06, 6.708316504955292e-06, 7.22147524356842e-06, 7.734633982181549e-06, 8.247792720794678e-06, 8.760951459407806e-06, 9.274110198020935e-06, 9.787268936634064e-06, 1.0300427675247192e-05, 1.0813586413860321e-05, 1.132674515247345e-05, 1.1839903891086578e-05, 1.2353062629699707e-05, 1.2866221368312836e-05, 1.3379380106925964e-05, 1.3892538845539093e-05, 1.4405697584152222e-05, 1.491885632276535e-05, 1.543201506137848e-05, 1.5945173799991608e-05, 1.6458332538604736e-05, 1.6971491277217865e-05, 1.7484650015830994e-05, 1.7997808754444122e-05, 1.851096749305725e-05, 1.902412623167038e-05, 1.9537284970283508e-05, 2.0050443708896637e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 9.0, 25.0, 30.0, 54.0, 107.0, 199.0, 473.0, 1163.0, 3959.0, 18313.0, 170356.0, 750991.0, 86571.0, 11769.0, 2834.0, 902.0, 377.0, 177.0, 90.0, 51.0, 23.0, 24.0, 10.0, 17.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0916748046875, -0.08832550048828125, -0.0849761962890625, -0.08162689208984375, -0.078277587890625, -0.07492828369140625, -0.0715789794921875, -0.06822967529296875, -0.06488037109375, -0.06153106689453125, -0.0581817626953125, -0.05483245849609375, -0.051483154296875, -0.04813385009765625, -0.0447845458984375, -0.04143524169921875, -0.0380859375, -0.03473663330078125, -0.0313873291015625, -0.02803802490234375, -0.024688720703125, -0.02133941650390625, -0.0179901123046875, -0.01464080810546875, -0.01129150390625, -0.00794219970703125, -0.0045928955078125, -0.00124359130859375, 0.002105712890625, 0.00545501708984375, 0.0088043212890625, 0.01215362548828125, 0.0155029296875, 0.01885223388671875, 0.0222015380859375, 0.02555084228515625, 0.028900146484375, 0.03224945068359375, 0.0355987548828125, 0.03894805908203125, 0.04229736328125, 0.04564666748046875, 0.0489959716796875, 0.05234527587890625, 0.055694580078125, 0.05904388427734375, 0.0623931884765625, 0.06574249267578125, 0.069091796875, 0.07244110107421875, 0.0757904052734375, 0.07913970947265625, 0.082489013671875, 0.08583831787109375, 0.0891876220703125, 0.09253692626953125, 0.09588623046875, 0.09923553466796875, 0.1025848388671875, 0.10593414306640625, 0.109283447265625, 0.11263275146484375, 0.1159820556640625, 0.11933135986328125, 0.1226806640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 8.0, 12.0, 19.0, 23.0, 35.0, 42.0, 75.0, 85.0, 130.0, 101.0, 127.0, 97.0, 75.0, 51.0, 34.0, 30.0, 20.0, 12.0, 7.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.0688161849975586, -0.06591606140136719, -0.06301593780517578, -0.060115814208984375, -0.05721569061279297, -0.05431556701660156, -0.051415443420410156, -0.04851531982421875, -0.045615196228027344, -0.04271507263183594, -0.03981494903564453, -0.036914825439453125, -0.03401470184326172, -0.031114578247070312, -0.028214454650878906, -0.0253143310546875, -0.022414207458496094, -0.019514083862304688, -0.01661396026611328, -0.013713836669921875, -0.010813713073730469, -0.007913589477539062, -0.005013465881347656, -0.00211334228515625, 0.0007867813110351562, 0.0036869049072265625, 0.006587028503417969, 0.009487152099609375, 0.012387275695800781, 0.015287399291992188, 0.018187522888183594, 0.021087646484375, 0.023987770080566406, 0.026887893676757812, 0.02978801727294922, 0.032688140869140625, 0.03558826446533203, 0.03848838806152344, 0.041388511657714844, 0.04428863525390625, 0.047188758850097656, 0.05008888244628906, 0.05298900604248047, 0.055889129638671875, 0.05878925323486328, 0.06168937683105469, 0.0645895004272461, 0.0674896240234375, 0.0703897476196289, 0.07328987121582031, 0.07618999481201172, 0.07909011840820312, 0.08199024200439453, 0.08489036560058594, 0.08779048919677734, 0.09069061279296875, 0.09359073638916016, 0.09649085998535156, 0.09939098358154297, 0.10229110717773438, 0.10519123077392578, 0.10809135437011719, 0.1109914779663086, 0.1138916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 25.0, 47.0, 133.0, 276.0, 282.0, 119.0, 50.0, 29.0, 12.0, 6.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1231088638305664, -1.076072335243225, -1.0290359258651733, -0.981999397277832, -0.9349629878997803, -0.887926459312439, -0.8408899903297424, -0.7938535213470459, -0.7468170523643494, -0.6997805833816528, -0.6527441143989563, -0.6057076454162598, -0.5586711168289185, -0.5116347074508667, -0.4645981788635254, -0.41756170988082886, -0.3705252408981323, -0.3234887719154358, -0.27645230293273926, -0.22941580414772034, -0.1823793351650238, -0.13534286618232727, -0.08830636739730835, -0.041269898414611816, 0.005766570568084717, 0.05280304700136185, 0.09983952343463898, 0.1468760073184967, 0.19391247630119324, 0.24094894528388977, 0.2879854440689087, 0.3350219130516052, 0.3820585012435913, 0.42909497022628784, 0.4761314392089844, 0.5231679677963257, 0.5702043771743774, 0.6172409057617188, 0.6642773747444153, 0.7113138437271118, 0.7583503127098083, 0.8053867816925049, 0.8524232506752014, 0.899459719657898, 0.9464962482452393, 0.993532657623291, 1.0405691862106323, 1.0876057147979736, 1.1346421241760254, 1.1816786527633667, 1.2287150621414185, 1.2757515907287598, 1.3227880001068115, 1.3698245286941528, 1.4168610572814941, 1.463897466659546, 1.5109338760375977, 1.557970404624939, 1.6050068140029907, 1.652043342590332, 1.6990797519683838, 1.746116280555725, 1.7931528091430664, 1.8401892185211182, 1.8872257471084595]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 8.0, 15.0, 19.0, 40.0, 53.0, 90.0, 138.0, 170.0, 134.0, 92.0, 71.0, 39.0, 30.0, 10.0, 13.0, 8.0, 5.0, 10.0, 6.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0380027294158936, -2.9527106285095215, -2.8674187660217285, -2.7821266651153564, -2.6968345642089844, -2.6115427017211914, -2.5262506008148193, -2.4409584999084473, -2.3556666374206543, -2.2703745365142822, -2.1850826740264893, -2.099790573120117, -2.014498472213745, -1.9292064905166626, -1.84391450881958, -1.758622407913208, -1.673330307006836, -1.5880383253097534, -1.5027462244033813, -1.4174542427062988, -1.3321621417999268, -1.2468701601028442, -1.1615781784057617, -1.0762860774993896, -0.9909940958023071, -0.9057020545005798, -0.8204100131988525, -0.73511803150177, -0.6498259902000427, -0.5645339488983154, -0.4792419672012329, -0.3939499258995056, -0.3086576461791992, -0.22336561977863312, -0.13807359337806702, -0.05278158187866211, 0.032510459423065186, 0.11780250072479248, 0.203094482421875, 0.2883865237236023, 0.3736785650253296, 0.4589706063270569, 0.5442626476287842, 0.6295546293258667, 0.714846670627594, 0.8001387119293213, 0.8854306936264038, 0.9707227349281311, 1.0560147762298584, 1.141306757926941, 1.226598858833313, 1.3118908405303955, 1.3971829414367676, 1.48247492313385, 1.5677669048309326, 1.6530590057373047, 1.7383509874343872, 1.8236429691314697, 1.9089350700378418, 1.9942270517349243, 2.079519033432007, 2.164811134338379, 2.250102996826172, 2.335395097732544, 2.420687198638916]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 11.0, 13.0, 15.0, 31.0, 47.0, 72.0, 99.0, 149.0, 236.0, 320.0, 562.0, 861.0, 1440.0, 2470.0, 4775.0, 10208.0, 26285.0, 122434.0, 3879397.0, 101224.0, 23233.0, 9252.0, 4484.0, 2476.0, 1462.0, 889.0, 587.0, 380.0, 248.0, 178.0, 118.0, 99.0, 63.0, 43.0, 26.0, 27.0, 23.0, 11.0, 8.0, 12.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.322265625, -0.31317901611328125, -0.3040924072265625, -0.29500579833984375, -0.285919189453125, -0.27683258056640625, -0.2677459716796875, -0.25865936279296875, -0.24957275390625, -0.24048614501953125, -0.2313995361328125, -0.22231292724609375, -0.213226318359375, -0.20413970947265625, -0.1950531005859375, -0.18596649169921875, -0.1768798828125, -0.16779327392578125, -0.1587066650390625, -0.14962005615234375, -0.140533447265625, -0.13144683837890625, -0.1223602294921875, -0.11327362060546875, -0.10418701171875, -0.09510040283203125, -0.0860137939453125, -0.07692718505859375, -0.067840576171875, -0.05875396728515625, -0.0496673583984375, -0.04058074951171875, -0.031494140625, -0.02240753173828125, -0.0133209228515625, -0.00423431396484375, 0.004852294921875, 0.01393890380859375, 0.0230255126953125, 0.03211212158203125, 0.04119873046875, 0.05028533935546875, 0.0593719482421875, 0.06845855712890625, 0.077545166015625, 0.08663177490234375, 0.0957183837890625, 0.10480499267578125, 0.1138916015625, 0.12297821044921875, 0.1320648193359375, 0.14115142822265625, 0.150238037109375, 0.15932464599609375, 0.1684112548828125, 0.17749786376953125, 0.18658447265625, 0.19567108154296875, 0.2047576904296875, 0.21384429931640625, 0.222930908203125, 0.23201751708984375, 0.2411041259765625, 0.25019073486328125, 0.25927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 2.0, 11.0, 8.0, 11.0, 13.0, 16.0, 27.0, 54.0, 101.0, 209.0, 242.0, 112.0, 55.0, 20.0, 15.0, 8.0, 13.0, 8.0, 5.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.036008358001708984, -0.03484630584716797, -0.03368425369262695, -0.03252220153808594, -0.03136014938354492, -0.030198097229003906, -0.02903604507446289, -0.027873992919921875, -0.02671194076538086, -0.025549888610839844, -0.024387836456298828, -0.023225784301757812, -0.022063732147216797, -0.02090167999267578, -0.019739627838134766, -0.01857757568359375, -0.017415523529052734, -0.01625347137451172, -0.015091419219970703, -0.013929367065429688, -0.012767314910888672, -0.011605262756347656, -0.01044321060180664, -0.009281158447265625, -0.00811910629272461, -0.006957054138183594, -0.005795001983642578, -0.0046329498291015625, -0.003470897674560547, -0.0023088455200195312, -0.0011467933654785156, 1.52587890625e-05, 0.0011773109436035156, 0.0023393630981445312, 0.003501415252685547, 0.0046634674072265625, 0.005825519561767578, 0.006987571716308594, 0.00814962387084961, 0.009311676025390625, 0.01047372817993164, 0.011635780334472656, 0.012797832489013672, 0.013959884643554688, 0.015121936798095703, 0.01628398895263672, 0.017446041107177734, 0.01860809326171875, 0.019770145416259766, 0.02093219757080078, 0.022094249725341797, 0.023256301879882812, 0.024418354034423828, 0.025580406188964844, 0.02674245834350586, 0.027904510498046875, 0.02906656265258789, 0.030228614807128906, 0.03139066696166992, 0.03255271911621094, 0.03371477127075195, 0.03487682342529297, 0.036038875579833984, 0.037200927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 14.0, 23.0, 41.0, 50.0, 72.0, 148.0, 271.0, 591.0, 1369.0, 3744.0, 12517.0, 55023.0, 572250.0, 3386271.0, 128856.0, 22979.0, 6105.0, 2153.0, 908.0, 402.0, 190.0, 105.0, 68.0, 39.0, 28.0, 15.0, 8.0, 10.0, 5.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2549896240234375, -0.246551513671875, -0.2381134033203125, -0.22967529296875, -0.2212371826171875, -0.212799072265625, -0.2043609619140625, -0.1959228515625, -0.1874847412109375, -0.179046630859375, -0.1706085205078125, -0.16217041015625, -0.1537322998046875, -0.145294189453125, -0.1368560791015625, -0.12841796875, -0.1199798583984375, -0.111541748046875, -0.1031036376953125, -0.09466552734375, -0.0862274169921875, -0.077789306640625, -0.0693511962890625, -0.0609130859375, -0.0524749755859375, -0.044036865234375, -0.0355987548828125, -0.02716064453125, -0.0187225341796875, -0.010284423828125, -0.0018463134765625, 0.006591796875, 0.0150299072265625, 0.023468017578125, 0.0319061279296875, 0.04034423828125, 0.0487823486328125, 0.057220458984375, 0.0656585693359375, 0.0740966796875, 0.0825347900390625, 0.090972900390625, 0.0994110107421875, 0.10784912109375, 0.1162872314453125, 0.124725341796875, 0.1331634521484375, 0.1416015625, 0.1500396728515625, 0.158477783203125, 0.1669158935546875, 0.17535400390625, 0.1837921142578125, 0.192230224609375, 0.2006683349609375, 0.2091064453125, 0.2175445556640625, 0.225982666015625, 0.2344207763671875, 0.24285888671875, 0.2512969970703125, 0.259735107421875, 0.2681732177734375, 0.276611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 9.0, 7.0, 13.0, 11.0, 15.0, 16.0, 24.0, 39.0, 67.0, 106.0, 138.0, 251.0, 541.0, 1639.0, 468.0, 231.0, 146.0, 97.0, 64.0, 46.0, 34.0, 17.0, 12.0, 11.0, 14.0, 7.0, 9.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.038083553314208984, -0.03682994842529297, -0.03557634353637695, -0.03432273864746094, -0.03306913375854492, -0.031815528869628906, -0.03056192398071289, -0.029308319091796875, -0.02805471420288086, -0.026801109313964844, -0.025547504425048828, -0.024293899536132812, -0.023040294647216797, -0.02178668975830078, -0.020533084869384766, -0.01927947998046875, -0.018025875091552734, -0.01677227020263672, -0.015518665313720703, -0.014265060424804688, -0.013011455535888672, -0.011757850646972656, -0.01050424575805664, -0.009250640869140625, -0.00799703598022461, -0.006743431091308594, -0.005489826202392578, -0.0042362213134765625, -0.002982616424560547, -0.0017290115356445312, -0.0004754066467285156, 0.0007781982421875, 0.0020318031311035156, 0.0032854080200195312, 0.004539012908935547, 0.0057926177978515625, 0.007046222686767578, 0.008299827575683594, 0.00955343246459961, 0.010807037353515625, 0.01206064224243164, 0.013314247131347656, 0.014567852020263672, 0.015821456909179688, 0.017075061798095703, 0.01832866668701172, 0.019582271575927734, 0.02083587646484375, 0.022089481353759766, 0.02334308624267578, 0.024596691131591797, 0.025850296020507812, 0.027103900909423828, 0.028357505798339844, 0.02961111068725586, 0.030864715576171875, 0.03211832046508789, 0.033371925354003906, 0.03462553024291992, 0.03587913513183594, 0.03713274002075195, 0.03838634490966797, 0.039639949798583984, 0.0408935546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 92.0, 442.0, 353.0, 74.0, 15.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2886160910129547, -0.2639516294002533, -0.23928715288639069, -0.21462269127368927, -0.18995821475982666, -0.16529375314712524, -0.14062929153442383, -0.11596481502056122, -0.0913003534078598, -0.06663588434457779, -0.041971419006586075, -0.01730695366859436, 0.007357515394687653, 0.032021984457969666, 0.05668644607067108, 0.08135092258453369, 0.10601538419723511, 0.13067984580993652, 0.15534432232379913, 0.18000878393650055, 0.20467326045036316, 0.22933772206306458, 0.254002183675766, 0.2786666750907898, 0.3033311367034912, 0.3279955983161926, 0.35266005992889404, 0.37732452154159546, 0.40198901295661926, 0.4266534745693207, 0.4513179361820221, 0.4759824275970459, 0.5006468892097473, 0.5253113508224487, 0.5499758124351501, 0.5746402740478516, 0.599304735660553, 0.6239691972732544, 0.6486337184906006, 0.673298180103302, 0.6979626417160034, 0.7226271033287048, 0.7472915649414062, 0.7719560265541077, 0.7966204881668091, 0.8212850093841553, 0.8459494113922119, 0.8706139326095581, 0.8952783346176147, 0.9199427962303162, 0.9446072578430176, 0.969271719455719, 0.9939361810684204, 1.0186007022857666, 1.0432651042938232, 1.0679296255111694, 1.0925941467285156, 1.1172586679458618, 1.1419230699539185, 1.1665875911712646, 1.1912519931793213, 1.2159165143966675, 1.2405809164047241, 1.2652454376220703, 1.289909839630127]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 19.0, 21.0, 35.0, 38.0, 49.0, 47.0, 46.0, 57.0, 60.0, 68.0, 56.0, 57.0, 59.0, 63.0, 45.0, 37.0, 30.0, 36.0, 18.0, 17.0, 10.0, 13.0, 13.0, 8.0, 5.0, 5.0, 10.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.23094552755355835, -0.22420775890350342, -0.21747000515460968, -0.21073223650455475, -0.203994482755661, -0.19725671410560608, -0.19051894545555115, -0.1837811917066574, -0.17704343795776367, -0.17030566930770874, -0.163567915558815, -0.15683014690876007, -0.15009239315986633, -0.1433546245098114, -0.13661685585975647, -0.12987910211086273, -0.1231413334608078, -0.11640357226133347, -0.10966581106185913, -0.1029280424118042, -0.09619028866291046, -0.08945252001285553, -0.0827147588133812, -0.07597699761390686, -0.06923923641443253, -0.06250147521495819, -0.055763714015483856, -0.04902594909071922, -0.04228818789124489, -0.035550426691770554, -0.02881266176700592, -0.022074900567531586, -0.015337139368057251, -0.008599377237260342, -0.0018616151064634323, 0.004876147955656052, 0.011613909155130386, 0.01835167035460472, 0.025089435279369354, 0.03182719647884369, 0.038564957678318024, 0.04530271887779236, 0.05204048007726669, 0.058778245002031326, 0.06551600992679596, 0.0722537636756897, 0.07899153232574463, 0.08572929352521896, 0.0924670547246933, 0.09920481592416763, 0.10594257712364197, 0.1126803457736969, 0.11941809952259064, 0.12615586817264557, 0.1328936219215393, 0.13963139057159424, 0.14636915922164917, 0.1531069278717041, 0.15984468162059784, 0.16658245027065277, 0.1733202040195465, 0.18005797266960144, 0.18679574131965637, 0.1935334950685501, 0.20027124881744385]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 12.0, 26.0, 20.0, 40.0, 53.0, 83.0, 101.0, 149.0, 222.0, 357.0, 505.0, 864.0, 1349.0, 2219.0, 3747.0, 7230.0, 15584.0, 39957.0, 244889.0, 621690.0, 66505.0, 21328.0, 9589.0, 4915.0, 2768.0, 1570.0, 933.0, 588.0, 396.0, 258.0, 170.0, 136.0, 85.0, 55.0, 45.0, 28.0, 15.0, 16.0, 17.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.222412109375, -0.21626663208007812, -0.21012115478515625, -0.20397567749023438, -0.1978302001953125, -0.19168472290039062, -0.18553924560546875, -0.17939376831054688, -0.173248291015625, -0.16710281372070312, -0.16095733642578125, -0.15481185913085938, -0.1486663818359375, -0.14252090454101562, -0.13637542724609375, -0.13022994995117188, -0.12408447265625, -0.11793899536132812, -0.11179351806640625, -0.10564804077148438, -0.0995025634765625, -0.09335708618164062, -0.08721160888671875, -0.08106613159179688, -0.074920654296875, -0.06877517700195312, -0.06262969970703125, -0.056484222412109375, -0.0503387451171875, -0.044193267822265625, -0.03804779052734375, -0.031902313232421875, -0.0257568359375, -0.019611358642578125, -0.01346588134765625, -0.007320404052734375, -0.0011749267578125, 0.004970550537109375, 0.01111602783203125, 0.017261505126953125, 0.023406982421875, 0.029552459716796875, 0.03569793701171875, 0.041843414306640625, 0.0479888916015625, 0.054134368896484375, 0.06027984619140625, 0.06642532348632812, 0.07257080078125, 0.07871627807617188, 0.08486175537109375, 0.09100723266601562, 0.0971527099609375, 0.10329818725585938, 0.10944366455078125, 0.11558914184570312, 0.121734619140625, 0.12788009643554688, 0.13402557373046875, 0.14017105102539062, 0.1463165283203125, 0.15246200561523438, 0.15860748291015625, 0.16475296020507812, 0.1708984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 3.0, 14.0, 12.0, 10.0, 19.0, 25.0, 44.0, 85.0, 152.0, 216.0, 152.0, 92.0, 51.0, 26.0, 18.0, 13.0, 11.0, 9.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03662109375, -0.03542137145996094, -0.034221649169921875, -0.03302192687988281, -0.03182220458984375, -0.030622482299804688, -0.029422760009765625, -0.028223037719726562, -0.0270233154296875, -0.025823593139648438, -0.024623870849609375, -0.023424148559570312, -0.02222442626953125, -0.021024703979492188, -0.019824981689453125, -0.018625259399414062, -0.017425537109375, -0.016225814819335938, -0.015026092529296875, -0.013826370239257812, -0.01262664794921875, -0.011426925659179688, -0.010227203369140625, -0.009027481079101562, -0.0078277587890625, -0.0066280364990234375, -0.005428314208984375, -0.0042285919189453125, -0.00302886962890625, -0.0018291473388671875, -0.000629425048828125, 0.0005702972412109375, 0.00177001953125, 0.0029697418212890625, 0.004169464111328125, 0.0053691864013671875, 0.00656890869140625, 0.0077686309814453125, 0.008968353271484375, 0.010168075561523438, 0.0113677978515625, 0.012567520141601562, 0.013767242431640625, 0.014966964721679688, 0.01616668701171875, 0.017366409301757812, 0.018566131591796875, 0.019765853881835938, 0.020965576171875, 0.022165298461914062, 0.023365020751953125, 0.024564743041992188, 0.02576446533203125, 0.026964187622070312, 0.028163909912109375, 0.029363632202148438, 0.0305633544921875, 0.03176307678222656, 0.032962799072265625, 0.03416252136230469, 0.03536224365234375, 0.03656196594238281, 0.037761688232421875, 0.03896141052246094, 0.0401611328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 13.0, 8.0, 8.0, 19.0, 25.0, 48.0, 52.0, 87.0, 138.0, 244.0, 357.0, 637.0, 1200.0, 2476.0, 5943.0, 15279.0, 46885.0, 185956.0, 521220.0, 194403.0, 47503.0, 15079.0, 5696.0, 2447.0, 1198.0, 655.0, 317.0, 215.0, 152.0, 78.0, 55.0, 42.0, 36.0, 22.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12062358856201172, -0.11679649353027344, -0.11296939849853516, -0.10914230346679688, -0.1053152084350586, -0.10148811340332031, -0.09766101837158203, -0.09383392333984375, -0.09000682830810547, -0.08617973327636719, -0.0823526382446289, -0.07852554321289062, -0.07469844818115234, -0.07087135314941406, -0.06704425811767578, -0.0632171630859375, -0.05939006805419922, -0.05556297302246094, -0.051735877990722656, -0.047908782958984375, -0.044081687927246094, -0.04025459289550781, -0.03642749786376953, -0.03260040283203125, -0.02877330780029297, -0.024946212768554688, -0.021119117736816406, -0.017292022705078125, -0.013464927673339844, -0.009637832641601562, -0.005810737609863281, -0.001983642578125, 0.0018434524536132812, 0.0056705474853515625, 0.009497642517089844, 0.013324737548828125, 0.017151832580566406, 0.020978927612304688, 0.02480602264404297, 0.02863311767578125, 0.03246021270751953, 0.03628730773925781, 0.040114402770996094, 0.043941497802734375, 0.047768592834472656, 0.05159568786621094, 0.05542278289794922, 0.0592498779296875, 0.06307697296142578, 0.06690406799316406, 0.07073116302490234, 0.07455825805664062, 0.0783853530883789, 0.08221244812011719, 0.08603954315185547, 0.08986663818359375, 0.09369373321533203, 0.09752082824707031, 0.1013479232788086, 0.10517501831054688, 0.10900211334228516, 0.11282920837402344, 0.11665630340576172, 0.1204833984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 26.0, 20.0, 29.0, 27.0, 21.0, 31.0, 43.0, 25.0, 52.0, 48.0, 49.0, 38.0, 43.0, 44.0, 56.0, 49.0, 41.0, 27.0, 42.0, 31.0, 29.0, 26.0, 25.0, 24.0, 18.0, 10.0, 8.0, 11.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0965576171875, -0.09331607818603516, -0.09007453918457031, -0.08683300018310547, -0.08359146118164062, -0.08034992218017578, -0.07710838317871094, -0.0738668441772461, -0.07062530517578125, -0.0673837661743164, -0.06414222717285156, -0.06090068817138672, -0.057659149169921875, -0.05441761016845703, -0.05117607116699219, -0.047934532165527344, -0.0446929931640625, -0.041451454162597656, -0.03820991516113281, -0.03496837615966797, -0.031726837158203125, -0.02848529815673828, -0.025243759155273438, -0.022002220153808594, -0.01876068115234375, -0.015519142150878906, -0.012277603149414062, -0.009036064147949219, -0.005794525146484375, -0.0025529861450195312, 0.0006885528564453125, 0.003930091857910156, 0.007171630859375, 0.010413169860839844, 0.013654708862304688, 0.01689624786376953, 0.020137786865234375, 0.02337932586669922, 0.026620864868164062, 0.029862403869628906, 0.03310394287109375, 0.036345481872558594, 0.03958702087402344, 0.04282855987548828, 0.046070098876953125, 0.04931163787841797, 0.05255317687988281, 0.055794715881347656, 0.0590362548828125, 0.062277793884277344, 0.06551933288574219, 0.06876087188720703, 0.07200241088867188, 0.07524394989013672, 0.07848548889160156, 0.0817270278930664, 0.08496856689453125, 0.0882101058959961, 0.09145164489746094, 0.09469318389892578, 0.09793472290039062, 0.10117626190185547, 0.10441780090332031, 0.10765933990478516, 0.11090087890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 16.0, 15.0, 26.0, 41.0, 59.0, 95.0, 117.0, 184.0, 333.0, 660.0, 1173.0, 2511.0, 6280.0, 20072.0, 97445.0, 564946.0, 290576.0, 44609.0, 11459.0, 3992.0, 1817.0, 861.0, 477.0, 277.0, 176.0, 101.0, 70.0, 47.0, 31.0, 21.0, 15.0, 10.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1287059783935547, -0.12423324584960938, -0.11976051330566406, -0.11528778076171875, -0.11081504821777344, -0.10634231567382812, -0.10186958312988281, -0.0973968505859375, -0.09292411804199219, -0.08845138549804688, -0.08397865295410156, -0.07950592041015625, -0.07503318786621094, -0.07056045532226562, -0.06608772277832031, -0.061614990234375, -0.05714225769042969, -0.052669525146484375, -0.04819679260253906, -0.04372406005859375, -0.03925132751464844, -0.034778594970703125, -0.030305862426757812, -0.0258331298828125, -0.021360397338867188, -0.016887664794921875, -0.012414932250976562, -0.00794219970703125, -0.0034694671630859375, 0.001003265380859375, 0.0054759979248046875, 0.00994873046875, 0.014421463012695312, 0.018894195556640625, 0.023366928100585938, 0.02783966064453125, 0.03231239318847656, 0.036785125732421875, 0.04125785827636719, 0.0457305908203125, 0.05020332336425781, 0.054676055908203125, 0.05914878845214844, 0.06362152099609375, 0.06809425354003906, 0.07256698608398438, 0.07703971862792969, 0.081512451171875, 0.08598518371582031, 0.09045791625976562, 0.09493064880371094, 0.09940338134765625, 0.10387611389160156, 0.10834884643554688, 0.11282157897949219, 0.1172943115234375, 0.12176704406738281, 0.12623977661132812, 0.13071250915527344, 0.13518524169921875, 0.13965797424316406, 0.14413070678710938, 0.1486034393310547, 0.153076171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 3.0, 11.0, 25.0, 23.0, 32.0, 40.0, 47.0, 67.0, 84.0, 88.0, 107.0, 107.0, 92.0, 59.0, 60.0, 54.0, 23.0, 28.0, 22.0, 10.0, 9.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.7663463950157166e-05, -1.6611069440841675e-05, -1.5558674931526184e-05, -1.4506280422210693e-05, -1.3453885912895203e-05, -1.2401491403579712e-05, -1.1349096894264221e-05, -1.029670238494873e-05, -9.24430787563324e-06, -8.191913366317749e-06, -7.139518857002258e-06, -6.087124347686768e-06, -5.034729838371277e-06, -3.982335329055786e-06, -2.9299408197402954e-06, -1.8775463104248047e-06, -8.25151801109314e-07, 2.2724270820617676e-07, 1.2796372175216675e-06, 2.332031726837158e-06, 3.384426236152649e-06, 4.43682074546814e-06, 5.48921525478363e-06, 6.541609764099121e-06, 7.594004273414612e-06, 8.646398782730103e-06, 9.698793292045593e-06, 1.0751187801361084e-05, 1.1803582310676575e-05, 1.2855976819992065e-05, 1.3908371329307556e-05, 1.4960765838623047e-05, 1.6013160347938538e-05, 1.706555485725403e-05, 1.811794936656952e-05, 1.917034387588501e-05, 2.02227383852005e-05, 2.127513289451599e-05, 2.2327527403831482e-05, 2.3379921913146973e-05, 2.4432316422462463e-05, 2.5484710931777954e-05, 2.6537105441093445e-05, 2.7589499950408936e-05, 2.8641894459724426e-05, 2.9694288969039917e-05, 3.074668347835541e-05, 3.17990779876709e-05, 3.285147249698639e-05, 3.390386700630188e-05, 3.495626151561737e-05, 3.600865602493286e-05, 3.706105053424835e-05, 3.811344504356384e-05, 3.9165839552879333e-05, 4.0218234062194824e-05, 4.1270628571510315e-05, 4.2323023080825806e-05, 4.3375417590141296e-05, 4.442781209945679e-05, 4.548020660877228e-05, 4.653260111808777e-05, 4.758499562740326e-05, 4.863739013671875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 32.0, 46.0, 61.0, 78.0, 142.0, 230.0, 353.0, 630.0, 1141.0, 2224.0, 4822.0, 11893.0, 36418.0, 153478.0, 509231.0, 245839.0, 54062.0, 16008.0, 5989.0, 2661.0, 1324.0, 704.0, 399.0, 256.0, 135.0, 93.0, 69.0, 48.0, 31.0, 25.0, 10.0, 21.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.1171875, -0.11380577087402344, -0.11042404174804688, -0.10704231262207031, -0.10366058349609375, -0.10027885437011719, -0.09689712524414062, -0.09351539611816406, -0.0901336669921875, -0.08675193786621094, -0.08337020874023438, -0.07998847961425781, -0.07660675048828125, -0.07322502136230469, -0.06984329223632812, -0.06646156311035156, -0.063079833984375, -0.05969810485839844, -0.056316375732421875, -0.05293464660644531, -0.04955291748046875, -0.04617118835449219, -0.042789459228515625, -0.03940773010253906, -0.0360260009765625, -0.03264427185058594, -0.029262542724609375, -0.025880813598632812, -0.02249908447265625, -0.019117355346679688, -0.015735626220703125, -0.012353897094726562, -0.00897216796875, -0.0055904388427734375, -0.002208709716796875, 0.0011730194091796875, 0.00455474853515625, 0.007936477661132812, 0.011318206787109375, 0.014699935913085938, 0.0180816650390625, 0.021463394165039062, 0.024845123291015625, 0.028226852416992188, 0.03160858154296875, 0.03499031066894531, 0.038372039794921875, 0.04175376892089844, 0.045135498046875, 0.04851722717285156, 0.051898956298828125, 0.05528068542480469, 0.05866241455078125, 0.06204414367675781, 0.06542587280273438, 0.06880760192871094, 0.0721893310546875, 0.07557106018066406, 0.07895278930664062, 0.08233451843261719, 0.08571624755859375, 0.08909797668457031, 0.09247970581054688, 0.09586143493652344, 0.0992431640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 15.0, 22.0, 16.0, 23.0, 28.0, 30.0, 48.0, 58.0, 73.0, 74.0, 80.0, 67.0, 79.0, 55.0, 65.0, 68.0, 43.0, 27.0, 21.0, 14.0, 13.0, 10.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08795166015625, -0.08558177947998047, -0.08321189880371094, -0.0808420181274414, -0.07847213745117188, -0.07610225677490234, -0.07373237609863281, -0.07136249542236328, -0.06899261474609375, -0.06662273406982422, -0.06425285339355469, -0.061882972717285156, -0.059513092041015625, -0.057143211364746094, -0.05477333068847656, -0.05240345001220703, -0.0500335693359375, -0.04766368865966797, -0.04529380798339844, -0.042923927307128906, -0.040554046630859375, -0.038184165954589844, -0.03581428527832031, -0.03344440460205078, -0.03107452392578125, -0.02870464324951172, -0.026334762573242188, -0.023964881896972656, -0.021595001220703125, -0.019225120544433594, -0.016855239868164062, -0.014485359191894531, -0.012115478515625, -0.009745597839355469, -0.0073757171630859375, -0.005005836486816406, -0.002635955810546875, -0.00026607513427734375, 0.0021038055419921875, 0.004473686218261719, 0.00684356689453125, 0.009213447570800781, 0.011583328247070312, 0.013953208923339844, 0.016323089599609375, 0.018692970275878906, 0.021062850952148438, 0.02343273162841797, 0.0258026123046875, 0.02817249298095703, 0.030542373657226562, 0.032912254333496094, 0.035282135009765625, 0.037652015686035156, 0.04002189636230469, 0.04239177703857422, 0.04476165771484375, 0.04713153839111328, 0.04950141906738281, 0.051871299743652344, 0.054241180419921875, 0.056611061096191406, 0.05898094177246094, 0.06135082244873047, 0.063720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 11.0, 92.0, 785.0, 112.0, 13.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.077866554260254, -0.9116312861442566, -0.7453960180282593, -0.579160749912262, -0.41292548179626465, -0.24669021368026733, -0.08045494556427002, 0.08578038215637207, 0.2520155906677246, 0.4182508587837219, 0.5844861268997192, 0.7507213950157166, 0.9169566631317139, 1.0831918716430664, 1.2494271993637085, 1.4156625270843506, 1.5818977355957031, 1.7481329441070557, 1.9143682718276978, 2.08060359954834, 2.2468388080596924, 2.413074016571045, 2.5793094635009766, 2.745544672012329, 2.9117798805236816, 3.078015089035034, 3.2442502975463867, 3.4104857444763184, 3.576720952987671, 3.7429561614990234, 3.909191608428955, 4.075427055358887, 4.24166202545166, 4.407897472381592, 4.574132442474365, 4.740367889404297, 4.90660285949707, 5.072838306427002, 5.239073753356934, 5.405308723449707, 5.571544170379639, 5.73777961730957, 5.904014587402344, 6.070250034332275, 6.236485481262207, 6.4027204513549805, 6.568955898284912, 6.735191345214844, 6.901426315307617, 7.067661762237549, 7.233896732330322, 7.400132179260254, 7.566367149353027, 7.732602596282959, 7.898838043212891, 8.065073013305664, 8.231307983398438, 8.397542953491211, 8.5637788772583, 8.730013847351074, 8.896248817443848, 9.062484741210938, 9.228719711303711, 9.394954681396484, 9.561190605163574]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 10.0, 4.0, 6.0, 8.0, 16.0, 12.0, 19.0, 23.0, 37.0, 69.0, 52.0, 65.0, 75.0, 71.0, 83.0, 83.0, 71.0, 63.0, 48.0, 49.0, 20.0, 15.0, 17.0, 10.0, 17.0, 9.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1898272037506104, -1.1554876565933228, -1.1211482286453247, -1.086808681488037, -1.052469253540039, -1.0181297063827515, -0.9837902188301086, -0.9494507312774658, -0.915111243724823, -0.8807717561721802, -0.8464322686195374, -0.8120927810668945, -0.7777532339096069, -0.7434138059616089, -0.7090742588043213, -0.6747347712516785, -0.6403952836990356, -0.6060557961463928, -0.57171630859375, -0.5373768210411072, -0.5030373334884644, -0.46869781613349915, -0.43435829877853394, -0.4000188112258911, -0.3656793236732483, -0.33133983612060547, -0.29700034856796265, -0.26266083121299744, -0.22832134366035461, -0.1939818561077118, -0.15964235365390778, -0.12530285120010376, -0.09096336364746094, -0.05662386864423752, -0.0222843736410141, 0.01205512136220932, 0.04639461636543274, 0.08073410391807556, 0.11507360637187958, 0.1494131088256836, 0.18375259637832642, 0.21809208393096924, 0.25243157148361206, 0.28677108883857727, 0.3211105763912201, 0.3554500639438629, 0.3897895812988281, 0.42412906885147095, 0.45846855640411377, 0.4928080439567566, 0.5271475315093994, 0.5614870190620422, 0.5958265066146851, 0.6301660537719727, 0.6645055413246155, 0.6988450288772583, 0.7331845164299011, 0.767524003982544, 0.8018634915351868, 0.8362029790878296, 0.8705425262451172, 0.9048819541931152, 0.9392215013504028, 0.9735609889030457, 1.0079004764556885]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 16.0, 11.0, 18.0, 28.0, 30.0, 27.0, 65.0, 79.0, 106.0, 139.0, 200.0, 333.0, 436.0, 660.0, 1059.0, 1706.0, 3092.0, 6029.0, 13899.0, 46188.0, 878554.0, 3159404.0, 52098.0, 14899.0, 6340.0, 3187.0, 1788.0, 1147.0, 737.0, 512.0, 357.0, 246.0, 205.0, 150.0, 112.0, 78.0, 69.0, 47.0, 52.0, 40.0, 28.0, 28.0, 23.0, 15.0, 14.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3408050537109375, -0.329071044921875, -0.3173370361328125, -0.30560302734375, -0.2938690185546875, -0.282135009765625, -0.2704010009765625, -0.2586669921875, -0.2469329833984375, -0.235198974609375, -0.2234649658203125, -0.21173095703125, -0.1999969482421875, -0.188262939453125, -0.1765289306640625, -0.164794921875, -0.1530609130859375, -0.141326904296875, -0.1295928955078125, -0.11785888671875, -0.1061248779296875, -0.094390869140625, -0.0826568603515625, -0.0709228515625, -0.0591888427734375, -0.047454833984375, -0.0357208251953125, -0.02398681640625, -0.0122528076171875, -0.000518798828125, 0.0112152099609375, 0.02294921875, 0.0346832275390625, 0.046417236328125, 0.0581512451171875, 0.06988525390625, 0.0816192626953125, 0.093353271484375, 0.1050872802734375, 0.1168212890625, 0.1285552978515625, 0.140289306640625, 0.1520233154296875, 0.16375732421875, 0.1754913330078125, 0.187225341796875, 0.1989593505859375, 0.210693359375, 0.2224273681640625, 0.234161376953125, 0.2458953857421875, 0.25762939453125, 0.2693634033203125, 0.281097412109375, 0.2928314208984375, 0.3045654296875, 0.3162994384765625, 0.328033447265625, 0.3397674560546875, 0.35150146484375, 0.3632354736328125, 0.374969482421875, 0.3867034912109375, 0.3984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 8.0, 5.0, 3.0, 6.0, 2.0, 6.0, 14.0, 12.0, 22.0, 31.0, 44.0, 65.0, 110.0, 161.0, 133.0, 117.0, 94.0, 47.0, 38.0, 27.0, 13.0, 11.0, 7.0, 3.0, 2.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.034088134765625, -0.032959938049316406, -0.03183174133300781, -0.03070354461669922, -0.029575347900390625, -0.02844715118408203, -0.027318954467773438, -0.026190757751464844, -0.02506256103515625, -0.023934364318847656, -0.022806167602539062, -0.02167797088623047, -0.020549774169921875, -0.01942157745361328, -0.018293380737304688, -0.017165184020996094, -0.0160369873046875, -0.014908790588378906, -0.013780593872070312, -0.012652397155761719, -0.011524200439453125, -0.010396003723144531, -0.009267807006835938, -0.008139610290527344, -0.00701141357421875, -0.005883216857910156, -0.0047550201416015625, -0.0036268234252929688, -0.002498626708984375, -0.0013704299926757812, -0.0002422332763671875, 0.0008859634399414062, 0.00201416015625, 0.0031423568725585938, 0.0042705535888671875, 0.005398750305175781, 0.006526947021484375, 0.007655143737792969, 0.008783340454101562, 0.009911537170410156, 0.01103973388671875, 0.012167930603027344, 0.013296127319335938, 0.014424324035644531, 0.015552520751953125, 0.01668071746826172, 0.017808914184570312, 0.018937110900878906, 0.0200653076171875, 0.021193504333496094, 0.022321701049804688, 0.02344989776611328, 0.024578094482421875, 0.02570629119873047, 0.026834487915039062, 0.027962684631347656, 0.02909088134765625, 0.030219078063964844, 0.03134727478027344, 0.03247547149658203, 0.033603668212890625, 0.03473186492919922, 0.03586006164550781, 0.036988258361816406, 0.038116455078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 8.0, 16.0, 12.0, 27.0, 66.0, 133.0, 344.0, 1361.0, 10417.0, 321676.0, 3829569.0, 26984.0, 2699.0, 571.0, 181.0, 87.0, 39.0, 25.0, 20.0, 12.0, 8.0, 1.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8121795654296875, -0.788421630859375, -0.7646636962890625, -0.74090576171875, -0.7171478271484375, -0.693389892578125, -0.6696319580078125, -0.6458740234375, -0.6221160888671875, -0.598358154296875, -0.5746002197265625, -0.55084228515625, -0.5270843505859375, -0.503326416015625, -0.4795684814453125, -0.455810546875, -0.4320526123046875, -0.408294677734375, -0.3845367431640625, -0.36077880859375, -0.3370208740234375, -0.313262939453125, -0.2895050048828125, -0.2657470703125, -0.2419891357421875, -0.218231201171875, -0.1944732666015625, -0.17071533203125, -0.1469573974609375, -0.123199462890625, -0.0994415283203125, -0.07568359375, -0.0519256591796875, -0.028167724609375, -0.0044097900390625, 0.01934814453125, 0.0431060791015625, 0.066864013671875, 0.0906219482421875, 0.1143798828125, 0.1381378173828125, 0.161895751953125, 0.1856536865234375, 0.20941162109375, 0.2331695556640625, 0.256927490234375, 0.2806854248046875, 0.304443359375, 0.3282012939453125, 0.351959228515625, 0.3757171630859375, 0.39947509765625, 0.4232330322265625, 0.446990966796875, 0.4707489013671875, 0.4945068359375, 0.5182647705078125, 0.542022705078125, 0.5657806396484375, 0.58953857421875, 0.6132965087890625, 0.637054443359375, 0.6608123779296875, 0.6845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 10.0, 22.0, 28.0, 49.0, 69.0, 113.0, 276.0, 683.0, 1950.0, 410.0, 193.0, 89.0, 50.0, 37.0, 20.0, 16.0, 12.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06629371643066406, -0.06410598754882812, -0.06191825866699219, -0.05973052978515625, -0.05754280090332031, -0.055355072021484375, -0.05316734313964844, -0.0509796142578125, -0.04879188537597656, -0.046604156494140625, -0.04441642761230469, -0.04222869873046875, -0.04004096984863281, -0.037853240966796875, -0.03566551208496094, -0.033477783203125, -0.03129005432128906, -0.029102325439453125, -0.026914596557617188, -0.02472686767578125, -0.022539138793945312, -0.020351409912109375, -0.018163681030273438, -0.0159759521484375, -0.013788223266601562, -0.011600494384765625, -0.009412765502929688, -0.00722503662109375, -0.0050373077392578125, -0.002849578857421875, -0.0006618499755859375, 0.00152587890625, 0.0037136077880859375, 0.005901336669921875, 0.008089065551757812, 0.01027679443359375, 0.012464523315429688, 0.014652252197265625, 0.016839981079101562, 0.0190277099609375, 0.021215438842773438, 0.023403167724609375, 0.025590896606445312, 0.02777862548828125, 0.029966354370117188, 0.032154083251953125, 0.03434181213378906, 0.036529541015625, 0.03871726989746094, 0.040904998779296875, 0.04309272766113281, 0.04528045654296875, 0.04746818542480469, 0.049655914306640625, 0.05184364318847656, 0.0540313720703125, 0.05621910095214844, 0.058406829833984375, 0.06059455871582031, 0.06278228759765625, 0.06497001647949219, 0.06715774536132812, 0.06934547424316406, 0.071533203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 16.0, 19.0, 26.0, 75.0, 120.0, 136.0, 190.0, 147.0, 107.0, 67.0, 32.0, 23.0, 11.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3303999900817871, -0.32059523463249207, -0.31079044938087463, -0.3009856939315796, -0.29118093848228455, -0.2813761830329895, -0.27157139778137207, -0.261766642332077, -0.251961886882782, -0.24215711653232574, -0.2323523610830307, -0.22254759073257446, -0.21274283528327942, -0.20293806493282318, -0.19313329458236694, -0.1833285391330719, -0.17352375388145447, -0.16371898353099823, -0.15391422808170319, -0.14410945773124695, -0.1343047022819519, -0.12449993193149567, -0.11469516158103943, -0.10489039868116379, -0.09508563578128815, -0.0852808728814125, -0.07547610998153687, -0.06567133963108063, -0.05586657673120499, -0.046061813831329346, -0.036257047206163406, -0.026452280580997467, -0.016647517681121826, -0.006842752918601036, 0.002962011843919754, 0.012766776606440544, 0.022571541368961334, 0.032376304268836975, 0.042181070894002914, 0.051985837519168854, 0.061790600419044495, 0.07159536331892014, 0.08140012621879578, 0.09120489656925201, 0.10100965946912766, 0.1108144223690033, 0.12061919271945953, 0.13042396306991577, 0.14022871851921082, 0.15003348886966705, 0.1598382443189621, 0.16964301466941833, 0.17944777011871338, 0.18925254046916962, 0.19905731081962585, 0.2088620662689209, 0.21866683661937714, 0.22847160696983337, 0.23827636241912842, 0.24808113276958466, 0.2578859031200409, 0.26769065856933594, 0.277495414018631, 0.2873001992702484, 0.29710495471954346]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 4.0, 8.0, 10.0, 7.0, 15.0, 22.0, 21.0, 32.0, 39.0, 36.0, 43.0, 58.0, 63.0, 62.0, 70.0, 69.0, 57.0, 59.0, 57.0, 41.0, 59.0, 34.0, 28.0, 25.0, 20.0, 16.0, 7.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23356515169143677, -0.22616197168827057, -0.21875879168510437, -0.21135561168193817, -0.20395243167877197, -0.19654925167560577, -0.18914607167243958, -0.18174290657043457, -0.17433971166610718, -0.16693653166294098, -0.15953335165977478, -0.15213017165660858, -0.14472699165344238, -0.13732381165027618, -0.12992063164710999, -0.12251745909452438, -0.11511428654193878, -0.10771110653877258, -0.10030792653560638, -0.09290474653244019, -0.08550156652927399, -0.07809838652610779, -0.07069521397352219, -0.06329203397035599, -0.05588885396718979, -0.04848567396402359, -0.04108249396085739, -0.03367931768298149, -0.026276137679815292, -0.018872957676649094, -0.011469781398773193, -0.004066601395606995, 0.003336578607559204, 0.010739757679402828, 0.018142936751246452, 0.025546114891767502, 0.0329492948949337, 0.0403524748980999, 0.0477556511759758, 0.055158831179142, 0.0625620111823082, 0.0699651911854744, 0.0773683711886406, 0.0847715437412262, 0.0921747237443924, 0.0995779037475586, 0.10698108375072479, 0.11438426375389099, 0.12178744375705719, 0.1291906237602234, 0.1365938037633896, 0.1439969837665558, 0.15140016376972198, 0.15880334377288818, 0.1662065088748932, 0.17360970377922058, 0.18101286888122559, 0.18841604888439178, 0.19581922888755798, 0.20322240889072418, 0.21062558889389038, 0.21802876889705658, 0.22543194890022278, 0.23283511400222778, 0.24023830890655518]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 15.0, 18.0, 25.0, 31.0, 42.0, 68.0, 79.0, 138.0, 211.0, 291.0, 461.0, 811.0, 1392.0, 2460.0, 4779.0, 10877.0, 32468.0, 167038.0, 647489.0, 132026.0, 28150.0, 9604.0, 4405.0, 2279.0, 1228.0, 726.0, 454.0, 305.0, 193.0, 150.0, 96.0, 65.0, 48.0, 38.0, 26.0, 23.0, 8.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22307205200195312, -0.21494293212890625, -0.20681381225585938, -0.1986846923828125, -0.19055557250976562, -0.18242645263671875, -0.17429733276367188, -0.166168212890625, -0.15803909301757812, -0.14990997314453125, -0.14178085327148438, -0.1336517333984375, -0.12552261352539062, -0.11739349365234375, -0.10926437377929688, -0.10113525390625, -0.09300613403320312, -0.08487701416015625, -0.07674789428710938, -0.0686187744140625, -0.060489654541015625, -0.05236053466796875, -0.044231414794921875, -0.036102294921875, -0.027973175048828125, -0.01984405517578125, -0.011714935302734375, -0.0035858154296875, 0.004543304443359375, 0.01267242431640625, 0.020801544189453125, 0.0289306640625, 0.037059783935546875, 0.04518890380859375, 0.053318023681640625, 0.0614471435546875, 0.06957626342773438, 0.07770538330078125, 0.08583450317382812, 0.093963623046875, 0.10209274291992188, 0.11022186279296875, 0.11835098266601562, 0.1264801025390625, 0.13460922241210938, 0.14273834228515625, 0.15086746215820312, 0.15899658203125, 0.16712570190429688, 0.17525482177734375, 0.18338394165039062, 0.1915130615234375, 0.19964218139648438, 0.20777130126953125, 0.21590042114257812, 0.224029541015625, 0.23215866088867188, 0.24028778076171875, 0.24841690063476562, 0.2565460205078125, 0.2646751403808594, 0.27280426025390625, 0.2809333801269531, 0.2890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 5.0, 11.0, 13.0, 23.0, 31.0, 55.0, 78.0, 122.0, 159.0, 166.0, 115.0, 79.0, 41.0, 32.0, 19.0, 10.0, 9.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038909912109375, -0.03768587112426758, -0.036461830139160156, -0.035237789154052734, -0.03401374816894531, -0.03278970718383789, -0.03156566619873047, -0.030341625213623047, -0.029117584228515625, -0.027893543243408203, -0.02666950225830078, -0.02544546127319336, -0.024221420288085938, -0.022997379302978516, -0.021773338317871094, -0.020549297332763672, -0.01932525634765625, -0.018101215362548828, -0.016877174377441406, -0.015653133392333984, -0.014429092407226562, -0.01320505142211914, -0.011981010437011719, -0.010756969451904297, -0.009532928466796875, -0.008308887481689453, -0.007084846496582031, -0.005860805511474609, -0.0046367645263671875, -0.0034127235412597656, -0.0021886825561523438, -0.0009646415710449219, 0.0002593994140625, 0.0014834403991699219, 0.0027074813842773438, 0.003931522369384766, 0.0051555633544921875, 0.006379604339599609, 0.007603645324707031, 0.008827686309814453, 0.010051727294921875, 0.011275768280029297, 0.012499809265136719, 0.01372385025024414, 0.014947891235351562, 0.016171932220458984, 0.017395973205566406, 0.018620014190673828, 0.01984405517578125, 0.021068096160888672, 0.022292137145996094, 0.023516178131103516, 0.024740219116210938, 0.02596426010131836, 0.02718830108642578, 0.028412342071533203, 0.029636383056640625, 0.030860424041748047, 0.03208446502685547, 0.03330850601196289, 0.03453254699707031, 0.035756587982177734, 0.036980628967285156, 0.03820466995239258, 0.0394287109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 13.0, 9.0, 16.0, 21.0, 46.0, 53.0, 79.0, 113.0, 160.0, 303.0, 529.0, 1075.0, 2992.0, 10795.0, 56439.0, 374243.0, 499517.0, 80594.0, 14917.0, 3821.0, 1325.0, 562.0, 333.0, 224.0, 107.0, 58.0, 49.0, 33.0, 29.0, 19.0, 15.0, 8.0, 11.0, 9.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23313331604003906, -0.22420120239257812, -0.2152690887451172, -0.20633697509765625, -0.1974048614501953, -0.18847274780273438, -0.17954063415527344, -0.1706085205078125, -0.16167640686035156, -0.15274429321289062, -0.1438121795654297, -0.13488006591796875, -0.1259479522705078, -0.11701583862304688, -0.10808372497558594, -0.099151611328125, -0.09021949768066406, -0.08128738403320312, -0.07235527038574219, -0.06342315673828125, -0.05449104309082031, -0.045558929443359375, -0.03662681579589844, -0.0276947021484375, -0.018762588500976562, -0.009830474853515625, -0.0008983612060546875, 0.00803375244140625, 0.016965866088867188, 0.025897979736328125, 0.03483009338378906, 0.04376220703125, 0.05269432067871094, 0.061626434326171875, 0.07055854797363281, 0.07949066162109375, 0.08842277526855469, 0.09735488891601562, 0.10628700256347656, 0.1152191162109375, 0.12415122985839844, 0.13308334350585938, 0.1420154571533203, 0.15094757080078125, 0.1598796844482422, 0.16881179809570312, 0.17774391174316406, 0.186676025390625, 0.19560813903808594, 0.20454025268554688, 0.2134723663330078, 0.22240447998046875, 0.2313365936279297, 0.24026870727539062, 0.24920082092285156, 0.2581329345703125, 0.26706504821777344, 0.2759971618652344, 0.2849292755126953, 0.29386138916015625, 0.3027935028076172, 0.3117256164550781, 0.32065773010253906, 0.32958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 2.0, 10.0, 7.0, 11.0, 6.0, 12.0, 14.0, 20.0, 16.0, 28.0, 24.0, 29.0, 29.0, 35.0, 36.0, 37.0, 54.0, 52.0, 54.0, 40.0, 44.0, 48.0, 54.0, 46.0, 42.0, 39.0, 32.0, 35.0, 29.0, 19.0, 13.0, 14.0, 12.0, 9.0, 17.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09634971618652344, -0.09260177612304688, -0.08885383605957031, -0.08510589599609375, -0.08135795593261719, -0.07761001586914062, -0.07386207580566406, -0.0701141357421875, -0.06636619567871094, -0.06261825561523438, -0.05887031555175781, -0.05512237548828125, -0.05137443542480469, -0.047626495361328125, -0.04387855529785156, -0.040130615234375, -0.03638267517089844, -0.032634735107421875, -0.028886795043945312, -0.02513885498046875, -0.021390914916992188, -0.017642974853515625, -0.013895034790039062, -0.0101470947265625, -0.0063991546630859375, -0.002651214599609375, 0.0010967254638671875, 0.00484466552734375, 0.008592605590820312, 0.012340545654296875, 0.016088485717773438, 0.01983642578125, 0.023584365844726562, 0.027332305908203125, 0.031080245971679688, 0.03482818603515625, 0.03857612609863281, 0.042324066162109375, 0.04607200622558594, 0.0498199462890625, 0.05356788635253906, 0.057315826416015625, 0.06106376647949219, 0.06481170654296875, 0.06855964660644531, 0.07230758666992188, 0.07605552673339844, 0.079803466796875, 0.08355140686035156, 0.08729934692382812, 0.09104728698730469, 0.09479522705078125, 0.09854316711425781, 0.10229110717773438, 0.10603904724121094, 0.1097869873046875, 0.11353492736816406, 0.11728286743164062, 0.12103080749511719, 0.12477874755859375, 0.1285266876220703, 0.13227462768554688, 0.13602256774902344, 0.1397705078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 20.0, 19.0, 53.0, 67.0, 66.0, 133.0, 166.0, 222.0, 319.0, 551.0, 922.0, 1682.0, 3171.0, 6682.0, 15176.0, 37878.0, 104135.0, 296515.0, 357164.0, 138945.0, 48746.0, 19120.0, 7989.0, 3872.0, 2043.0, 1096.0, 559.0, 397.0, 239.0, 151.0, 113.0, 80.0, 52.0, 51.0, 31.0, 25.0, 16.0, 14.0, 5.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08282470703125, -0.0802469253540039, -0.07766914367675781, -0.07509136199951172, -0.07251358032226562, -0.06993579864501953, -0.06735801696777344, -0.06478023529052734, -0.06220245361328125, -0.059624671936035156, -0.05704689025878906, -0.05446910858154297, -0.051891326904296875, -0.04931354522705078, -0.04673576354980469, -0.044157981872558594, -0.0415802001953125, -0.039002418518066406, -0.03642463684082031, -0.03384685516357422, -0.031269073486328125, -0.02869129180908203, -0.026113510131835938, -0.023535728454589844, -0.02095794677734375, -0.018380165100097656, -0.015802383422851562, -0.013224601745605469, -0.010646820068359375, -0.008069038391113281, -0.0054912567138671875, -0.0029134750366210938, -0.000335693359375, 0.0022420883178710938, 0.0048198699951171875, 0.007397651672363281, 0.009975433349609375, 0.012553215026855469, 0.015130996704101562, 0.017708778381347656, 0.02028656005859375, 0.022864341735839844, 0.025442123413085938, 0.02801990509033203, 0.030597686767578125, 0.03317546844482422, 0.03575325012207031, 0.038331031799316406, 0.0409088134765625, 0.043486595153808594, 0.04606437683105469, 0.04864215850830078, 0.051219940185546875, 0.05379772186279297, 0.05637550354003906, 0.058953285217285156, 0.06153106689453125, 0.06410884857177734, 0.06668663024902344, 0.06926441192626953, 0.07184219360351562, 0.07441997528076172, 0.07699775695800781, 0.0795755386352539, 0.0821533203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 14.0, 14.0, 14.0, 24.0, 23.0, 34.0, 39.0, 37.0, 45.0, 58.0, 79.0, 73.0, 84.0, 65.0, 68.0, 52.0, 48.0, 52.0, 33.0, 29.0, 23.0, 21.0, 15.0, 15.0, 8.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.647804260253906e-05, -3.535579890012741e-05, -3.423355519771576e-05, -3.311131149530411e-05, -3.1989067792892456e-05, -3.0866824090480804e-05, -2.9744580388069153e-05, -2.86223366856575e-05, -2.750009298324585e-05, -2.6377849280834198e-05, -2.5255605578422546e-05, -2.4133361876010895e-05, -2.3011118173599243e-05, -2.188887447118759e-05, -2.076663076877594e-05, -1.964438706636429e-05, -1.8522143363952637e-05, -1.7399899661540985e-05, -1.6277655959129333e-05, -1.5155412256717682e-05, -1.403316855430603e-05, -1.2910924851894379e-05, -1.1788681149482727e-05, -1.0666437447071075e-05, -9.544193744659424e-06, -8.421950042247772e-06, -7.299706339836121e-06, -6.177462637424469e-06, -5.055218935012817e-06, -3.932975232601166e-06, -2.810731530189514e-06, -1.6884878277778625e-06, -5.662441253662109e-07, 5.559995770454407e-07, 1.6782432794570923e-06, 2.800486981868744e-06, 3.9227306842803955e-06, 5.044974386692047e-06, 6.167218089103699e-06, 7.28946179151535e-06, 8.411705493927002e-06, 9.533949196338654e-06, 1.0656192898750305e-05, 1.1778436601161957e-05, 1.2900680303573608e-05, 1.402292400598526e-05, 1.5145167708396912e-05, 1.6267411410808563e-05, 1.7389655113220215e-05, 1.8511898815631866e-05, 1.9634142518043518e-05, 2.075638622045517e-05, 2.187862992286682e-05, 2.3000873625278473e-05, 2.4123117327690125e-05, 2.5245361030101776e-05, 2.6367604732513428e-05, 2.748984843492508e-05, 2.861209213733673e-05, 2.9734335839748383e-05, 3.0856579542160034e-05, 3.1978823244571686e-05, 3.310106694698334e-05, 3.422331064939499e-05, 3.534555435180664e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 9.0, 11.0, 15.0, 25.0, 40.0, 46.0, 87.0, 112.0, 228.0, 416.0, 786.0, 1908.0, 5688.0, 20903.0, 105175.0, 549593.0, 296652.0, 49323.0, 11330.0, 3462.0, 1330.0, 577.0, 327.0, 176.0, 93.0, 73.0, 37.0, 27.0, 18.0, 13.0, 19.0, 12.0, 9.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13454437255859375, -0.1301727294921875, -0.12580108642578125, -0.121429443359375, -0.11705780029296875, -0.1126861572265625, -0.10831451416015625, -0.10394287109375, -0.09957122802734375, -0.0951995849609375, -0.09082794189453125, -0.086456298828125, -0.08208465576171875, -0.0777130126953125, -0.07334136962890625, -0.0689697265625, -0.06459808349609375, -0.0602264404296875, -0.05585479736328125, -0.051483154296875, -0.04711151123046875, -0.0427398681640625, -0.03836822509765625, -0.03399658203125, -0.02962493896484375, -0.0252532958984375, -0.02088165283203125, -0.016510009765625, -0.01213836669921875, -0.0077667236328125, -0.00339508056640625, 0.0009765625, 0.00534820556640625, 0.0097198486328125, 0.01409149169921875, 0.018463134765625, 0.02283477783203125, 0.0272064208984375, 0.03157806396484375, 0.03594970703125, 0.04032135009765625, 0.0446929931640625, 0.04906463623046875, 0.053436279296875, 0.05780792236328125, 0.0621795654296875, 0.06655120849609375, 0.0709228515625, 0.07529449462890625, 0.0796661376953125, 0.08403778076171875, 0.088409423828125, 0.09278106689453125, 0.0971527099609375, 0.10152435302734375, 0.10589599609375, 0.11026763916015625, 0.1146392822265625, 0.11901092529296875, 0.123382568359375, 0.12775421142578125, 0.1321258544921875, 0.13649749755859375, 0.140869140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 4.0, 8.0, 7.0, 10.0, 14.0, 16.0, 27.0, 28.0, 29.0, 43.0, 49.0, 55.0, 62.0, 71.0, 69.0, 66.0, 76.0, 59.0, 57.0, 48.0, 35.0, 24.0, 22.0, 18.0, 14.0, 14.0, 7.0, 13.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.060272216796875, -0.058428287506103516, -0.05658435821533203, -0.05474042892456055, -0.05289649963378906, -0.05105257034301758, -0.049208641052246094, -0.04736471176147461, -0.045520782470703125, -0.04367685317993164, -0.041832923889160156, -0.03998899459838867, -0.03814506530761719, -0.0363011360168457, -0.03445720672607422, -0.032613277435302734, -0.03076934814453125, -0.028925418853759766, -0.02708148956298828, -0.025237560272216797, -0.023393630981445312, -0.021549701690673828, -0.019705772399902344, -0.01786184310913086, -0.016017913818359375, -0.01417398452758789, -0.012330055236816406, -0.010486125946044922, -0.008642196655273438, -0.006798267364501953, -0.004954338073730469, -0.0031104087829589844, -0.0012664794921875, 0.0005774497985839844, 0.0024213790893554688, 0.004265308380126953, 0.0061092376708984375, 0.007953166961669922, 0.009797096252441406, 0.01164102554321289, 0.013484954833984375, 0.01532888412475586, 0.017172813415527344, 0.019016742706298828, 0.020860671997070312, 0.022704601287841797, 0.02454853057861328, 0.026392459869384766, 0.02823638916015625, 0.030080318450927734, 0.03192424774169922, 0.0337681770324707, 0.03561210632324219, 0.03745603561401367, 0.039299964904785156, 0.04114389419555664, 0.042987823486328125, 0.04483175277709961, 0.046675682067871094, 0.04851961135864258, 0.05036354064941406, 0.05220746994018555, 0.05405139923095703, 0.055895328521728516, 0.0577392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 13.0, 27.0, 53.0, 118.0, 233.0, 238.0, 146.0, 94.0, 35.0, 14.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8776824474334717, -1.8176438808441162, -1.7576054334640503, -1.6975668668746948, -1.6375283002853394, -1.5774898529052734, -1.517451286315918, -1.4574127197265625, -1.397374153137207, -1.3373355865478516, -1.2772971391677856, -1.2172585725784302, -1.1572200059890747, -1.0971815586090088, -1.0371429920196533, -0.9771044254302979, -0.9170659780502319, -0.8570274710655212, -0.7969889044761658, -0.7369503974914551, -0.6769118309020996, -0.6168733239173889, -0.5568348169326782, -0.49679628014564514, -0.43675774335861206, -0.376719206571579, -0.3166806697845459, -0.2566421627998352, -0.19660362601280212, -0.13656508922576904, -0.07652658224105835, -0.01648804545402527, 0.04355049133300781, 0.1035890206694603, 0.16362755000591278, 0.22366607189178467, 0.28370460867881775, 0.34374314546585083, 0.4037816524505615, 0.4638201892375946, 0.5238587260246277, 0.5838972330093384, 0.6439357995986938, 0.7039743065834045, 0.7640128135681152, 0.8240513801574707, 0.8840898871421814, 0.9441283941268921, 1.0041669607162476, 1.064205527305603, 1.124243974685669, 1.1842825412750244, 1.2443211078643799, 1.3043596744537354, 1.3643981218338013, 1.4244366884231567, 1.4844751358032227, 1.5445137023925781, 1.604552149772644, 1.6645907163619995, 1.724629282951355, 1.784667730331421, 1.8447062969207764, 1.9047448635101318, 1.9647834300994873]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 17.0, 17.0, 21.0, 29.0, 25.0, 45.0, 39.0, 50.0, 64.0, 75.0, 72.0, 60.0, 67.0, 58.0, 45.0, 46.0, 45.0, 39.0, 32.0, 19.0, 20.0, 19.0, 18.0, 14.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9781767725944519, -0.9423176050186157, -0.9064583778381348, -0.8705992102622986, -0.8347400426864624, -0.7988808751106262, -0.76302170753479, -0.7271624803543091, -0.6913033127784729, -0.6554441452026367, -0.6195849180221558, -0.5837257504463196, -0.5478665828704834, -0.5120074152946472, -0.47614821791648865, -0.4402890205383301, -0.4044298529624939, -0.3685706853866577, -0.33271148800849915, -0.2968522906303406, -0.2609931230545044, -0.22513394057750702, -0.18927475810050964, -0.15341556072235107, -0.11755639314651489, -0.08169721066951752, -0.04583802819252014, -0.009978845715522766, 0.02588033676147461, 0.061739519238471985, 0.09759870171546936, 0.13345789909362793, 0.1693171262741089, 0.20517630875110626, 0.24103549122810364, 0.2768946886062622, 0.3127538561820984, 0.34861302375793457, 0.38447222113609314, 0.4203314185142517, 0.4561905860900879, 0.4920497536659241, 0.5279089212417603, 0.5637681484222412, 0.5996273159980774, 0.6354864835739136, 0.6713457107543945, 0.7072048783302307, 0.7430640459060669, 0.7789232134819031, 0.8147823810577393, 0.8506416082382202, 0.8865007758140564, 0.9223599433898926, 0.9582191705703735, 0.9940783381462097, 1.029937505722046, 1.0657967329025269, 1.1016558408737183, 1.1375150680541992, 1.1733741760253906, 1.2092334032058716, 1.2450926303863525, 1.280951738357544, 1.316810965538025]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 1.0, 1.0, 10.0, 17.0, 11.0, 40.0, 100.0, 197.0, 571.0, 2373.0, 19596.0, 4051129.0, 112363.0, 5714.0, 1266.0, 462.0, 194.0, 111.0, 42.0, 29.0, 17.0, 14.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9731292724609375, -0.940399169921875, -0.9076690673828125, -0.87493896484375, -0.8422088623046875, -0.809478759765625, -0.7767486572265625, -0.7440185546875, -0.7112884521484375, -0.678558349609375, -0.6458282470703125, -0.61309814453125, -0.5803680419921875, -0.547637939453125, -0.5149078369140625, -0.482177734375, -0.4494476318359375, -0.416717529296875, -0.3839874267578125, -0.35125732421875, -0.3185272216796875, -0.285797119140625, -0.2530670166015625, -0.2203369140625, -0.1876068115234375, -0.154876708984375, -0.1221466064453125, -0.08941650390625, -0.0566864013671875, -0.023956298828125, 0.0087738037109375, 0.04150390625, 0.0742340087890625, 0.106964111328125, 0.1396942138671875, 0.17242431640625, 0.2051544189453125, 0.237884521484375, 0.2706146240234375, 0.3033447265625, 0.3360748291015625, 0.368804931640625, 0.4015350341796875, 0.43426513671875, 0.4669952392578125, 0.499725341796875, 0.5324554443359375, 0.565185546875, 0.5979156494140625, 0.630645751953125, 0.6633758544921875, 0.69610595703125, 0.7288360595703125, 0.761566162109375, 0.7942962646484375, 0.8270263671875, 0.8597564697265625, 0.892486572265625, 0.9252166748046875, 0.95794677734375, 0.9906768798828125, 1.023406982421875, 1.0561370849609375, 1.0888671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 7.0, 18.0, 21.0, 29.0, 43.0, 67.0, 107.0, 146.0, 131.0, 130.0, 100.0, 61.0, 46.0, 31.0, 25.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043304443359375, -0.04178476333618164, -0.04026508331298828, -0.03874540328979492, -0.03722572326660156, -0.0357060432434082, -0.034186363220214844, -0.032666683197021484, -0.031147003173828125, -0.029627323150634766, -0.028107643127441406, -0.026587963104248047, -0.025068283081054688, -0.023548603057861328, -0.02202892303466797, -0.02050924301147461, -0.01898956298828125, -0.01746988296508789, -0.01595020294189453, -0.014430522918701172, -0.012910842895507812, -0.011391162872314453, -0.009871482849121094, -0.008351802825927734, -0.006832122802734375, -0.005312442779541016, -0.0037927627563476562, -0.002273082733154297, -0.0007534027099609375, 0.0007662773132324219, 0.0022859573364257812, 0.0038056373596191406, 0.0053253173828125, 0.006844997406005859, 0.008364677429199219, 0.009884357452392578, 0.011404037475585938, 0.012923717498779297, 0.014443397521972656, 0.015963077545166016, 0.017482757568359375, 0.019002437591552734, 0.020522117614746094, 0.022041797637939453, 0.023561477661132812, 0.025081157684326172, 0.02660083770751953, 0.02812051773071289, 0.02964019775390625, 0.03115987777709961, 0.03267955780029297, 0.03419923782348633, 0.03571891784667969, 0.03723859786987305, 0.038758277893066406, 0.040277957916259766, 0.041797637939453125, 0.043317317962646484, 0.044836997985839844, 0.0463566780090332, 0.04787635803222656, 0.04939603805541992, 0.05091571807861328, 0.05243539810180664, 0.053955078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 11.0, 6.0, 11.0, 25.0, 28.0, 30.0, 50.0, 79.0, 91.0, 149.0, 222.0, 449.0, 792.0, 1542.0, 3383.0, 8209.0, 22235.0, 75676.0, 472385.0, 3292128.0, 240010.0, 49947.0, 15710.0, 5909.0, 2569.0, 1174.0, 575.0, 328.0, 175.0, 112.0, 79.0, 56.0, 32.0, 31.0, 23.0, 13.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2191162109375, -0.21164894104003906, -0.20418167114257812, -0.1967144012451172, -0.18924713134765625, -0.1817798614501953, -0.17431259155273438, -0.16684532165527344, -0.1593780517578125, -0.15191078186035156, -0.14444351196289062, -0.1369762420654297, -0.12950897216796875, -0.12204170227050781, -0.11457443237304688, -0.10710716247558594, -0.099639892578125, -0.09217262268066406, -0.08470535278320312, -0.07723808288574219, -0.06977081298828125, -0.06230354309082031, -0.054836273193359375, -0.04736900329589844, -0.0399017333984375, -0.03243446350097656, -0.024967193603515625, -0.017499923706054688, -0.01003265380859375, -0.0025653839111328125, 0.004901885986328125, 0.012369155883789062, 0.01983642578125, 0.027303695678710938, 0.034770965576171875, 0.04223823547363281, 0.04970550537109375, 0.05717277526855469, 0.06464004516601562, 0.07210731506347656, 0.0795745849609375, 0.08704185485839844, 0.09450912475585938, 0.10197639465332031, 0.10944366455078125, 0.11691093444824219, 0.12437820434570312, 0.13184547424316406, 0.139312744140625, 0.14678001403808594, 0.15424728393554688, 0.1617145538330078, 0.16918182373046875, 0.1766490936279297, 0.18411636352539062, 0.19158363342285156, 0.1990509033203125, 0.20651817321777344, 0.21398544311523438, 0.2214527130126953, 0.22891998291015625, 0.2363872528076172, 0.24385452270507812, 0.25132179260253906, 0.2587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 6.0, 9.0, 14.0, 24.0, 20.0, 20.0, 36.0, 44.0, 65.0, 106.0, 183.0, 405.0, 1612.0, 686.0, 292.0, 168.0, 124.0, 68.0, 52.0, 41.0, 23.0, 13.0, 10.0, 6.0, 11.0, 10.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05889892578125, -0.056987762451171875, -0.05507659912109375, -0.053165435791015625, -0.0512542724609375, -0.049343109130859375, -0.04743194580078125, -0.045520782470703125, -0.043609619140625, -0.041698455810546875, -0.03978729248046875, -0.037876129150390625, -0.0359649658203125, -0.034053802490234375, -0.03214263916015625, -0.030231475830078125, -0.0283203125, -0.026409149169921875, -0.02449798583984375, -0.022586822509765625, -0.0206756591796875, -0.018764495849609375, -0.01685333251953125, -0.014942169189453125, -0.013031005859375, -0.011119842529296875, -0.00920867919921875, -0.007297515869140625, -0.0053863525390625, -0.003475189208984375, -0.00156402587890625, 0.000347137451171875, 0.00225830078125, 0.004169464111328125, 0.00608062744140625, 0.007991790771484375, 0.0099029541015625, 0.011814117431640625, 0.01372528076171875, 0.015636444091796875, 0.017547607421875, 0.019458770751953125, 0.02136993408203125, 0.023281097412109375, 0.0251922607421875, 0.027103424072265625, 0.02901458740234375, 0.030925750732421875, 0.0328369140625, 0.034748077392578125, 0.03665924072265625, 0.038570404052734375, 0.0404815673828125, 0.042392730712890625, 0.04430389404296875, 0.046215057373046875, 0.048126220703125, 0.050037384033203125, 0.05194854736328125, 0.053859710693359375, 0.0557708740234375, 0.057682037353515625, 0.05959320068359375, 0.061504364013671875, 0.06341552734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 28.0, 110.0, 240.0, 350.0, 191.0, 52.0, 12.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3059757947921753, -1.2800270318984985, -1.2540782690048218, -1.228129506111145, -1.2021806240081787, -1.176231861114502, -1.1502830982208252, -1.1243343353271484, -1.0983855724334717, -1.072436809539795, -1.0464880466461182, -1.0205392837524414, -0.9945904612541199, -0.9686416387557983, -0.9426928758621216, -0.9167441129684448, -0.8907953500747681, -0.8648465871810913, -0.8388977646827698, -0.812949001789093, -0.7870002388954163, -0.7610514163970947, -0.735102653503418, -0.7091538906097412, -0.6832050681114197, -0.6572563052177429, -0.6313074827194214, -0.6053587198257446, -0.5794099569320679, -0.5534611940383911, -0.5275123715400696, -0.5015636086463928, -0.47561487555503845, -0.4496660828590393, -0.42371731996536255, -0.3977685272693634, -0.37181976437568665, -0.3458709716796875, -0.31992220878601074, -0.2939734160900116, -0.26802462339401245, -0.2420758455991745, -0.21612706780433655, -0.1901782751083374, -0.16422951221466064, -0.1382807195186615, -0.11233194172382355, -0.0863831639289856, -0.06043440103530884, -0.034485623240470886, -0.008536841720342636, 0.017411939799785614, 0.043360717594623566, 0.06930950284004211, 0.09525828063488007, 0.12120705842971802, 0.14715583622455597, 0.17310461401939392, 0.19905339181423187, 0.22500216960906982, 0.25095096230506897, 0.2768997550010681, 0.3028485178947449, 0.32879728078842163, 0.3547460734844208]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 6.0, 14.0, 13.0, 12.0, 8.0, 10.0, 14.0, 14.0, 23.0, 22.0, 27.0, 34.0, 43.0, 40.0, 37.0, 40.0, 34.0, 49.0, 41.0, 41.0, 38.0, 47.0, 43.0, 39.0, 41.0, 32.0, 27.0, 24.0, 27.0, 26.0, 22.0, 13.0, 12.0, 16.0, 9.0, 10.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.21332383155822754, -0.2074023187160492, -0.20148082077503204, -0.1955593079328537, -0.18963779509067535, -0.1837162971496582, -0.17779478430747986, -0.1718732714653015, -0.16595175862312317, -0.16003024578094482, -0.15410874783992767, -0.14818723499774933, -0.14226572215557098, -0.13634422421455383, -0.1304227113723755, -0.12450119853019714, -0.11857970058917999, -0.11265819519758224, -0.1067366823554039, -0.10081517696380615, -0.09489366412162781, -0.08897215873003006, -0.08305065333843231, -0.07712914049625397, -0.07120763510465622, -0.06528612971305847, -0.05936461687088013, -0.05344311147928238, -0.04752160236239433, -0.04160009324550629, -0.03567858785390854, -0.029757078737020493, -0.023835569620132446, -0.0179140605032444, -0.011992553249001503, -0.006071045994758606, -0.0001495368778705597, 0.005771972239017487, 0.011693477630615234, 0.01761498674750328, 0.023536495864391327, 0.029458004981279373, 0.03537951409816742, 0.04130101948976517, 0.047222528606653214, 0.05314403772354126, 0.05906554311513901, 0.06498704850673676, 0.0709085613489151, 0.07683006674051285, 0.08275157958269119, 0.08867308497428894, 0.09459459781646729, 0.10051610320806503, 0.10643760859966278, 0.11235912144184113, 0.11828062683343887, 0.12420213222503662, 0.13012364506721497, 0.1360451579093933, 0.14196665585041046, 0.1478881686925888, 0.15380966663360596, 0.1597311794757843, 0.16565269231796265]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 6.0, 7.0, 14.0, 9.0, 18.0, 33.0, 56.0, 72.0, 90.0, 194.0, 331.0, 538.0, 1023.0, 2051.0, 5323.0, 20280.0, 130314.0, 668951.0, 182309.0, 25615.0, 6500.0, 2320.0, 1033.0, 595.0, 336.0, 202.0, 120.0, 78.0, 47.0, 30.0, 21.0, 10.0, 10.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29834747314453125, -0.2885894775390625, -0.27883148193359375, -0.269073486328125, -0.25931549072265625, -0.2495574951171875, -0.23979949951171875, -0.23004150390625, -0.22028350830078125, -0.2105255126953125, -0.20076751708984375, -0.191009521484375, -0.18125152587890625, -0.1714935302734375, -0.16173553466796875, -0.1519775390625, -0.14221954345703125, -0.1324615478515625, -0.12270355224609375, -0.112945556640625, -0.10318756103515625, -0.0934295654296875, -0.08367156982421875, -0.07391357421875, -0.06415557861328125, -0.0543975830078125, -0.04463958740234375, -0.034881591796875, -0.02512359619140625, -0.0153656005859375, -0.00560760498046875, 0.004150390625, 0.01390838623046875, 0.0236663818359375, 0.03342437744140625, 0.043182373046875, 0.05294036865234375, 0.0626983642578125, 0.07245635986328125, 0.08221435546875, 0.09197235107421875, 0.1017303466796875, 0.11148834228515625, 0.121246337890625, 0.13100433349609375, 0.1407623291015625, 0.15052032470703125, 0.1602783203125, 0.17003631591796875, 0.1797943115234375, 0.18955230712890625, 0.199310302734375, 0.20906829833984375, 0.2188262939453125, 0.22858428955078125, 0.23834228515625, 0.24810028076171875, 0.2578582763671875, 0.26761627197265625, 0.277374267578125, 0.28713226318359375, 0.2968902587890625, 0.30664825439453125, 0.31640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 12.0, 16.0, 29.0, 41.0, 76.0, 77.0, 124.0, 142.0, 131.0, 111.0, 77.0, 55.0, 33.0, 21.0, 16.0, 15.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046661376953125, -0.04509735107421875, -0.0435333251953125, -0.04196929931640625, -0.0404052734375, -0.03884124755859375, -0.0372772216796875, -0.03571319580078125, -0.034149169921875, -0.03258514404296875, -0.0310211181640625, -0.02945709228515625, -0.02789306640625, -0.02632904052734375, -0.0247650146484375, -0.02320098876953125, -0.021636962890625, -0.02007293701171875, -0.0185089111328125, -0.01694488525390625, -0.015380859375, -0.01381683349609375, -0.0122528076171875, -0.01068878173828125, -0.009124755859375, -0.00756072998046875, -0.0059967041015625, -0.00443267822265625, -0.00286865234375, -0.00130462646484375, 0.0002593994140625, 0.00182342529296875, 0.003387451171875, 0.00495147705078125, 0.0065155029296875, 0.00807952880859375, 0.0096435546875, 0.01120758056640625, 0.0127716064453125, 0.01433563232421875, 0.015899658203125, 0.01746368408203125, 0.0190277099609375, 0.02059173583984375, 0.02215576171875, 0.02371978759765625, 0.0252838134765625, 0.02684783935546875, 0.028411865234375, 0.02997589111328125, 0.0315399169921875, 0.03310394287109375, 0.03466796875, 0.03623199462890625, 0.0377960205078125, 0.03936004638671875, 0.040924072265625, 0.04248809814453125, 0.0440521240234375, 0.04561614990234375, 0.04718017578125, 0.04874420166015625, 0.0503082275390625, 0.05187225341796875, 0.053436279296875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 15.0, 28.0, 31.0, 51.0, 65.0, 106.0, 160.0, 243.0, 395.0, 762.0, 1477.0, 3788.0, 11812.0, 48578.0, 243873.0, 544025.0, 148607.0, 30664.0, 8222.0, 2896.0, 1174.0, 589.0, 332.0, 205.0, 138.0, 99.0, 55.0, 42.0, 31.0, 21.0, 8.0, 9.0, 7.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26239585876464844, -0.2542839050292969, -0.2461719512939453, -0.23805999755859375, -0.2299480438232422, -0.22183609008789062, -0.21372413635253906, -0.2056121826171875, -0.19750022888183594, -0.18938827514648438, -0.1812763214111328, -0.17316436767578125, -0.1650524139404297, -0.15694046020507812, -0.14882850646972656, -0.140716552734375, -0.13260459899902344, -0.12449264526367188, -0.11638069152832031, -0.10826873779296875, -0.10015678405761719, -0.09204483032226562, -0.08393287658691406, -0.0758209228515625, -0.06770896911621094, -0.059597015380859375, -0.05148506164550781, -0.04337310791015625, -0.03526115417480469, -0.027149200439453125, -0.019037246704101562, -0.01092529296875, -0.0028133392333984375, 0.005298614501953125, 0.013410568237304688, 0.02152252197265625, 0.029634475708007812, 0.037746429443359375, 0.04585838317871094, 0.0539703369140625, 0.06208229064941406, 0.07019424438476562, 0.07830619812011719, 0.08641815185546875, 0.09453010559082031, 0.10264205932617188, 0.11075401306152344, 0.118865966796875, 0.12697792053222656, 0.13508987426757812, 0.1432018280029297, 0.15131378173828125, 0.1594257354736328, 0.16753768920898438, 0.17564964294433594, 0.1837615966796875, 0.19187355041503906, 0.19998550415039062, 0.2080974578857422, 0.21620941162109375, 0.2243213653564453, 0.23243331909179688, 0.24054527282714844, 0.2486572265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 6.0, 9.0, 10.0, 14.0, 11.0, 15.0, 25.0, 32.0, 44.0, 37.0, 41.0, 44.0, 43.0, 40.0, 53.0, 49.0, 47.0, 52.0, 57.0, 65.0, 62.0, 34.0, 34.0, 30.0, 34.0, 23.0, 21.0, 15.0, 7.0, 6.0, 6.0, 5.0, 6.0, 4.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18689727783203125, -0.1815338134765625, -0.17617034912109375, -0.170806884765625, -0.16544342041015625, -0.1600799560546875, -0.15471649169921875, -0.14935302734375, -0.14398956298828125, -0.1386260986328125, -0.13326263427734375, -0.127899169921875, -0.12253570556640625, -0.1171722412109375, -0.11180877685546875, -0.1064453125, -0.10108184814453125, -0.0957183837890625, -0.09035491943359375, -0.084991455078125, -0.07962799072265625, -0.0742645263671875, -0.06890106201171875, -0.06353759765625, -0.05817413330078125, -0.0528106689453125, -0.04744720458984375, -0.042083740234375, -0.03672027587890625, -0.0313568115234375, -0.02599334716796875, -0.0206298828125, -0.01526641845703125, -0.0099029541015625, -0.00453948974609375, 0.000823974609375, 0.00618743896484375, 0.0115509033203125, 0.01691436767578125, 0.02227783203125, 0.02764129638671875, 0.0330047607421875, 0.03836822509765625, 0.043731689453125, 0.04909515380859375, 0.0544586181640625, 0.05982208251953125, 0.065185546875, 0.07054901123046875, 0.0759124755859375, 0.08127593994140625, 0.086639404296875, 0.09200286865234375, 0.0973663330078125, 0.10272979736328125, 0.10809326171875, 0.11345672607421875, 0.1188201904296875, 0.12418365478515625, 0.129547119140625, 0.13491058349609375, 0.1402740478515625, 0.14563751220703125, 0.1510009765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 5.0, 7.0, 10.0, 17.0, 26.0, 19.0, 37.0, 64.0, 62.0, 105.0, 191.0, 284.0, 449.0, 764.0, 1272.0, 2338.0, 4503.0, 9137.0, 20748.0, 53760.0, 166049.0, 426245.0, 238070.0, 73182.0, 27402.0, 11625.0, 5471.0, 2789.0, 1558.0, 877.0, 534.0, 314.0, 211.0, 124.0, 81.0, 66.0, 44.0, 24.0, 20.0, 18.0, 18.0, 8.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09185218811035156, -0.08903884887695312, -0.08622550964355469, -0.08341217041015625, -0.08059883117675781, -0.07778549194335938, -0.07497215270996094, -0.0721588134765625, -0.06934547424316406, -0.06653213500976562, -0.06371879577636719, -0.06090545654296875, -0.05809211730957031, -0.055278778076171875, -0.05246543884277344, -0.049652099609375, -0.04683876037597656, -0.044025421142578125, -0.04121208190917969, -0.03839874267578125, -0.03558540344238281, -0.032772064208984375, -0.029958724975585938, -0.0271453857421875, -0.024332046508789062, -0.021518707275390625, -0.018705368041992188, -0.01589202880859375, -0.013078689575195312, -0.010265350341796875, -0.0074520111083984375, -0.004638671875, -0.0018253326416015625, 0.000988006591796875, 0.0038013458251953125, 0.00661468505859375, 0.009428024291992188, 0.012241363525390625, 0.015054702758789062, 0.0178680419921875, 0.020681381225585938, 0.023494720458984375, 0.026308059692382812, 0.02912139892578125, 0.03193473815917969, 0.034748077392578125, 0.03756141662597656, 0.040374755859375, 0.04318809509277344, 0.046001434326171875, 0.04881477355957031, 0.05162811279296875, 0.05444145202636719, 0.057254791259765625, 0.06006813049316406, 0.0628814697265625, 0.06569480895996094, 0.06850814819335938, 0.07132148742675781, 0.07413482666015625, 0.07694816589355469, 0.07976150512695312, 0.08257484436035156, 0.08538818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 14.0, 11.0, 18.0, 25.0, 36.0, 48.0, 46.0, 60.0, 61.0, 62.0, 84.0, 76.0, 65.0, 84.0, 53.0, 60.0, 38.0, 29.0, 17.0, 17.0, 22.0, 18.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.55839729309082e-05, -3.456976264715195e-05, -3.355555236339569e-05, -3.2541342079639435e-05, -3.152713179588318e-05, -3.0512921512126923e-05, -2.9498711228370667e-05, -2.848450094461441e-05, -2.7470290660858154e-05, -2.6456080377101898e-05, -2.5441870093345642e-05, -2.4427659809589386e-05, -2.341344952583313e-05, -2.2399239242076874e-05, -2.1385028958320618e-05, -2.037081867456436e-05, -1.9356608390808105e-05, -1.834239810705185e-05, -1.7328187823295593e-05, -1.6313977539539337e-05, -1.529976725578308e-05, -1.4285556972026825e-05, -1.3271346688270569e-05, -1.2257136404514313e-05, -1.1242926120758057e-05, -1.02287158370018e-05, -9.214505553245544e-06, -8.200295269489288e-06, -7.186084985733032e-06, -6.171874701976776e-06, -5.15766441822052e-06, -4.143454134464264e-06, -3.129243850708008e-06, -2.1150335669517517e-06, -1.1008232831954956e-06, -8.66129994392395e-08, 9.275972843170166e-07, 1.9418075680732727e-06, 2.956017851829529e-06, 3.970228135585785e-06, 4.984438419342041e-06, 5.998648703098297e-06, 7.012858986854553e-06, 8.02706927061081e-06, 9.041279554367065e-06, 1.0055489838123322e-05, 1.1069700121879578e-05, 1.2083910405635834e-05, 1.309812068939209e-05, 1.4112330973148346e-05, 1.5126541256904602e-05, 1.6140751540660858e-05, 1.7154961824417114e-05, 1.816917210817337e-05, 1.9183382391929626e-05, 2.0197592675685883e-05, 2.121180295944214e-05, 2.2226013243198395e-05, 2.324022352695465e-05, 2.4254433810710907e-05, 2.5268644094467163e-05, 2.628285437822342e-05, 2.7297064661979675e-05, 2.831127494573593e-05, 2.9325485229492188e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 6.0, 16.0, 16.0, 31.0, 37.0, 54.0, 78.0, 140.0, 207.0, 390.0, 778.0, 1969.0, 6028.0, 25693.0, 166710.0, 703500.0, 114610.0, 19888.0, 5031.0, 1802.0, 726.0, 354.0, 167.0, 105.0, 74.0, 41.0, 21.0, 23.0, 13.0, 8.0, 7.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744384765625, -0.1687030792236328, -0.16296768188476562, -0.15723228454589844, -0.15149688720703125, -0.14576148986816406, -0.14002609252929688, -0.1342906951904297, -0.1285552978515625, -0.12281990051269531, -0.11708450317382812, -0.11134910583496094, -0.10561370849609375, -0.09987831115722656, -0.09414291381835938, -0.08840751647949219, -0.082672119140625, -0.07693672180175781, -0.07120132446289062, -0.06546592712402344, -0.05973052978515625, -0.05399513244628906, -0.048259735107421875, -0.04252433776855469, -0.0367889404296875, -0.031053543090820312, -0.025318145751953125, -0.019582748413085938, -0.01384735107421875, -0.008111953735351562, -0.002376556396484375, 0.0033588409423828125, 0.00909423828125, 0.014829635620117188, 0.020565032958984375, 0.026300430297851562, 0.03203582763671875, 0.03777122497558594, 0.043506622314453125, 0.04924201965332031, 0.0549774169921875, 0.06071281433105469, 0.06644821166992188, 0.07218360900878906, 0.07791900634765625, 0.08365440368652344, 0.08938980102539062, 0.09512519836425781, 0.100860595703125, 0.10659599304199219, 0.11233139038085938, 0.11806678771972656, 0.12380218505859375, 0.12953758239746094, 0.13527297973632812, 0.1410083770751953, 0.1467437744140625, 0.1524791717529297, 0.15821456909179688, 0.16394996643066406, 0.16968536376953125, 0.17542076110839844, 0.18115615844726562, 0.1868915557861328, 0.192626953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 7.0, 9.0, 9.0, 7.0, 20.0, 12.0, 28.0, 29.0, 53.0, 63.0, 82.0, 92.0, 94.0, 97.0, 77.0, 49.0, 39.0, 58.0, 30.0, 34.0, 25.0, 14.0, 9.0, 8.0, 15.0, 3.0, 5.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09930419921875, -0.0966024398803711, -0.09390068054199219, -0.09119892120361328, -0.08849716186523438, -0.08579540252685547, -0.08309364318847656, -0.08039188385009766, -0.07769012451171875, -0.07498836517333984, -0.07228660583496094, -0.06958484649658203, -0.06688308715820312, -0.06418132781982422, -0.06147956848144531, -0.058777809143066406, -0.0560760498046875, -0.053374290466308594, -0.05067253112792969, -0.04797077178955078, -0.045269012451171875, -0.04256725311279297, -0.03986549377441406, -0.037163734436035156, -0.03446197509765625, -0.031760215759277344, -0.029058456420898438, -0.02635669708251953, -0.023654937744140625, -0.02095317840576172, -0.018251419067382812, -0.015549659729003906, -0.012847900390625, -0.010146141052246094, -0.0074443817138671875, -0.004742622375488281, -0.002040863037109375, 0.0006608963012695312, 0.0033626556396484375, 0.006064414978027344, 0.00876617431640625, 0.011467933654785156, 0.014169692993164062, 0.01687145233154297, 0.019573211669921875, 0.02227497100830078, 0.024976730346679688, 0.027678489685058594, 0.0303802490234375, 0.033082008361816406, 0.03578376770019531, 0.03848552703857422, 0.041187286376953125, 0.04388904571533203, 0.04659080505371094, 0.049292564392089844, 0.05199432373046875, 0.054696083068847656, 0.05739784240722656, 0.06009960174560547, 0.06280136108398438, 0.06550312042236328, 0.06820487976074219, 0.0709066390991211, 0.0736083984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 10.0, 10.0, 14.0, 39.0, 60.0, 121.0, 176.0, 209.0, 156.0, 95.0, 52.0, 30.0, 13.0, 11.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4192583560943604, -1.360929012298584, -1.3025997877120972, -1.2442704439163208, -1.1859411001205444, -1.1276118755340576, -1.0692825317382812, -1.0109531879425049, -0.9526238441467285, -0.8942945599555969, -0.8359652161598206, -0.777635931968689, -0.7193065881729126, -0.660977303981781, -0.6026480197906494, -0.544318675994873, -0.48598939180374146, -0.4276600778102875, -0.3693307638168335, -0.3110014796257019, -0.25267213582992554, -0.19434285163879395, -0.13601353764533997, -0.07768422365188599, -0.019354909658432007, 0.038974400609731674, 0.09730371087789536, 0.15563301742076874, 0.21396233141422272, 0.2722916305065155, 0.3306209444999695, 0.38895025849342346, 0.44727957248687744, 0.505608856678009, 0.5639382004737854, 0.622267484664917, 0.6805968284606934, 0.738926112651825, 0.7972553968429565, 0.8555847406387329, 0.9139140844345093, 0.9722433686256409, 1.0305726528167725, 1.0889019966125488, 1.1472313404083252, 1.2055606842041016, 1.2638899087905884, 1.3222192525863647, 1.3805484771728516, 1.438877820968628, 1.4972070455551147, 1.5555363893508911, 1.6138657331466675, 1.6721949577331543, 1.7305243015289307, 1.788853645324707, 1.8471829891204834, 1.9055123329162598, 1.9638415575027466, 2.0221710205078125, 2.0805001258850098, 2.138829469680786, 2.1971588134765625, 2.255488157272339, 2.3138175010681152]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 3.0, 8.0, 13.0, 10.0, 14.0, 10.0, 17.0, 21.0, 17.0, 26.0, 31.0, 39.0, 41.0, 43.0, 40.0, 45.0, 37.0, 44.0, 48.0, 42.0, 44.0, 45.0, 48.0, 37.0, 40.0, 36.0, 28.0, 35.0, 20.0, 21.0, 20.0, 19.0, 10.0, 13.0, 5.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0357482433319092, -1.0045775175094604, -0.9734067916870117, -0.9422361254692078, -0.911065399646759, -0.8798946738243103, -0.8487240076065063, -0.8175532817840576, -0.7863825559616089, -0.7552118301391602, -0.7240411043167114, -0.6928704380989075, -0.6616997122764587, -0.63052898645401, -0.599358320236206, -0.5681875944137573, -0.5370168685913086, -0.5058461427688599, -0.4746754467487335, -0.4435047507286072, -0.41233402490615845, -0.3811632990837097, -0.3499926030635834, -0.31882190704345703, -0.2876511812210083, -0.25648045539855957, -0.22530975937843323, -0.1941390484571457, -0.16296833753585815, -0.13179762661457062, -0.10062691569328308, -0.06945620477199554, -0.03828549385070801, -0.007114782929420471, 0.024055927991867065, 0.0552266389131546, 0.08639734983444214, 0.11756806075572968, 0.1487387716770172, 0.17990948259830475, 0.21108019351959229, 0.24225090444087982, 0.27342161536216736, 0.3045923113822937, 0.33576303720474243, 0.36693376302719116, 0.3981044590473175, 0.42927515506744385, 0.4604458808898926, 0.4916166067123413, 0.52278733253479, 0.553957998752594, 0.5851287245750427, 0.6162994503974915, 0.6474701166152954, 0.6786408424377441, 0.7098115682601929, 0.7409822940826416, 0.7721530199050903, 0.8033236861228943, 0.834494411945343, 0.8656651377677917, 0.8968358039855957, 0.9280065298080444, 0.9591772556304932]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 11.0, 15.0, 26.0, 38.0, 86.0, 147.0, 252.0, 597.0, 1308.0, 3464.0, 12346.0, 76736.0, 3840703.0, 226596.0, 22331.0, 5549.0, 2008.0, 893.0, 479.0, 245.0, 150.0, 84.0, 48.0, 42.0, 31.0, 13.0, 20.0, 12.0, 5.0, 7.0, 10.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3680267333984375, -0.356414794921875, -0.3448028564453125, -0.33319091796875, -0.3215789794921875, -0.309967041015625, -0.2983551025390625, -0.2867431640625, -0.2751312255859375, -0.263519287109375, -0.2519073486328125, -0.24029541015625, -0.2286834716796875, -0.217071533203125, -0.2054595947265625, -0.19384765625, -0.1822357177734375, -0.170623779296875, -0.1590118408203125, -0.14739990234375, -0.1357879638671875, -0.124176025390625, -0.1125640869140625, -0.1009521484375, -0.0893402099609375, -0.077728271484375, -0.0661163330078125, -0.05450439453125, -0.0428924560546875, -0.031280517578125, -0.0196685791015625, -0.008056640625, 0.0035552978515625, 0.015167236328125, 0.0267791748046875, 0.03839111328125, 0.0500030517578125, 0.061614990234375, 0.0732269287109375, 0.0848388671875, 0.0964508056640625, 0.108062744140625, 0.1196746826171875, 0.13128662109375, 0.1428985595703125, 0.154510498046875, 0.1661224365234375, 0.177734375, 0.1893463134765625, 0.200958251953125, 0.2125701904296875, 0.22418212890625, 0.2357940673828125, 0.247406005859375, 0.2590179443359375, 0.2706298828125, 0.2822418212890625, 0.293853759765625, 0.3054656982421875, 0.31707763671875, 0.3286895751953125, 0.340301513671875, 0.3519134521484375, 0.363525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 13.0, 29.0, 29.0, 57.0, 50.0, 82.0, 104.0, 98.0, 93.0, 95.0, 81.0, 68.0, 43.0, 38.0, 30.0, 24.0, 17.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04620361328125, -0.044681549072265625, -0.04315948486328125, -0.041637420654296875, -0.0401153564453125, -0.038593292236328125, -0.03707122802734375, -0.035549163818359375, -0.034027099609375, -0.032505035400390625, -0.03098297119140625, -0.029460906982421875, -0.0279388427734375, -0.026416778564453125, -0.02489471435546875, -0.023372650146484375, -0.0218505859375, -0.020328521728515625, -0.01880645751953125, -0.017284393310546875, -0.0157623291015625, -0.014240264892578125, -0.01271820068359375, -0.011196136474609375, -0.009674072265625, -0.008152008056640625, -0.00662994384765625, -0.005107879638671875, -0.0035858154296875, -0.002063751220703125, -0.00054168701171875, 0.000980377197265625, 0.00250244140625, 0.004024505615234375, 0.00554656982421875, 0.007068634033203125, 0.0085906982421875, 0.010112762451171875, 0.01163482666015625, 0.013156890869140625, 0.014678955078125, 0.016201019287109375, 0.01772308349609375, 0.019245147705078125, 0.0207672119140625, 0.022289276123046875, 0.02381134033203125, 0.025333404541015625, 0.02685546875, 0.028377532958984375, 0.02989959716796875, 0.031421661376953125, 0.0329437255859375, 0.034465789794921875, 0.03598785400390625, 0.037509918212890625, 0.039031982421875, 0.040554046630859375, 0.04207611083984375, 0.043598175048828125, 0.0451202392578125, 0.046642303466796875, 0.04816436767578125, 0.049686431884765625, 0.05120849609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 19.0, 17.0, 41.0, 49.0, 78.0, 150.0, 265.0, 535.0, 1420.0, 4663.0, 21308.0, 195002.0, 3803706.0, 143041.0, 17632.0, 4052.0, 1246.0, 499.0, 234.0, 134.0, 73.0, 40.0, 22.0, 11.0, 17.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3013496398925781, -0.28995513916015625, -0.2785606384277344, -0.2671661376953125, -0.2557716369628906, -0.24437713623046875, -0.23298263549804688, -0.221588134765625, -0.21019363403320312, -0.19879913330078125, -0.18740463256835938, -0.1760101318359375, -0.16461563110351562, -0.15322113037109375, -0.14182662963867188, -0.13043212890625, -0.11903762817382812, -0.10764312744140625, -0.09624862670898438, -0.0848541259765625, -0.07345962524414062, -0.06206512451171875, -0.050670623779296875, -0.039276123046875, -0.027881622314453125, -0.01648712158203125, -0.005092620849609375, 0.0063018798828125, 0.017696380615234375, 0.02909088134765625, 0.040485382080078125, 0.0518798828125, 0.06327438354492188, 0.07466888427734375, 0.08606338500976562, 0.0974578857421875, 0.10885238647460938, 0.12024688720703125, 0.13164138793945312, 0.143035888671875, 0.15443038940429688, 0.16582489013671875, 0.17721939086914062, 0.1886138916015625, 0.20000839233398438, 0.21140289306640625, 0.22279739379882812, 0.23419189453125, 0.24558639526367188, 0.25698089599609375, 0.2683753967285156, 0.2797698974609375, 0.2911643981933594, 0.30255889892578125, 0.3139533996582031, 0.325347900390625, 0.3367424011230469, 0.34813690185546875, 0.3595314025878906, 0.3709259033203125, 0.3823204040527344, 0.39371490478515625, 0.4051094055175781, 0.41650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 10.0, 7.0, 8.0, 24.0, 21.0, 33.0, 83.0, 168.0, 386.0, 2200.0, 672.0, 200.0, 104.0, 59.0, 44.0, 26.0, 9.0, 13.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11410140991210938, -0.11107635498046875, -0.10805130004882812, -0.1050262451171875, -0.10200119018554688, -0.09897613525390625, -0.09595108032226562, -0.092926025390625, -0.08990097045898438, -0.08687591552734375, -0.08385086059570312, -0.0808258056640625, -0.07780075073242188, -0.07477569580078125, -0.07175064086914062, -0.0687255859375, -0.06570053100585938, -0.06267547607421875, -0.059650421142578125, -0.0566253662109375, -0.053600311279296875, -0.05057525634765625, -0.047550201416015625, -0.044525146484375, -0.041500091552734375, -0.03847503662109375, -0.035449981689453125, -0.0324249267578125, -0.029399871826171875, -0.02637481689453125, -0.023349761962890625, -0.02032470703125, -0.017299652099609375, -0.01427459716796875, -0.011249542236328125, -0.0082244873046875, -0.005199432373046875, -0.00217437744140625, 0.000850677490234375, 0.003875732421875, 0.006900787353515625, 0.00992584228515625, 0.012950897216796875, 0.0159759521484375, 0.019001007080078125, 0.02202606201171875, 0.025051116943359375, 0.028076171875, 0.031101226806640625, 0.03412628173828125, 0.037151336669921875, 0.0401763916015625, 0.043201446533203125, 0.04622650146484375, 0.049251556396484375, 0.052276611328125, 0.055301666259765625, 0.05832672119140625, 0.061351776123046875, 0.0643768310546875, 0.06740188598632812, 0.07042694091796875, 0.07345199584960938, 0.07647705078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 16.0, 27.0, 72.0, 125.0, 200.0, 224.0, 166.0, 88.0, 41.0, 22.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7236816883087158, -0.705675482749939, -0.6876692175865173, -0.6696630120277405, -0.6516567468643188, -0.633650541305542, -0.6156443357467651, -0.5976380705833435, -0.5796318650245667, -0.5616256594657898, -0.5436193943023682, -0.5256131887435913, -0.5076069235801697, -0.4896007180213928, -0.4715944826602936, -0.45358824729919434, -0.4355820119380951, -0.41757577657699585, -0.3995695412158966, -0.38156330585479736, -0.3635571002960205, -0.34555086493492126, -0.327544629573822, -0.30953842401504517, -0.29153215885162354, -0.2735259234905243, -0.25551968812942505, -0.237513467669487, -0.21950724720954895, -0.2015010118484497, -0.18349477648735046, -0.16548855602741241, -0.14748233556747437, -0.12947610020637512, -0.11146987974643707, -0.09346364438533783, -0.07545741647481918, -0.05745118856430054, -0.039444953203201294, -0.021438732743263245, -0.0034324973821640015, 0.014573732390999794, 0.03257996216416359, 0.050586193799972534, 0.06859242171049118, 0.08659864962100983, 0.10460488498210907, 0.12261110544204712, 0.14061734080314636, 0.1586235761642456, 0.17662979662418365, 0.1946360319852829, 0.21264225244522095, 0.2306484878063202, 0.24865472316741943, 0.2666609287261963, 0.2846671938896179, 0.30267342925071716, 0.3206796646118164, 0.33868587017059326, 0.3566921055316925, 0.37469834089279175, 0.392704576253891, 0.41071081161499023, 0.4287170171737671]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 11.0, 14.0, 25.0, 29.0, 26.0, 28.0, 24.0, 30.0, 32.0, 35.0, 40.0, 46.0, 38.0, 45.0, 46.0, 45.0, 46.0, 53.0, 34.0, 44.0, 59.0, 35.0, 34.0, 18.0, 25.0, 18.0, 14.0, 19.0, 11.0, 7.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19146603345870972, -0.18510855734348297, -0.17875108122825623, -0.17239362001419067, -0.16603614389896393, -0.15967866778373718, -0.15332119166851044, -0.1469637155532837, -0.14060625433921814, -0.1342487782239914, -0.12789130210876465, -0.1215338334441185, -0.11517636477947235, -0.1088188886642456, -0.10246141254901886, -0.09610393643379211, -0.08974646031856537, -0.08338898420333862, -0.07703151553869247, -0.07067403942346573, -0.06431657075881958, -0.057959094643592834, -0.05160161852836609, -0.04524414613842964, -0.038886673748493195, -0.03252920135855675, -0.02617172710597515, -0.019814252853393555, -0.013456780463457108, -0.00709930807352066, -0.0007418319582939148, 0.005615640431642532, 0.01197311282157898, 0.018330585211515427, 0.024688059464097023, 0.03104553371667862, 0.037403006106615067, 0.043760478496551514, 0.05011795461177826, 0.056475427001714706, 0.06283289939165115, 0.0691903755068779, 0.07554784417152405, 0.0819053202867508, 0.08826279640197754, 0.09462026506662369, 0.10097774118185043, 0.10733520984649658, 0.11369268596172333, 0.12005016207695007, 0.12640763819217682, 0.13276511430740356, 0.13912257552146912, 0.14548005163669586, 0.1518375277519226, 0.15819500386714935, 0.1645524799823761, 0.17090995609760284, 0.1772674322128296, 0.18362489342689514, 0.1899823695421219, 0.19633984565734863, 0.20269732177257538, 0.20905479788780212, 0.21541225910186768]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 9.0, 9.0, 5.0, 14.0, 19.0, 16.0, 34.0, 34.0, 38.0, 56.0, 82.0, 114.0, 125.0, 244.0, 294.0, 454.0, 783.0, 1346.0, 2417.0, 5163.0, 11257.0, 27857.0, 76779.0, 217311.0, 398357.0, 192265.0, 67634.0, 25146.0, 10259.0, 4724.0, 2306.0, 1236.0, 711.0, 463.0, 272.0, 189.0, 135.0, 120.0, 75.0, 50.0, 32.0, 24.0, 20.0, 18.0, 20.0, 15.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1541748046875, -0.14969825744628906, -0.14522171020507812, -0.1407451629638672, -0.13626861572265625, -0.1317920684814453, -0.12731552124023438, -0.12283897399902344, -0.1183624267578125, -0.11388587951660156, -0.10940933227539062, -0.10493278503417969, -0.10045623779296875, -0.09597969055175781, -0.09150314331054688, -0.08702659606933594, -0.082550048828125, -0.07807350158691406, -0.07359695434570312, -0.06912040710449219, -0.06464385986328125, -0.06016731262207031, -0.055690765380859375, -0.05121421813964844, -0.0467376708984375, -0.04226112365722656, -0.037784576416015625, -0.03330802917480469, -0.02883148193359375, -0.024354934692382812, -0.019878387451171875, -0.015401840209960938, -0.01092529296875, -0.0064487457275390625, -0.001972198486328125, 0.0025043487548828125, 0.00698089599609375, 0.011457443237304688, 0.015933990478515625, 0.020410537719726562, 0.0248870849609375, 0.029363632202148438, 0.033840179443359375, 0.03831672668457031, 0.04279327392578125, 0.04726982116699219, 0.051746368408203125, 0.05622291564941406, 0.060699462890625, 0.06517601013183594, 0.06965255737304688, 0.07412910461425781, 0.07860565185546875, 0.08308219909667969, 0.08755874633789062, 0.09203529357910156, 0.0965118408203125, 0.10098838806152344, 0.10546493530273438, 0.10994148254394531, 0.11441802978515625, 0.11889457702636719, 0.12337112426757812, 0.12784767150878906, 0.13232421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 17.0, 25.0, 32.0, 49.0, 62.0, 81.0, 71.0, 98.0, 94.0, 106.0, 79.0, 63.0, 46.0, 35.0, 40.0, 21.0, 16.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040679931640625, -0.03924703598022461, -0.03781414031982422, -0.03638124465942383, -0.03494834899902344, -0.03351545333862305, -0.032082557678222656, -0.030649662017822266, -0.029216766357421875, -0.027783870697021484, -0.026350975036621094, -0.024918079376220703, -0.023485183715820312, -0.022052288055419922, -0.02061939239501953, -0.01918649673461914, -0.01775360107421875, -0.01632070541381836, -0.014887809753417969, -0.013454914093017578, -0.012022018432617188, -0.010589122772216797, -0.009156227111816406, -0.007723331451416016, -0.006290435791015625, -0.004857540130615234, -0.0034246444702148438, -0.001991748809814453, -0.0005588531494140625, 0.0008740425109863281, 0.0023069381713867188, 0.0037398338317871094, 0.0051727294921875, 0.006605625152587891, 0.008038520812988281, 0.009471416473388672, 0.010904312133789062, 0.012337207794189453, 0.013770103454589844, 0.015202999114990234, 0.016635894775390625, 0.018068790435791016, 0.019501686096191406, 0.020934581756591797, 0.022367477416992188, 0.023800373077392578, 0.02523326873779297, 0.02666616439819336, 0.02809906005859375, 0.02953195571899414, 0.03096485137939453, 0.03239774703979492, 0.03383064270019531, 0.0352635383605957, 0.036696434020996094, 0.038129329681396484, 0.039562225341796875, 0.040995121002197266, 0.042428016662597656, 0.04386091232299805, 0.04529380798339844, 0.04672670364379883, 0.04815959930419922, 0.04959249496459961, 0.051025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 5.0, 7.0, 15.0, 18.0, 26.0, 28.0, 38.0, 83.0, 122.0, 176.0, 252.0, 451.0, 769.0, 1533.0, 3762.0, 10068.0, 31500.0, 118679.0, 414501.0, 337663.0, 89792.0, 24733.0, 7981.0, 3069.0, 1422.0, 726.0, 402.0, 254.0, 157.0, 95.0, 81.0, 45.0, 30.0, 31.0, 7.0, 8.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16034507751464844, -0.15479660034179688, -0.1492481231689453, -0.14369964599609375, -0.1381511688232422, -0.13260269165039062, -0.12705421447753906, -0.1215057373046875, -0.11595726013183594, -0.11040878295898438, -0.10486030578613281, -0.09931182861328125, -0.09376335144042969, -0.08821487426757812, -0.08266639709472656, -0.077117919921875, -0.07156944274902344, -0.06602096557617188, -0.06047248840332031, -0.05492401123046875, -0.04937553405761719, -0.043827056884765625, -0.03827857971191406, -0.0327301025390625, -0.027181625366210938, -0.021633148193359375, -0.016084671020507812, -0.01053619384765625, -0.0049877166748046875, 0.000560760498046875, 0.0061092376708984375, 0.01165771484375, 0.017206192016601562, 0.022754669189453125, 0.028303146362304688, 0.03385162353515625, 0.03940010070800781, 0.044948577880859375, 0.05049705505371094, 0.0560455322265625, 0.06159400939941406, 0.06714248657226562, 0.07269096374511719, 0.07823944091796875, 0.08378791809082031, 0.08933639526367188, 0.09488487243652344, 0.100433349609375, 0.10598182678222656, 0.11153030395507812, 0.11707878112792969, 0.12262725830078125, 0.1281757354736328, 0.13372421264648438, 0.13927268981933594, 0.1448211669921875, 0.15036964416503906, 0.15591812133789062, 0.1614665985107422, 0.16701507568359375, 0.1725635528564453, 0.17811203002929688, 0.18366050720214844, 0.189208984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 15.0, 22.0, 27.0, 21.0, 32.0, 26.0, 37.0, 34.0, 38.0, 55.0, 48.0, 54.0, 61.0, 44.0, 55.0, 51.0, 41.0, 49.0, 31.0, 41.0, 44.0, 29.0, 19.0, 25.0, 13.0, 10.0, 7.0, 6.0, 12.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15947532653808594, -0.15427780151367188, -0.1490802764892578, -0.14388275146484375, -0.1386852264404297, -0.13348770141601562, -0.12829017639160156, -0.1230926513671875, -0.11789512634277344, -0.11269760131835938, -0.10750007629394531, -0.10230255126953125, -0.09710502624511719, -0.09190750122070312, -0.08670997619628906, -0.081512451171875, -0.07631492614746094, -0.07111740112304688, -0.06591987609863281, -0.06072235107421875, -0.05552482604980469, -0.050327301025390625, -0.04512977600097656, -0.0399322509765625, -0.03473472595214844, -0.029537200927734375, -0.024339675903320312, -0.01914215087890625, -0.013944625854492188, -0.008747100830078125, -0.0035495758056640625, 0.00164794921875, 0.0068454742431640625, 0.012042999267578125, 0.017240524291992188, 0.02243804931640625, 0.027635574340820312, 0.032833099365234375, 0.03803062438964844, 0.0432281494140625, 0.04842567443847656, 0.053623199462890625, 0.05882072448730469, 0.06401824951171875, 0.06921577453613281, 0.07441329956054688, 0.07961082458496094, 0.084808349609375, 0.09000587463378906, 0.09520339965820312, 0.10040092468261719, 0.10559844970703125, 0.11079597473144531, 0.11599349975585938, 0.12119102478027344, 0.1263885498046875, 0.13158607482910156, 0.13678359985351562, 0.1419811248779297, 0.14717864990234375, 0.1523761749267578, 0.15757369995117188, 0.16277122497558594, 0.16796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 10.0, 8.0, 17.0, 25.0, 35.0, 51.0, 64.0, 115.0, 162.0, 266.0, 489.0, 864.0, 1586.0, 3258.0, 6968.0, 16751.0, 47565.0, 183508.0, 502037.0, 201019.0, 51647.0, 17702.0, 7168.0, 3392.0, 1661.0, 894.0, 502.0, 290.0, 182.0, 103.0, 67.0, 47.0, 32.0, 19.0, 14.0, 11.0, 4.0, 4.0, 5.0, 7.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07781982421875, -0.07535171508789062, -0.07288360595703125, -0.07041549682617188, -0.0679473876953125, -0.06547927856445312, -0.06301116943359375, -0.060543060302734375, -0.058074951171875, -0.055606842041015625, -0.05313873291015625, -0.050670623779296875, -0.0482025146484375, -0.045734405517578125, -0.04326629638671875, -0.040798187255859375, -0.038330078125, -0.035861968994140625, -0.03339385986328125, -0.030925750732421875, -0.0284576416015625, -0.025989532470703125, -0.02352142333984375, -0.021053314208984375, -0.018585205078125, -0.016117095947265625, -0.01364898681640625, -0.011180877685546875, -0.0087127685546875, -0.006244659423828125, -0.00377655029296875, -0.001308441162109375, 0.00115966796875, 0.003627777099609375, 0.00609588623046875, 0.008563995361328125, 0.0110321044921875, 0.013500213623046875, 0.01596832275390625, 0.018436431884765625, 0.020904541015625, 0.023372650146484375, 0.02584075927734375, 0.028308868408203125, 0.0307769775390625, 0.033245086669921875, 0.03571319580078125, 0.038181304931640625, 0.0406494140625, 0.043117523193359375, 0.04558563232421875, 0.048053741455078125, 0.0505218505859375, 0.052989959716796875, 0.05545806884765625, 0.057926177978515625, 0.060394287109375, 0.06286239624023438, 0.06533050537109375, 0.06779861450195312, 0.0702667236328125, 0.07273483276367188, 0.07520294189453125, 0.07767105102539062, 0.08013916015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 18.0, 13.0, 22.0, 16.0, 22.0, 24.0, 29.0, 34.0, 27.0, 45.0, 52.0, 61.0, 65.0, 65.0, 67.0, 55.0, 70.0, 53.0, 40.0, 37.0, 37.0, 32.0, 13.0, 17.0, 16.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.0889565348625183e-05, -2.014264464378357e-05, -1.9395723938941956e-05, -1.8648803234100342e-05, -1.7901882529258728e-05, -1.7154961824417114e-05, -1.64080411195755e-05, -1.5661120414733887e-05, -1.4914199709892273e-05, -1.416727900505066e-05, -1.3420358300209045e-05, -1.2673437595367432e-05, -1.1926516890525818e-05, -1.1179596185684204e-05, -1.043267548084259e-05, -9.685754776000977e-06, -8.938834071159363e-06, -8.191913366317749e-06, -7.444992661476135e-06, -6.6980719566345215e-06, -5.951151251792908e-06, -5.204230546951294e-06, -4.45730984210968e-06, -3.7103891372680664e-06, -2.9634684324264526e-06, -2.216547727584839e-06, -1.469627022743225e-06, -7.227063179016113e-07, 2.421438694000244e-08, 7.711350917816162e-07, 1.51805579662323e-06, 2.2649765014648438e-06, 3.0118972063064575e-06, 3.7588179111480713e-06, 4.505738615989685e-06, 5.252659320831299e-06, 5.999580025672913e-06, 6.746500730514526e-06, 7.49342143535614e-06, 8.240342140197754e-06, 8.987262845039368e-06, 9.734183549880981e-06, 1.0481104254722595e-05, 1.1228024959564209e-05, 1.1974945664405823e-05, 1.2721866369247437e-05, 1.346878707408905e-05, 1.4215707778930664e-05, 1.4962628483772278e-05, 1.570954918861389e-05, 1.6456469893455505e-05, 1.720339059829712e-05, 1.7950311303138733e-05, 1.8697232007980347e-05, 1.944415271282196e-05, 2.0191073417663574e-05, 2.0937994122505188e-05, 2.1684914827346802e-05, 2.2431835532188416e-05, 2.317875623703003e-05, 2.3925676941871643e-05, 2.4672597646713257e-05, 2.541951835155487e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 4.0, 5.0, 6.0, 1.0, 9.0, 12.0, 16.0, 21.0, 33.0, 64.0, 86.0, 138.0, 250.0, 474.0, 924.0, 1936.0, 4957.0, 14525.0, 60555.0, 472016.0, 416408.0, 54288.0, 13481.0, 4526.0, 1889.0, 850.0, 444.0, 232.0, 141.0, 94.0, 55.0, 38.0, 23.0, 19.0, 8.0, 10.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1162109375, -0.11257553100585938, -0.10894012451171875, -0.10530471801757812, -0.1016693115234375, -0.09803390502929688, -0.09439849853515625, -0.09076309204101562, -0.087127685546875, -0.08349227905273438, -0.07985687255859375, -0.07622146606445312, -0.0725860595703125, -0.06895065307617188, -0.06531524658203125, -0.061679840087890625, -0.05804443359375, -0.054409027099609375, -0.05077362060546875, -0.047138214111328125, -0.0435028076171875, -0.039867401123046875, -0.03623199462890625, -0.032596588134765625, -0.028961181640625, -0.025325775146484375, -0.02169036865234375, -0.018054962158203125, -0.0144195556640625, -0.010784149169921875, -0.00714874267578125, -0.003513336181640625, 0.0001220703125, 0.003757476806640625, 0.00739288330078125, 0.011028289794921875, 0.0146636962890625, 0.018299102783203125, 0.02193450927734375, 0.025569915771484375, 0.029205322265625, 0.032840728759765625, 0.03647613525390625, 0.040111541748046875, 0.0437469482421875, 0.047382354736328125, 0.05101776123046875, 0.054653167724609375, 0.05828857421875, 0.061923980712890625, 0.06555938720703125, 0.06919479370117188, 0.0728302001953125, 0.07646560668945312, 0.08010101318359375, 0.08373641967773438, 0.087371826171875, 0.09100723266601562, 0.09464263916015625, 0.09827804565429688, 0.1019134521484375, 0.10554885864257812, 0.10918426513671875, 0.11281967163085938, 0.116455078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 8.0, 5.0, 9.0, 14.0, 22.0, 23.0, 31.0, 48.0, 81.0, 88.0, 97.0, 120.0, 113.0, 80.0, 80.0, 40.0, 34.0, 19.0, 9.0, 15.0, 14.0, 11.0, 11.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08917236328125, -0.08665657043457031, -0.08414077758789062, -0.08162498474121094, -0.07910919189453125, -0.07659339904785156, -0.07407760620117188, -0.07156181335449219, -0.0690460205078125, -0.06653022766113281, -0.06401443481445312, -0.06149864196777344, -0.05898284912109375, -0.05646705627441406, -0.053951263427734375, -0.05143547058105469, -0.048919677734375, -0.04640388488769531, -0.043888092041015625, -0.04137229919433594, -0.03885650634765625, -0.03634071350097656, -0.033824920654296875, -0.03130912780761719, -0.0287933349609375, -0.026277542114257812, -0.023761749267578125, -0.021245956420898438, -0.01873016357421875, -0.016214370727539062, -0.013698577880859375, -0.011182785034179688, -0.0086669921875, -0.0061511993408203125, -0.003635406494140625, -0.0011196136474609375, 0.00139617919921875, 0.0039119720458984375, 0.006427764892578125, 0.008943557739257812, 0.0114593505859375, 0.013975143432617188, 0.016490936279296875, 0.019006729125976562, 0.02152252197265625, 0.024038314819335938, 0.026554107666015625, 0.029069900512695312, 0.031585693359375, 0.03410148620605469, 0.036617279052734375, 0.03913307189941406, 0.04164886474609375, 0.04416465759277344, 0.046680450439453125, 0.04919624328613281, 0.0517120361328125, 0.05422782897949219, 0.056743621826171875, 0.05925941467285156, 0.06177520751953125, 0.06429100036621094, 0.06680679321289062, 0.06932258605957031, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 19.0, 32.0, 57.0, 108.0, 170.0, 187.0, 178.0, 122.0, 54.0, 32.0, 19.0, 13.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748592853546143, -1.1267269849777222, -1.07859468460083, -1.030462384223938, -0.9823301434516907, -0.9341978430747986, -0.8860656023025513, -0.8379333019256592, -0.7898010015487671, -0.741668701171875, -0.6935364007949829, -0.6454041600227356, -0.5972718596458435, -0.5491395592689514, -0.5010073184967041, -0.452875018119812, -0.4047427177429199, -0.35661041736602783, -0.30847814679145813, -0.2603458762168884, -0.21221357583999634, -0.16408129036426544, -0.11594900488853455, -0.06781673431396484, -0.019684433937072754, 0.028447851538658142, 0.07658013701438904, 0.12471242249011993, 0.17284470796585083, 0.22097699344158173, 0.2691092789173126, 0.3172415494918823, 0.3653738498687744, 0.4135061502456665, 0.4616384208202362, 0.5097706913948059, 0.557902991771698, 0.6060352921485901, 0.6541675329208374, 0.7022998332977295, 0.7504321336746216, 0.7985644340515137, 0.8466967344284058, 0.8948289752006531, 0.9429612755775452, 0.9910935759544373, 1.0392258167266846, 1.0873581171035767, 1.1354904174804688, 1.1836227178573608, 1.231755018234253, 1.279887318611145, 1.328019618988037, 1.3761518001556396, 1.4242841005325317, 1.4724164009094238, 1.520548701286316, 1.568681001663208, 1.6168133020401, 1.6649456024169922, 1.7130777835845947, 1.7612100839614868, 1.809342384338379, 1.857474684715271, 1.905606985092163]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 9.0, 7.0, 3.0, 15.0, 9.0, 8.0, 18.0, 20.0, 26.0, 35.0, 39.0, 39.0, 48.0, 36.0, 49.0, 43.0, 65.0, 58.0, 46.0, 54.0, 54.0, 38.0, 44.0, 27.0, 38.0, 32.0, 29.0, 23.0, 11.0, 17.0, 12.0, 12.0, 9.0, 6.0, 7.0, 9.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8695246577262878, -0.8401280641555786, -0.8107314109802246, -0.7813347578048706, -0.7519381642341614, -0.7225415706634521, -0.6931449174880981, -0.6637482643127441, -0.6343516707420349, -0.6049550771713257, -0.5755584239959717, -0.5461617708206177, -0.5167651772499084, -0.48736855387687683, -0.4579719305038452, -0.4285753071308136, -0.399178683757782, -0.36978206038475037, -0.34038543701171875, -0.31098881363868713, -0.2815921902656555, -0.2521955668926239, -0.22279894351959229, -0.19340232014656067, -0.16400569677352905, -0.13460907340049744, -0.10521245002746582, -0.0758158266544342, -0.04641920328140259, -0.01702257990837097, 0.012374043464660645, 0.04177066683769226, 0.0711672306060791, 0.10056385397911072, 0.12996047735214233, 0.15935710072517395, 0.18875372409820557, 0.21815034747123718, 0.2475469708442688, 0.2769435942173004, 0.30634021759033203, 0.33573684096336365, 0.36513346433639526, 0.3945300877094269, 0.4239267110824585, 0.4533233344554901, 0.48271995782852173, 0.512116551399231, 0.541513204574585, 0.570909857749939, 0.6003064513206482, 0.6297030448913574, 0.6590996980667114, 0.6884963512420654, 0.7178929448127747, 0.7472895383834839, 0.7766861915588379, 0.8060828447341919, 0.8354794383049011, 0.8648760318756104, 0.8942726850509644, 0.9236693382263184, 0.9530659317970276, 0.9824625253677368, 1.0118591785430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 6.0, 7.0, 11.0, 18.0, 25.0, 59.0, 116.0, 251.0, 652.0, 1838.0, 6783.0, 35274.0, 3599826.0, 515807.0, 25189.0, 5415.0, 1684.0, 627.0, 309.0, 145.0, 99.0, 55.0, 32.0, 16.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41162109375, -0.4004707336425781, -0.38932037353515625, -0.3781700134277344, -0.3670196533203125, -0.3558692932128906, -0.34471893310546875, -0.3335685729980469, -0.322418212890625, -0.3112678527832031, -0.30011749267578125, -0.2889671325683594, -0.2778167724609375, -0.2666664123535156, -0.25551605224609375, -0.24436569213867188, -0.23321533203125, -0.22206497192382812, -0.21091461181640625, -0.19976425170898438, -0.1886138916015625, -0.17746353149414062, -0.16631317138671875, -0.15516281127929688, -0.144012451171875, -0.13286209106445312, -0.12171173095703125, -0.11056137084960938, -0.0994110107421875, -0.08826065063476562, -0.07711029052734375, -0.06595993041992188, -0.0548095703125, -0.043659210205078125, -0.03250885009765625, -0.021358489990234375, -0.0102081298828125, 0.000942230224609375, 0.01209259033203125, 0.023242950439453125, 0.034393310546875, 0.045543670654296875, 0.05669403076171875, 0.06784439086914062, 0.0789947509765625, 0.09014511108398438, 0.10129547119140625, 0.11244583129882812, 0.12359619140625, 0.13474655151367188, 0.14589691162109375, 0.15704727172851562, 0.1681976318359375, 0.17934799194335938, 0.19049835205078125, 0.20164871215820312, 0.212799072265625, 0.22394943237304688, 0.23509979248046875, 0.24625015258789062, 0.2574005126953125, 0.2685508728027344, 0.27970123291015625, 0.2908515930175781, 0.302001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 5.0, 7.0, 14.0, 15.0, 24.0, 21.0, 42.0, 62.0, 81.0, 79.0, 72.0, 90.0, 94.0, 100.0, 74.0, 52.0, 48.0, 34.0, 29.0, 17.0, 10.0, 11.0, 13.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047088623046875, -0.04561185836791992, -0.044135093688964844, -0.042658329010009766, -0.04118156433105469, -0.03970479965209961, -0.03822803497314453, -0.03675127029418945, -0.035274505615234375, -0.0337977409362793, -0.03232097625732422, -0.03084421157836914, -0.029367446899414062, -0.027890682220458984, -0.026413917541503906, -0.024937152862548828, -0.02346038818359375, -0.021983623504638672, -0.020506858825683594, -0.019030094146728516, -0.017553329467773438, -0.01607656478881836, -0.014599800109863281, -0.013123035430908203, -0.011646270751953125, -0.010169506072998047, -0.008692741394042969, -0.007215976715087891, -0.0057392120361328125, -0.004262447357177734, -0.0027856826782226562, -0.0013089179992675781, 0.0001678466796875, 0.0016446113586425781, 0.0031213760375976562, 0.004598140716552734, 0.0060749053955078125, 0.007551670074462891, 0.009028434753417969, 0.010505199432373047, 0.011981964111328125, 0.013458728790283203, 0.014935493469238281, 0.01641225814819336, 0.017889022827148438, 0.019365787506103516, 0.020842552185058594, 0.022319316864013672, 0.02379608154296875, 0.025272846221923828, 0.026749610900878906, 0.028226375579833984, 0.029703140258789062, 0.03117990493774414, 0.03265666961669922, 0.0341334342956543, 0.035610198974609375, 0.03708696365356445, 0.03856372833251953, 0.04004049301147461, 0.04151725769042969, 0.042994022369384766, 0.044470787048339844, 0.04594755172729492, 0.04742431640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 9.0, 23.0, 24.0, 57.0, 77.0, 125.0, 248.0, 553.0, 1233.0, 3239.0, 10296.0, 47230.0, 634711.0, 3395821.0, 78785.0, 14724.0, 4217.0, 1513.0, 682.0, 290.0, 167.0, 109.0, 53.0, 39.0, 13.0, 19.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29577064514160156, -0.2875862121582031, -0.2794017791748047, -0.27121734619140625, -0.2630329132080078, -0.2548484802246094, -0.24666404724121094, -0.2384796142578125, -0.23029518127441406, -0.22211074829101562, -0.2139263153076172, -0.20574188232421875, -0.1975574493408203, -0.18937301635742188, -0.18118858337402344, -0.173004150390625, -0.16481971740722656, -0.15663528442382812, -0.1484508514404297, -0.14026641845703125, -0.1320819854736328, -0.12389755249023438, -0.11571311950683594, -0.1075286865234375, -0.09934425354003906, -0.09115982055664062, -0.08297538757324219, -0.07479095458984375, -0.06660652160644531, -0.058422088623046875, -0.05023765563964844, -0.04205322265625, -0.03386878967285156, -0.025684356689453125, -0.017499923706054688, -0.00931549072265625, -0.0011310577392578125, 0.007053375244140625, 0.015237808227539062, 0.0234222412109375, 0.03160667419433594, 0.039791107177734375, 0.04797554016113281, 0.05615997314453125, 0.06434440612792969, 0.07252883911132812, 0.08071327209472656, 0.088897705078125, 0.09708213806152344, 0.10526657104492188, 0.11345100402832031, 0.12163543701171875, 0.1298198699951172, 0.13800430297851562, 0.14618873596191406, 0.1543731689453125, 0.16255760192871094, 0.17074203491210938, 0.1789264678955078, 0.18711090087890625, 0.1952953338623047, 0.20347976684570312, 0.21166419982910156, 0.2198486328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 11.0, 8.0, 8.0, 13.0, 19.0, 17.0, 25.0, 43.0, 41.0, 73.0, 100.0, 177.0, 337.0, 1547.0, 881.0, 295.0, 138.0, 98.0, 52.0, 46.0, 22.0, 25.0, 19.0, 13.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04449462890625, -0.04309892654418945, -0.041703224182128906, -0.04030752182006836, -0.03891181945800781, -0.037516117095947266, -0.03612041473388672, -0.03472471237182617, -0.033329010009765625, -0.03193330764770508, -0.03053760528564453, -0.029141902923583984, -0.027746200561523438, -0.02635049819946289, -0.024954795837402344, -0.023559093475341797, -0.02216339111328125, -0.020767688751220703, -0.019371986389160156, -0.01797628402709961, -0.016580581665039062, -0.015184879302978516, -0.013789176940917969, -0.012393474578857422, -0.010997772216796875, -0.009602069854736328, -0.008206367492675781, -0.006810665130615234, -0.0054149627685546875, -0.004019260406494141, -0.0026235580444335938, -0.0012278556823730469, 0.0001678466796875, 0.0015635490417480469, 0.0029592514038085938, 0.004354953765869141, 0.0057506561279296875, 0.007146358489990234, 0.008542060852050781, 0.009937763214111328, 0.011333465576171875, 0.012729167938232422, 0.014124870300292969, 0.015520572662353516, 0.016916275024414062, 0.01831197738647461, 0.019707679748535156, 0.021103382110595703, 0.02249908447265625, 0.023894786834716797, 0.025290489196777344, 0.02668619155883789, 0.028081893920898438, 0.029477596282958984, 0.03087329864501953, 0.03226900100708008, 0.033664703369140625, 0.03506040573120117, 0.03645610809326172, 0.037851810455322266, 0.03924751281738281, 0.04064321517944336, 0.042038917541503906, 0.04343461990356445, 0.044830322265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 11.0, 25.0, 21.0, 42.0, 76.0, 101.0, 118.0, 109.0, 128.0, 110.0, 75.0, 65.0, 36.0, 24.0, 19.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2542146146297455, -0.24508729577064514, -0.2359599769115448, -0.22683264315128326, -0.21770532429218292, -0.20857800543308258, -0.19945067167282104, -0.1903233528137207, -0.18119603395462036, -0.17206871509552002, -0.16294139623641968, -0.15381406247615814, -0.1446867436170578, -0.13555942475795746, -0.12643209099769592, -0.11730477213859558, -0.10817745327949524, -0.0990501344203949, -0.08992280811071396, -0.08079548180103302, -0.07166816294193268, -0.06254084408283234, -0.0534135177731514, -0.04428619146347046, -0.03515887260437012, -0.026031550019979477, -0.016904227435588837, -0.007776904851198196, 0.0013504177331924438, 0.010477740317583084, 0.019605062901973724, 0.028732389211654663, 0.03785967826843262, 0.04698700085282326, 0.0561143234372139, 0.06524164974689484, 0.07436896860599518, 0.08349628746509552, 0.09262361377477646, 0.1017509400844574, 0.11087825894355774, 0.12000557780265808, 0.12913289666175842, 0.13826023042201996, 0.1473875492811203, 0.15651486814022064, 0.16564220190048218, 0.17476952075958252, 0.18389683961868286, 0.1930241584777832, 0.20215147733688354, 0.21127881109714508, 0.22040612995624542, 0.22953344881534576, 0.2386607825756073, 0.24778810143470764, 0.256915420293808, 0.2660427391529083, 0.27517005801200867, 0.284297376871109, 0.29342472553253174, 0.3025520443916321, 0.3116793632507324, 0.32080668210983276, 0.3299340009689331]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 1.0, 6.0, 7.0, 8.0, 11.0, 17.0, 18.0, 28.0, 19.0, 18.0, 30.0, 31.0, 31.0, 32.0, 32.0, 42.0, 41.0, 43.0, 34.0, 36.0, 51.0, 38.0, 53.0, 40.0, 25.0, 32.0, 29.0, 27.0, 32.0, 23.0, 24.0, 24.0, 15.0, 16.0, 12.0, 19.0, 14.0, 5.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.14361059665679932, -0.13893955945968628, -0.13426853716373444, -0.1295975148677826, -0.12492647767066956, -0.12025544792413712, -0.11558441817760468, -0.11091338843107224, -0.1062423586845398, -0.10157132893800735, -0.09690029919147491, -0.09222926944494247, -0.08755823969841003, -0.0828872099518776, -0.07821618020534515, -0.07354515045881271, -0.06887412071228027, -0.06420309096574783, -0.05953206121921539, -0.05486103147268295, -0.05019000172615051, -0.04551897197961807, -0.04084794223308563, -0.03617691248655319, -0.03150588274002075, -0.026834852993488312, -0.02216382324695587, -0.01749279350042343, -0.012821763753890991, -0.008150734007358551, -0.003479704260826111, 0.0011913254857063293, 0.0058623552322387695, 0.01053338497877121, 0.01520441472530365, 0.01987544447183609, 0.02454647421836853, 0.02921750396490097, 0.03388853371143341, 0.03855956345796585, 0.04323059320449829, 0.04790162295103073, 0.05257265269756317, 0.05724368244409561, 0.06191471219062805, 0.06658574193716049, 0.07125677168369293, 0.07592780143022537, 0.08059883117675781, 0.08526986092329025, 0.08994089066982269, 0.09461192041635513, 0.09928295016288757, 0.10395397990942001, 0.10862500965595245, 0.1132960394024849, 0.11796706914901733, 0.12263809889554977, 0.12730912864208221, 0.13198015093803406, 0.1366511881351471, 0.14132222533226013, 0.14599324762821198, 0.15066426992416382, 0.15533530712127686]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 9.0, 15.0, 11.0, 35.0, 49.0, 52.0, 108.0, 174.0, 300.0, 498.0, 865.0, 1681.0, 3649.0, 8800.0, 24380.0, 77122.0, 256678.0, 432966.0, 163272.0, 49835.0, 16294.0, 6100.0, 2656.0, 1284.0, 677.0, 386.0, 242.0, 125.0, 74.0, 72.0, 39.0, 26.0, 18.0, 13.0, 15.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1630859375, -0.15833282470703125, -0.1535797119140625, -0.14882659912109375, -0.144073486328125, -0.13932037353515625, -0.1345672607421875, -0.12981414794921875, -0.12506103515625, -0.12030792236328125, -0.1155548095703125, -0.11080169677734375, -0.106048583984375, -0.10129547119140625, -0.0965423583984375, -0.09178924560546875, -0.0870361328125, -0.08228302001953125, -0.0775299072265625, -0.07277679443359375, -0.068023681640625, -0.06327056884765625, -0.0585174560546875, -0.05376434326171875, -0.04901123046875, -0.04425811767578125, -0.0395050048828125, -0.03475189208984375, -0.029998779296875, -0.02524566650390625, -0.0204925537109375, -0.01573944091796875, -0.010986328125, -0.00623321533203125, -0.0014801025390625, 0.00327301025390625, 0.008026123046875, 0.01277923583984375, 0.0175323486328125, 0.02228546142578125, 0.02703857421875, 0.03179168701171875, 0.0365447998046875, 0.04129791259765625, 0.046051025390625, 0.05080413818359375, 0.0555572509765625, 0.06031036376953125, 0.0650634765625, 0.06981658935546875, 0.0745697021484375, 0.07932281494140625, 0.084075927734375, 0.08882904052734375, 0.0935821533203125, 0.09833526611328125, 0.10308837890625, 0.10784149169921875, 0.1125946044921875, 0.11734771728515625, 0.122100830078125, 0.12685394287109375, 0.1316070556640625, 0.13636016845703125, 0.14111328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 6.0, 13.0, 23.0, 29.0, 38.0, 45.0, 56.0, 71.0, 73.0, 75.0, 89.0, 89.0, 76.0, 62.0, 59.0, 46.0, 37.0, 32.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04115629196166992, -0.039771080017089844, -0.038385868072509766, -0.03700065612792969, -0.03561544418334961, -0.03423023223876953, -0.03284502029418945, -0.031459808349609375, -0.030074596405029297, -0.02868938446044922, -0.02730417251586914, -0.025918960571289062, -0.024533748626708984, -0.023148536682128906, -0.021763324737548828, -0.02037811279296875, -0.018992900848388672, -0.017607688903808594, -0.016222476959228516, -0.014837265014648438, -0.01345205307006836, -0.012066841125488281, -0.010681629180908203, -0.009296417236328125, -0.007911205291748047, -0.006525993347167969, -0.005140781402587891, -0.0037555694580078125, -0.0023703575134277344, -0.0009851455688476562, 0.0004000663757324219, 0.0017852783203125, 0.003170490264892578, 0.004555702209472656, 0.005940914154052734, 0.0073261260986328125, 0.00871133804321289, 0.010096549987792969, 0.011481761932373047, 0.012866973876953125, 0.014252185821533203, 0.01563739776611328, 0.01702260971069336, 0.018407821655273438, 0.019793033599853516, 0.021178245544433594, 0.022563457489013672, 0.02394866943359375, 0.025333881378173828, 0.026719093322753906, 0.028104305267333984, 0.029489517211914062, 0.03087472915649414, 0.03225994110107422, 0.0336451530456543, 0.035030364990234375, 0.03641557693481445, 0.03780078887939453, 0.03918600082397461, 0.04057121276855469, 0.041956424713134766, 0.043341636657714844, 0.04472684860229492, 0.046112060546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 19.0, 28.0, 41.0, 49.0, 85.0, 152.0, 243.0, 447.0, 879.0, 1870.0, 5242.0, 19394.0, 90482.0, 428159.0, 393802.0, 81557.0, 17528.0, 4867.0, 1843.0, 784.0, 451.0, 263.0, 136.0, 70.0, 52.0, 38.0, 19.0, 10.0, 6.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.11526012420654297, -0.10948753356933594, -0.1037149429321289, -0.09794235229492188, -0.09216976165771484, -0.08639717102050781, -0.08062458038330078, -0.07485198974609375, -0.06907939910888672, -0.06330680847167969, -0.057534217834472656, -0.051761627197265625, -0.045989036560058594, -0.04021644592285156, -0.03444385528564453, -0.0286712646484375, -0.02289867401123047, -0.017126083374023438, -0.011353492736816406, -0.005580902099609375, 0.00019168853759765625, 0.0059642791748046875, 0.011736869812011719, 0.01750946044921875, 0.02328205108642578, 0.029054641723632812, 0.034827232360839844, 0.040599822998046875, 0.046372413635253906, 0.05214500427246094, 0.05791759490966797, 0.063690185546875, 0.06946277618408203, 0.07523536682128906, 0.0810079574584961, 0.08678054809570312, 0.09255313873291016, 0.09832572937011719, 0.10409832000732422, 0.10987091064453125, 0.11564350128173828, 0.12141609191894531, 0.12718868255615234, 0.13296127319335938, 0.1387338638305664, 0.14450645446777344, 0.15027904510498047, 0.1560516357421875, 0.16182422637939453, 0.16759681701660156, 0.1733694076538086, 0.17914199829101562, 0.18491458892822266, 0.1906871795654297, 0.19645977020263672, 0.20223236083984375, 0.20800495147705078, 0.2137775421142578, 0.21955013275146484, 0.22532272338867188, 0.2310953140258789, 0.23686790466308594, 0.24264049530029297, 0.2484130859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 10.0, 22.0, 15.0, 15.0, 25.0, 24.0, 38.0, 35.0, 36.0, 46.0, 50.0, 52.0, 52.0, 43.0, 57.0, 41.0, 63.0, 52.0, 43.0, 35.0, 36.0, 33.0, 29.0, 29.0, 24.0, 22.0, 12.0, 9.0, 5.0, 12.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11395263671875, -0.1092233657836914, -0.10449409484863281, -0.09976482391357422, -0.09503555297851562, -0.09030628204345703, -0.08557701110839844, -0.08084774017333984, -0.07611846923828125, -0.07138919830322266, -0.06665992736816406, -0.06193065643310547, -0.057201385498046875, -0.05247211456298828, -0.04774284362792969, -0.043013572692871094, -0.0382843017578125, -0.033555030822753906, -0.028825759887695312, -0.02409648895263672, -0.019367218017578125, -0.014637947082519531, -0.009908676147460938, -0.005179405212402344, -0.00045013427734375, 0.004279136657714844, 0.009008407592773438, 0.013737678527832031, 0.018466949462890625, 0.02319622039794922, 0.027925491333007812, 0.032654762268066406, 0.037384033203125, 0.042113304138183594, 0.04684257507324219, 0.05157184600830078, 0.056301116943359375, 0.06103038787841797, 0.06575965881347656, 0.07048892974853516, 0.07521820068359375, 0.07994747161865234, 0.08467674255371094, 0.08940601348876953, 0.09413528442382812, 0.09886455535888672, 0.10359382629394531, 0.1083230972290039, 0.1130523681640625, 0.1177816390991211, 0.12251091003417969, 0.12724018096923828, 0.13196945190429688, 0.13669872283935547, 0.14142799377441406, 0.14615726470947266, 0.15088653564453125, 0.15561580657958984, 0.16034507751464844, 0.16507434844970703, 0.16980361938476562, 0.17453289031982422, 0.1792621612548828, 0.1839914321899414, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 21.0, 28.0, 37.0, 54.0, 92.0, 142.0, 221.0, 324.0, 590.0, 1064.0, 1897.0, 3868.0, 8177.0, 20205.0, 62332.0, 258846.0, 478556.0, 146678.0, 38714.0, 14047.0, 6157.0, 2944.0, 1480.0, 820.0, 472.0, 274.0, 174.0, 117.0, 64.0, 44.0, 31.0, 23.0, 12.0, 14.0, 9.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059539794921875, -0.057436466217041016, -0.05533313751220703, -0.05322980880737305, -0.05112648010253906, -0.04902315139770508, -0.046919822692871094, -0.04481649398803711, -0.042713165283203125, -0.04060983657836914, -0.038506507873535156, -0.03640317916870117, -0.03429985046386719, -0.0321965217590332, -0.03009319305419922, -0.027989864349365234, -0.02588653564453125, -0.023783206939697266, -0.02167987823486328, -0.019576549530029297, -0.017473220825195312, -0.015369892120361328, -0.013266563415527344, -0.01116323471069336, -0.009059906005859375, -0.006956577301025391, -0.004853248596191406, -0.002749919891357422, -0.0006465911865234375, 0.0014567375183105469, 0.0035600662231445312, 0.005663394927978516, 0.0077667236328125, 0.009870052337646484, 0.011973381042480469, 0.014076709747314453, 0.016180038452148438, 0.018283367156982422, 0.020386695861816406, 0.02249002456665039, 0.024593353271484375, 0.02669668197631836, 0.028800010681152344, 0.030903339385986328, 0.03300666809082031, 0.0351099967956543, 0.03721332550048828, 0.039316654205322266, 0.04141998291015625, 0.043523311614990234, 0.04562664031982422, 0.0477299690246582, 0.04983329772949219, 0.05193662643432617, 0.054039955139160156, 0.05614328384399414, 0.058246612548828125, 0.06034994125366211, 0.062453269958496094, 0.06455659866333008, 0.06665992736816406, 0.06876325607299805, 0.07086658477783203, 0.07296991348266602, 0.0750732421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 6.0, 11.0, 13.0, 29.0, 39.0, 38.0, 66.0, 70.0, 81.0, 86.0, 99.0, 102.0, 87.0, 76.0, 58.0, 27.0, 32.0, 19.0, 16.0, 11.0, 8.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.080815076828003e-05, -2.942979335784912e-05, -2.8051435947418213e-05, -2.6673078536987305e-05, -2.5294721126556396e-05, -2.3916363716125488e-05, -2.253800630569458e-05, -2.1159648895263672e-05, -1.9781291484832764e-05, -1.8402934074401855e-05, -1.7024576663970947e-05, -1.564621925354004e-05, -1.4267861843109131e-05, -1.2889504432678223e-05, -1.1511147022247314e-05, -1.0132789611816406e-05, -8.754432201385498e-06, -7.37607479095459e-06, -5.997717380523682e-06, -4.6193599700927734e-06, -3.2410025596618652e-06, -1.862645149230957e-06, -4.842877388000488e-07, 8.940696716308594e-07, 2.2724270820617676e-06, 3.6507844924926758e-06, 5.029141902923584e-06, 6.407499313354492e-06, 7.7858567237854e-06, 9.164214134216309e-06, 1.0542571544647217e-05, 1.1920928955078125e-05, 1.3299286365509033e-05, 1.4677643775939941e-05, 1.605600118637085e-05, 1.7434358596801758e-05, 1.8812716007232666e-05, 2.0191073417663574e-05, 2.1569430828094482e-05, 2.294778823852539e-05, 2.43261456489563e-05, 2.5704503059387207e-05, 2.7082860469818115e-05, 2.8461217880249023e-05, 2.983957529067993e-05, 3.121793270111084e-05, 3.259629011154175e-05, 3.3974647521972656e-05, 3.5353004932403564e-05, 3.673136234283447e-05, 3.810971975326538e-05, 3.948807716369629e-05, 4.08664345741272e-05, 4.2244791984558105e-05, 4.3623149394989014e-05, 4.500150680541992e-05, 4.637986421585083e-05, 4.775822162628174e-05, 4.9136579036712646e-05, 5.0514936447143555e-05, 5.189329385757446e-05, 5.327165126800537e-05, 5.465000867843628e-05, 5.602836608886719e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 30.0, 55.0, 73.0, 127.0, 239.0, 346.0, 739.0, 1440.0, 3248.0, 8354.0, 25193.0, 112008.0, 573650.0, 256185.0, 44735.0, 12963.0, 4837.0, 2065.0, 998.0, 494.0, 281.0, 158.0, 90.0, 63.0, 35.0, 30.0, 16.0, 16.0, 10.0, 9.0, 0.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07752513885498047, -0.07472801208496094, -0.0719308853149414, -0.06913375854492188, -0.06633663177490234, -0.06353950500488281, -0.06074237823486328, -0.05794525146484375, -0.05514812469482422, -0.05235099792480469, -0.049553871154785156, -0.046756744384765625, -0.043959617614746094, -0.04116249084472656, -0.03836536407470703, -0.0355682373046875, -0.03277111053466797, -0.029973983764648438, -0.027176856994628906, -0.024379730224609375, -0.021582603454589844, -0.018785476684570312, -0.01598834991455078, -0.01319122314453125, -0.010394096374511719, -0.0075969696044921875, -0.004799842834472656, -0.002002716064453125, 0.0007944107055664062, 0.0035915374755859375, 0.006388664245605469, 0.009185791015625, 0.011982917785644531, 0.014780044555664062, 0.017577171325683594, 0.020374298095703125, 0.023171424865722656, 0.025968551635742188, 0.02876567840576172, 0.03156280517578125, 0.03435993194580078, 0.03715705871582031, 0.039954185485839844, 0.042751312255859375, 0.045548439025878906, 0.04834556579589844, 0.05114269256591797, 0.0539398193359375, 0.05673694610595703, 0.05953407287597656, 0.062331199645996094, 0.06512832641601562, 0.06792545318603516, 0.07072257995605469, 0.07351970672607422, 0.07631683349609375, 0.07911396026611328, 0.08191108703613281, 0.08470821380615234, 0.08750534057617188, 0.0903024673461914, 0.09309959411621094, 0.09589672088623047, 0.09869384765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 7.0, 13.0, 12.0, 24.0, 29.0, 51.0, 59.0, 77.0, 93.0, 88.0, 109.0, 87.0, 66.0, 77.0, 61.0, 29.0, 24.0, 26.0, 13.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056732177734375, -0.05472898483276367, -0.052725791931152344, -0.050722599029541016, -0.04871940612792969, -0.04671621322631836, -0.04471302032470703, -0.0427098274230957, -0.040706634521484375, -0.03870344161987305, -0.03670024871826172, -0.03469705581665039, -0.03269386291503906, -0.030690670013427734, -0.028687477111816406, -0.026684284210205078, -0.02468109130859375, -0.022677898406982422, -0.020674705505371094, -0.018671512603759766, -0.016668319702148438, -0.01466512680053711, -0.012661933898925781, -0.010658740997314453, -0.008655548095703125, -0.006652355194091797, -0.004649162292480469, -0.0026459693908691406, -0.0006427764892578125, 0.0013604164123535156, 0.0033636093139648438, 0.005366802215576172, 0.0073699951171875, 0.009373188018798828, 0.011376380920410156, 0.013379573822021484, 0.015382766723632812, 0.01738595962524414, 0.01938915252685547, 0.021392345428466797, 0.023395538330078125, 0.025398731231689453, 0.02740192413330078, 0.02940511703491211, 0.03140830993652344, 0.033411502838134766, 0.035414695739746094, 0.03741788864135742, 0.03942108154296875, 0.04142427444458008, 0.043427467346191406, 0.045430660247802734, 0.04743385314941406, 0.04943704605102539, 0.05144023895263672, 0.05344343185424805, 0.055446624755859375, 0.0574498176574707, 0.05945301055908203, 0.06145620346069336, 0.06345939636230469, 0.06546258926391602, 0.06746578216552734, 0.06946897506713867, 0.07147216796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 16.0, 26.0, 51.0, 48.0, 68.0, 118.0, 113.0, 126.0, 104.0, 96.0, 73.0, 42.0, 34.0, 27.0, 16.0, 6.0, 4.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873810887336731, -0.844957172870636, -0.816103458404541, -0.787249743938446, -0.7583960294723511, -0.7295423746109009, -0.7006886601448059, -0.6718349456787109, -0.642981231212616, -0.614127516746521, -0.585273802280426, -0.556420087814331, -0.5275664329528809, -0.4987126886844635, -0.4698590040206909, -0.44100528955459595, -0.412151575088501, -0.383297860622406, -0.35444414615631104, -0.32559046149253845, -0.2967367470264435, -0.2678830325603485, -0.23902933299541473, -0.21017563343048096, -0.181321918964386, -0.15246820449829102, -0.12361450493335724, -0.09476079791784286, -0.06590709090232849, -0.03705337643623352, -0.008199676871299744, 0.020654022693634033, 0.049507737159729004, 0.07836144417524338, 0.10721515119075775, 0.13606885075569153, 0.1649225652217865, 0.19377627968788147, 0.22262997925281525, 0.251483678817749, 0.280337393283844, 0.30919110774993896, 0.33804482221603394, 0.3668985068798065, 0.3957522213459015, 0.42460593581199646, 0.45345962047576904, 0.482313334941864, 0.511167049407959, 0.540020763874054, 0.5688744783401489, 0.5977281928062439, 0.6265819072723389, 0.6554355621337891, 0.684289276599884, 0.713142991065979, 0.741996705532074, 0.770850419998169, 0.7997041344642639, 0.8285578489303589, 0.8574115037918091, 0.8862652778625488, 0.915118932723999, 0.943972647190094, 0.972826361656189]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 12.0, 19.0, 7.0, 17.0, 20.0, 14.0, 37.0, 33.0, 41.0, 45.0, 52.0, 68.0, 60.0, 62.0, 58.0, 64.0, 65.0, 46.0, 44.0, 48.0, 42.0, 36.0, 30.0, 21.0, 10.0, 13.0, 8.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9815332889556885, -0.9500988721847534, -0.9186645150184631, -0.8872301578521729, -0.8557957410812378, -0.8243613243103027, -0.7929269671440125, -0.7614926099777222, -0.7300581932067871, -0.698623776435852, -0.6671894192695618, -0.6357550621032715, -0.6043206453323364, -0.5728862285614014, -0.5414518713951111, -0.5100175142288208, -0.47858309745788574, -0.44714871048927307, -0.4157143235206604, -0.38427993655204773, -0.35284554958343506, -0.3214111626148224, -0.2899767756462097, -0.25854238867759705, -0.22710800170898438, -0.1956736147403717, -0.16423922777175903, -0.13280484080314636, -0.10137045383453369, -0.06993606686592102, -0.03850167989730835, -0.007067292928695679, 0.024367094039916992, 0.05580148100852966, 0.08723586797714233, 0.118670254945755, 0.15010464191436768, 0.18153902888298035, 0.21297341585159302, 0.2444078028202057, 0.27584218978881836, 0.30727657675743103, 0.3387109637260437, 0.37014535069465637, 0.40157973766326904, 0.4330141246318817, 0.4644485116004944, 0.49588289856910706, 0.5273172855377197, 0.5587517023086548, 0.5901860594749451, 0.6216204166412354, 0.6530548334121704, 0.6844892501831055, 0.7159236073493958, 0.747357964515686, 0.7787923812866211, 0.8102267980575562, 0.8416611552238464, 0.8730955123901367, 0.9045299291610718, 0.9359643459320068, 0.9673987030982971, 0.9988330602645874, 1.0302674770355225]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 11.0, 17.0, 28.0, 61.0, 70.0, 129.0, 233.0, 396.0, 770.0, 1397.0, 3074.0, 7296.0, 20248.0, 80001.0, 2480232.0, 1493597.0, 73408.0, 19405.0, 6990.0, 3150.0, 1539.0, 815.0, 482.0, 284.0, 203.0, 129.0, 76.0, 50.0, 32.0, 36.0, 24.0, 22.0, 15.0, 14.0, 7.0, 7.0, 4.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2025146484375, -0.1961822509765625, -0.189849853515625, -0.1835174560546875, -0.17718505859375, -0.1708526611328125, -0.164520263671875, -0.1581878662109375, -0.15185546875, -0.1455230712890625, -0.139190673828125, -0.1328582763671875, -0.12652587890625, -0.1201934814453125, -0.113861083984375, -0.1075286865234375, -0.1011962890625, -0.0948638916015625, -0.088531494140625, -0.0821990966796875, -0.07586669921875, -0.0695343017578125, -0.063201904296875, -0.0568695068359375, -0.050537109375, -0.0442047119140625, -0.037872314453125, -0.0315399169921875, -0.02520751953125, -0.0188751220703125, -0.012542724609375, -0.0062103271484375, 0.0001220703125, 0.0064544677734375, 0.012786865234375, 0.0191192626953125, 0.02545166015625, 0.0317840576171875, 0.038116455078125, 0.0444488525390625, 0.05078125, 0.0571136474609375, 0.063446044921875, 0.0697784423828125, 0.07611083984375, 0.0824432373046875, 0.088775634765625, 0.0951080322265625, 0.1014404296875, 0.1077728271484375, 0.114105224609375, 0.1204376220703125, 0.12677001953125, 0.1331024169921875, 0.139434814453125, 0.1457672119140625, 0.152099609375, 0.1584320068359375, 0.164764404296875, 0.1710968017578125, 0.17742919921875, 0.1837615966796875, 0.190093994140625, 0.1964263916015625, 0.2027587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 8.0, 11.0, 13.0, 28.0, 34.0, 51.0, 70.0, 70.0, 77.0, 86.0, 75.0, 95.0, 78.0, 81.0, 65.0, 34.0, 42.0, 15.0, 12.0, 11.0, 11.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04193115234375, -0.04046344757080078, -0.03899574279785156, -0.037528038024902344, -0.036060333251953125, -0.034592628479003906, -0.03312492370605469, -0.03165721893310547, -0.03018951416015625, -0.02872180938720703, -0.027254104614257812, -0.025786399841308594, -0.024318695068359375, -0.022850990295410156, -0.021383285522460938, -0.01991558074951172, -0.0184478759765625, -0.01698017120361328, -0.015512466430664062, -0.014044761657714844, -0.012577056884765625, -0.011109352111816406, -0.009641647338867188, -0.008173942565917969, -0.00670623779296875, -0.005238533020019531, -0.0037708282470703125, -0.0023031234741210938, -0.000835418701171875, 0.0006322860717773438, 0.0020999908447265625, 0.0035676956176757812, 0.005035400390625, 0.006503105163574219, 0.007970809936523438, 0.009438514709472656, 0.010906219482421875, 0.012373924255371094, 0.013841629028320312, 0.015309333801269531, 0.01677703857421875, 0.01824474334716797, 0.019712448120117188, 0.021180152893066406, 0.022647857666015625, 0.024115562438964844, 0.025583267211914062, 0.02705097198486328, 0.0285186767578125, 0.02998638153076172, 0.03145408630371094, 0.032921791076660156, 0.034389495849609375, 0.035857200622558594, 0.03732490539550781, 0.03879261016845703, 0.04026031494140625, 0.04172801971435547, 0.04319572448730469, 0.044663429260253906, 0.046131134033203125, 0.047598838806152344, 0.04906654357910156, 0.05053424835205078, 0.052001953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 9.0, 17.0, 27.0, 33.0, 61.0, 89.0, 132.0, 218.0, 414.0, 701.0, 1310.0, 2748.0, 6122.0, 15746.0, 48169.0, 217607.0, 3215349.0, 562354.0, 83119.0, 23553.0, 8711.0, 3842.0, 1754.0, 904.0, 475.0, 282.0, 176.0, 99.0, 73.0, 45.0, 29.0, 31.0, 12.0, 6.0, 11.0, 5.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15880966186523438, -0.15380096435546875, -0.14879226684570312, -0.1437835693359375, -0.13877487182617188, -0.13376617431640625, -0.12875747680664062, -0.123748779296875, -0.11874008178710938, -0.11373138427734375, -0.10872268676757812, -0.1037139892578125, -0.09870529174804688, -0.09369659423828125, -0.08868789672851562, -0.08367919921875, -0.07867050170898438, -0.07366180419921875, -0.06865310668945312, -0.0636444091796875, -0.058635711669921875, -0.05362701416015625, -0.048618316650390625, -0.043609619140625, -0.038600921630859375, -0.03359222412109375, -0.028583526611328125, -0.0235748291015625, -0.018566131591796875, -0.01355743408203125, -0.008548736572265625, -0.0035400390625, 0.001468658447265625, 0.00647735595703125, 0.011486053466796875, 0.0164947509765625, 0.021503448486328125, 0.02651214599609375, 0.031520843505859375, 0.036529541015625, 0.041538238525390625, 0.04654693603515625, 0.051555633544921875, 0.0565643310546875, 0.061573028564453125, 0.06658172607421875, 0.07159042358398438, 0.07659912109375, 0.08160781860351562, 0.08661651611328125, 0.09162521362304688, 0.0966339111328125, 0.10164260864257812, 0.10665130615234375, 0.11166000366210938, 0.116668701171875, 0.12167739868164062, 0.12668609619140625, 0.13169479370117188, 0.1367034912109375, 0.14171218872070312, 0.14672088623046875, 0.15172958374023438, 0.15673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 13.0, 17.0, 32.0, 34.0, 30.0, 38.0, 63.0, 103.0, 147.0, 267.0, 609.0, 1355.0, 563.0, 281.0, 130.0, 91.0, 56.0, 52.0, 30.0, 28.0, 25.0, 16.0, 12.0, 13.0, 7.0, 8.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046417236328125, -0.04452180862426758, -0.042626380920410156, -0.040730953216552734, -0.03883552551269531, -0.03694009780883789, -0.03504467010498047, -0.03314924240112305, -0.031253814697265625, -0.029358386993408203, -0.02746295928955078, -0.02556753158569336, -0.023672103881835938, -0.021776676177978516, -0.019881248474121094, -0.017985820770263672, -0.01609039306640625, -0.014194965362548828, -0.012299537658691406, -0.010404109954833984, -0.008508682250976562, -0.006613254547119141, -0.004717826843261719, -0.002822399139404297, -0.000926971435546875, 0.0009684562683105469, 0.0028638839721679688, 0.004759311676025391, 0.0066547393798828125, 0.008550167083740234, 0.010445594787597656, 0.012341022491455078, 0.0142364501953125, 0.016131877899169922, 0.018027305603027344, 0.019922733306884766, 0.021818161010742188, 0.02371358871459961, 0.02560901641845703, 0.027504444122314453, 0.029399871826171875, 0.0312952995300293, 0.03319072723388672, 0.03508615493774414, 0.03698158264160156, 0.038877010345458984, 0.040772438049316406, 0.04266786575317383, 0.04456329345703125, 0.04645872116088867, 0.048354148864746094, 0.050249576568603516, 0.05214500427246094, 0.05404043197631836, 0.05593585968017578, 0.0578312873840332, 0.059726715087890625, 0.06162214279174805, 0.06351757049560547, 0.06541299819946289, 0.06730842590332031, 0.06920385360717773, 0.07109928131103516, 0.07299470901489258, 0.07489013671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 8.0, 9.0, 22.0, 52.0, 73.0, 118.0, 153.0, 161.0, 135.0, 103.0, 72.0, 44.0, 21.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5998169183731079, -0.5819693803787231, -0.5641219019889832, -0.5462743639945984, -0.5284268856048584, -0.5105793476104736, -0.49273183941841125, -0.4748843312263489, -0.4570368230342865, -0.4391893148422241, -0.42134180665016174, -0.40349429845809937, -0.3856467604637146, -0.3677992820739746, -0.34995174407958984, -0.33210423588752747, -0.3142567276954651, -0.2964092195034027, -0.27856171131134033, -0.26071420311927795, -0.24286668002605438, -0.225019171833992, -0.20717164874076843, -0.18932414054870605, -0.17147663235664368, -0.1536291241645813, -0.13578161597251892, -0.11793409287929535, -0.10008658468723297, -0.0822390764951706, -0.06439156085252762, -0.046544045209884644, -0.028696537017822266, -0.01084902510046959, 0.006998486816883087, 0.024845998734235764, 0.04269351065158844, 0.06054101884365082, 0.07838853448629379, 0.09623605012893677, 0.11408355832099915, 0.13193106651306152, 0.1497785747051239, 0.16762609779834747, 0.18547360599040985, 0.20332111418247223, 0.2211686372756958, 0.23901614546775818, 0.25686365365982056, 0.27471116185188293, 0.2925586700439453, 0.3104061782360077, 0.32825368642807007, 0.34610122442245483, 0.3639487326145172, 0.3817962408065796, 0.39964374899864197, 0.41749125719070435, 0.4353387653827667, 0.4531862735748291, 0.47103381156921387, 0.48888128995895386, 0.5067288279533386, 0.5245763063430786, 0.5424238443374634]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 12.0, 8.0, 19.0, 12.0, 18.0, 25.0, 35.0, 37.0, 36.0, 55.0, 52.0, 47.0, 46.0, 53.0, 62.0, 45.0, 53.0, 44.0, 42.0, 33.0, 35.0, 40.0, 30.0, 25.0, 33.0, 26.0, 10.0, 10.0, 12.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29416346549987793, -0.28543680906295776, -0.2767101526260376, -0.26798349618911743, -0.25925686955451965, -0.2505302131175995, -0.24180355668067932, -0.23307690024375916, -0.224350243806839, -0.21562358736991882, -0.20689694583415985, -0.19817028939723969, -0.18944363296031952, -0.18071699142456055, -0.17199033498764038, -0.16326367855072021, -0.15453703701496124, -0.14581038057804108, -0.1370837390422821, -0.12835708260536194, -0.11963042616844177, -0.1109037771821022, -0.10217712819576263, -0.09345047175884247, -0.0847238227725029, -0.07599717378616333, -0.06727051734924316, -0.058543868362903595, -0.04981721565127373, -0.04109056293964386, -0.03236391395330429, -0.023637261241674423, -0.014910608530044556, -0.006183956749737263, 0.00254269503057003, 0.011269345879554749, 0.019995998591184616, 0.028722651302814484, 0.03744930028915405, 0.04617595300078392, 0.05490260571241379, 0.06362925469875336, 0.07235591113567352, 0.08108256012201309, 0.08980920910835266, 0.09853586554527283, 0.1072625145316124, 0.11598916351795197, 0.12471581995487213, 0.1334424763917923, 0.14216911792755127, 0.15089577436447144, 0.1596224308013916, 0.16834908723831177, 0.17707572877407074, 0.1858023852109909, 0.19452902674674988, 0.20325568318367004, 0.21198232471942902, 0.22070898115634918, 0.22943563759326935, 0.23816227912902832, 0.2468889355659485, 0.25561559200286865, 0.2643422484397888]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 16.0, 10.0, 27.0, 35.0, 51.0, 68.0, 127.0, 148.0, 272.0, 471.0, 871.0, 1823.0, 4366.0, 11561.0, 34540.0, 127757.0, 531695.0, 246043.0, 58908.0, 17974.0, 6456.0, 2602.0, 1182.0, 590.0, 318.0, 207.0, 125.0, 84.0, 58.0, 43.0, 23.0, 19.0, 17.0, 14.0, 5.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.233154296875, -0.22623825073242188, -0.21932220458984375, -0.21240615844726562, -0.2054901123046875, -0.19857406616210938, -0.19165802001953125, -0.18474197387695312, -0.177825927734375, -0.17090988159179688, -0.16399383544921875, -0.15707778930664062, -0.1501617431640625, -0.14324569702148438, -0.13632965087890625, -0.12941360473632812, -0.12249755859375, -0.11558151245117188, -0.10866546630859375, -0.10174942016601562, -0.0948333740234375, -0.08791732788085938, -0.08100128173828125, -0.07408523559570312, -0.067169189453125, -0.060253143310546875, -0.05333709716796875, -0.046421051025390625, -0.0395050048828125, -0.032588958740234375, -0.02567291259765625, -0.018756866455078125, -0.0118408203125, -0.004924774169921875, 0.00199127197265625, 0.008907318115234375, 0.0158233642578125, 0.022739410400390625, 0.02965545654296875, 0.036571502685546875, 0.043487548828125, 0.050403594970703125, 0.05731964111328125, 0.06423568725585938, 0.0711517333984375, 0.07806777954101562, 0.08498382568359375, 0.09189987182617188, 0.09881591796875, 0.10573196411132812, 0.11264801025390625, 0.11956405639648438, 0.1264801025390625, 0.13339614868164062, 0.14031219482421875, 0.14722824096679688, 0.154144287109375, 0.16106033325195312, 0.16797637939453125, 0.17489242553710938, 0.1818084716796875, 0.18872451782226562, 0.19564056396484375, 0.20255661010742188, 0.20947265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 11.0, 13.0, 12.0, 25.0, 59.0, 53.0, 71.0, 81.0, 94.0, 89.0, 105.0, 83.0, 93.0, 57.0, 53.0, 26.0, 26.0, 8.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053558349609375, -0.05197334289550781, -0.050388336181640625, -0.04880332946777344, -0.04721832275390625, -0.04563331604003906, -0.044048309326171875, -0.04246330261230469, -0.0408782958984375, -0.03929328918457031, -0.037708282470703125, -0.03612327575683594, -0.03453826904296875, -0.03295326232910156, -0.031368255615234375, -0.029783248901367188, -0.0281982421875, -0.026613235473632812, -0.025028228759765625, -0.023443222045898438, -0.02185821533203125, -0.020273208618164062, -0.018688201904296875, -0.017103195190429688, -0.0155181884765625, -0.013933181762695312, -0.012348175048828125, -0.010763168334960938, -0.00917816162109375, -0.0075931549072265625, -0.006008148193359375, -0.0044231414794921875, -0.002838134765625, -0.0012531280517578125, 0.000331878662109375, 0.0019168853759765625, 0.00350189208984375, 0.0050868988037109375, 0.006671905517578125, 0.008256912231445312, 0.0098419189453125, 0.011426925659179688, 0.013011932373046875, 0.014596939086914062, 0.01618194580078125, 0.017766952514648438, 0.019351959228515625, 0.020936965942382812, 0.02252197265625, 0.024106979370117188, 0.025691986083984375, 0.027276992797851562, 0.02886199951171875, 0.030447006225585938, 0.032032012939453125, 0.03361701965332031, 0.0352020263671875, 0.03678703308105469, 0.038372039794921875, 0.03995704650878906, 0.04154205322265625, 0.04312705993652344, 0.044712066650390625, 0.04629707336425781, 0.047882080078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 11.0, 15.0, 21.0, 32.0, 51.0, 57.0, 86.0, 126.0, 158.0, 250.0, 409.0, 634.0, 999.0, 1620.0, 3030.0, 5454.0, 10959.0, 25133.0, 60753.0, 160726.0, 392742.0, 234775.0, 85844.0, 34184.0, 14697.0, 6975.0, 3489.0, 1961.0, 1157.0, 746.0, 449.0, 301.0, 207.0, 149.0, 82.0, 85.0, 55.0, 41.0, 24.0, 11.0, 12.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11004638671875, -0.10620975494384766, -0.10237312316894531, -0.09853649139404297, -0.09469985961914062, -0.09086322784423828, -0.08702659606933594, -0.0831899642944336, -0.07935333251953125, -0.0755167007446289, -0.07168006896972656, -0.06784343719482422, -0.06400680541992188, -0.06017017364501953, -0.05633354187011719, -0.052496910095214844, -0.0486602783203125, -0.044823646545410156, -0.04098701477050781, -0.03715038299560547, -0.033313751220703125, -0.02947711944580078, -0.025640487670898438, -0.021803855895996094, -0.01796722412109375, -0.014130592346191406, -0.010293960571289062, -0.006457328796386719, -0.002620697021484375, 0.0012159347534179688, 0.0050525665283203125, 0.008889198303222656, 0.012725830078125, 0.016562461853027344, 0.020399093627929688, 0.02423572540283203, 0.028072357177734375, 0.03190898895263672, 0.03574562072753906, 0.039582252502441406, 0.04341888427734375, 0.047255516052246094, 0.05109214782714844, 0.05492877960205078, 0.058765411376953125, 0.06260204315185547, 0.06643867492675781, 0.07027530670166016, 0.0741119384765625, 0.07794857025146484, 0.08178520202636719, 0.08562183380126953, 0.08945846557617188, 0.09329509735107422, 0.09713172912597656, 0.1009683609008789, 0.10480499267578125, 0.1086416244506836, 0.11247825622558594, 0.11631488800048828, 0.12015151977539062, 0.12398815155029297, 0.1278247833251953, 0.13166141510009766, 0.135498046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 12.0, 14.0, 6.0, 12.0, 12.0, 25.0, 17.0, 22.0, 20.0, 26.0, 38.0, 36.0, 38.0, 36.0, 49.0, 54.0, 48.0, 54.0, 52.0, 41.0, 40.0, 48.0, 39.0, 37.0, 40.0, 37.0, 27.0, 32.0, 21.0, 11.0, 13.0, 14.0, 11.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1583251953125, -0.15381431579589844, -0.14930343627929688, -0.1447925567626953, -0.14028167724609375, -0.1357707977294922, -0.13125991821289062, -0.12674903869628906, -0.1222381591796875, -0.11772727966308594, -0.11321640014648438, -0.10870552062988281, -0.10419464111328125, -0.09968376159667969, -0.09517288208007812, -0.09066200256347656, -0.086151123046875, -0.08164024353027344, -0.07712936401367188, -0.07261848449707031, -0.06810760498046875, -0.06359672546386719, -0.059085845947265625, -0.05457496643066406, -0.0500640869140625, -0.04555320739746094, -0.041042327880859375, -0.03653144836425781, -0.03202056884765625, -0.027509689331054688, -0.022998809814453125, -0.018487930297851562, -0.01397705078125, -0.009466171264648438, -0.004955291748046875, -0.0004444122314453125, 0.00406646728515625, 0.008577346801757812, 0.013088226318359375, 0.017599105834960938, 0.0221099853515625, 0.026620864868164062, 0.031131744384765625, 0.03564262390136719, 0.04015350341796875, 0.04466438293457031, 0.049175262451171875, 0.05368614196777344, 0.058197021484375, 0.06270790100097656, 0.06721878051757812, 0.07172966003417969, 0.07624053955078125, 0.08075141906738281, 0.08526229858398438, 0.08977317810058594, 0.0942840576171875, 0.09879493713378906, 0.10330581665039062, 0.10781669616699219, 0.11232757568359375, 0.11683845520019531, 0.12134933471679688, 0.12586021423339844, 0.13037109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 8.0, 19.0, 16.0, 21.0, 42.0, 77.0, 140.0, 269.0, 456.0, 863.0, 1595.0, 3412.0, 7972.0, 22199.0, 95983.0, 586159.0, 263334.0, 43231.0, 12686.0, 5011.0, 2356.0, 1237.0, 634.0, 320.0, 174.0, 117.0, 76.0, 47.0, 33.0, 14.0, 7.0, 13.0, 12.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.13231277465820312, -0.12827301025390625, -0.12423324584960938, -0.1201934814453125, -0.11615371704101562, -0.11211395263671875, -0.10807418823242188, -0.104034423828125, -0.09999465942382812, -0.09595489501953125, -0.09191513061523438, -0.0878753662109375, -0.08383560180664062, -0.07979583740234375, -0.07575607299804688, -0.07171630859375, -0.06767654418945312, -0.06363677978515625, -0.059597015380859375, -0.0555572509765625, -0.051517486572265625, -0.04747772216796875, -0.043437957763671875, -0.039398193359375, -0.035358428955078125, -0.03131866455078125, -0.027278900146484375, -0.0232391357421875, -0.019199371337890625, -0.01515960693359375, -0.011119842529296875, -0.007080078125, -0.003040313720703125, 0.00099945068359375, 0.005039215087890625, 0.0090789794921875, 0.013118743896484375, 0.01715850830078125, 0.021198272705078125, 0.025238037109375, 0.029277801513671875, 0.03331756591796875, 0.037357330322265625, 0.0413970947265625, 0.045436859130859375, 0.04947662353515625, 0.053516387939453125, 0.05755615234375, 0.061595916748046875, 0.06563568115234375, 0.06967544555664062, 0.0737152099609375, 0.07775497436523438, 0.08179473876953125, 0.08583450317382812, 0.089874267578125, 0.09391403198242188, 0.09795379638671875, 0.10199356079101562, 0.1060333251953125, 0.11007308959960938, 0.11411285400390625, 0.11815261840820312, 0.1221923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 8.0, 2.0, 7.0, 7.0, 15.0, 25.0, 32.0, 46.0, 45.0, 73.0, 94.0, 88.0, 87.0, 87.0, 84.0, 60.0, 51.0, 54.0, 48.0, 22.0, 15.0, 20.0, 12.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.64320182800293e-05, -4.516635090112686e-05, -4.3900683522224426e-05, -4.263501614332199e-05, -4.1369348764419556e-05, -4.010368138551712e-05, -3.8838014006614685e-05, -3.757234662771225e-05, -3.6306679248809814e-05, -3.504101186990738e-05, -3.3775344491004944e-05, -3.250967711210251e-05, -3.124400973320007e-05, -2.9978342354297638e-05, -2.8712674975395203e-05, -2.7447007596492767e-05, -2.6181340217590332e-05, -2.4915672838687897e-05, -2.365000545978546e-05, -2.2384338080883026e-05, -2.111867070198059e-05, -1.9853003323078156e-05, -1.858733594417572e-05, -1.7321668565273285e-05, -1.605600118637085e-05, -1.4790333807468414e-05, -1.3524666428565979e-05, -1.2258999049663544e-05, -1.0993331670761108e-05, -9.727664291858673e-06, -8.461996912956238e-06, -7.1963295340538025e-06, -5.930662155151367e-06, -4.664994776248932e-06, -3.3993273973464966e-06, -2.1336600184440613e-06, -8.67992639541626e-07, 3.976747393608093e-07, 1.6633421182632446e-06, 2.92900949716568e-06, 4.194676876068115e-06, 5.4603442549705505e-06, 6.726011633872986e-06, 7.991679012775421e-06, 9.257346391677856e-06, 1.0523013770580292e-05, 1.1788681149482727e-05, 1.3054348528385162e-05, 1.4320015907287598e-05, 1.5585683286190033e-05, 1.6851350665092468e-05, 1.8117018043994904e-05, 1.938268542289734e-05, 2.0648352801799774e-05, 2.191402018070221e-05, 2.3179687559604645e-05, 2.444535493850708e-05, 2.5711022317409515e-05, 2.697668969631195e-05, 2.8242357075214386e-05, 2.950802445411682e-05, 3.0773691833019257e-05, 3.203935921192169e-05, 3.330502659082413e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 13.0, 13.0, 20.0, 29.0, 46.0, 45.0, 80.0, 118.0, 199.0, 347.0, 602.0, 1313.0, 2903.0, 7025.0, 21087.0, 87356.0, 557240.0, 298482.0, 48954.0, 13447.0, 4935.0, 2085.0, 961.0, 519.0, 267.0, 175.0, 92.0, 67.0, 38.0, 30.0, 15.0, 20.0, 10.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1343994140625, -0.13074874877929688, -0.12709808349609375, -0.12344741821289062, -0.1197967529296875, -0.11614608764648438, -0.11249542236328125, -0.10884475708007812, -0.105194091796875, -0.10154342651367188, -0.09789276123046875, -0.09424209594726562, -0.0905914306640625, -0.08694076538085938, -0.08329010009765625, -0.07963943481445312, -0.07598876953125, -0.07233810424804688, -0.06868743896484375, -0.06503677368164062, -0.0613861083984375, -0.057735443115234375, -0.05408477783203125, -0.050434112548828125, -0.046783447265625, -0.043132781982421875, -0.03948211669921875, -0.035831451416015625, -0.0321807861328125, -0.028530120849609375, -0.02487945556640625, -0.021228790283203125, -0.017578125, -0.013927459716796875, -0.01027679443359375, -0.006626129150390625, -0.0029754638671875, 0.000675201416015625, 0.00432586669921875, 0.007976531982421875, 0.011627197265625, 0.015277862548828125, 0.01892852783203125, 0.022579193115234375, 0.0262298583984375, 0.029880523681640625, 0.03353118896484375, 0.037181854248046875, 0.04083251953125, 0.044483184814453125, 0.04813385009765625, 0.051784515380859375, 0.0554351806640625, 0.059085845947265625, 0.06273651123046875, 0.06638717651367188, 0.070037841796875, 0.07368850708007812, 0.07733917236328125, 0.08098983764648438, 0.0846405029296875, 0.08829116821289062, 0.09194183349609375, 0.09559249877929688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 8.0, 12.0, 12.0, 12.0, 23.0, 27.0, 39.0, 65.0, 103.0, 141.0, 148.0, 125.0, 76.0, 53.0, 31.0, 21.0, 20.0, 15.0, 11.0, 13.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.08706188201904297, -0.08397483825683594, -0.0808877944946289, -0.07780075073242188, -0.07471370697021484, -0.07162666320800781, -0.06853961944580078, -0.06545257568359375, -0.06236553192138672, -0.05927848815917969, -0.056191444396972656, -0.053104400634765625, -0.050017356872558594, -0.04693031311035156, -0.04384326934814453, -0.0407562255859375, -0.03766918182373047, -0.03458213806152344, -0.031495094299316406, -0.028408050537109375, -0.025321006774902344, -0.022233963012695312, -0.01914691925048828, -0.01605987548828125, -0.012972831726074219, -0.009885787963867188, -0.006798744201660156, -0.003711700439453125, -0.0006246566772460938, 0.0024623870849609375, 0.005549430847167969, 0.008636474609375, 0.011723518371582031, 0.014810562133789062, 0.017897605895996094, 0.020984649658203125, 0.024071693420410156, 0.027158737182617188, 0.03024578094482422, 0.03333282470703125, 0.03641986846923828, 0.03950691223144531, 0.042593955993652344, 0.045680999755859375, 0.048768043518066406, 0.05185508728027344, 0.05494213104248047, 0.0580291748046875, 0.06111621856689453, 0.06420326232910156, 0.0672903060913086, 0.07037734985351562, 0.07346439361572266, 0.07655143737792969, 0.07963848114013672, 0.08272552490234375, 0.08581256866455078, 0.08889961242675781, 0.09198665618896484, 0.09507369995117188, 0.0981607437133789, 0.10124778747558594, 0.10433483123779297, 0.107421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 17.0, 17.0, 42.0, 49.0, 73.0, 111.0, 155.0, 161.0, 135.0, 82.0, 59.0, 26.0, 23.0, 17.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6204460859298706, -1.5788004398345947, -1.5371546745300293, -1.4955090284347534, -1.4538633823394775, -1.4122177362442017, -1.3705719709396362, -1.3289263248443604, -1.2872806787490845, -1.2456350326538086, -1.2039892673492432, -1.1623436212539673, -1.1206979751586914, -1.0790523290634155, -1.03740656375885, -0.9957609176635742, -0.9541152119636536, -0.9124695062637329, -0.870823860168457, -0.8291781544685364, -0.7875325083732605, -0.7458868026733398, -0.704241156578064, -0.6625954508781433, -0.6209497451782227, -0.579304039478302, -0.5376583933830261, -0.49601268768310547, -0.4543670415878296, -0.41272133588790894, -0.37107565999031067, -0.3294299840927124, -0.2877843379974365, -0.24613866209983826, -0.20449298620224, -0.16284729540348053, -0.12120161950588226, -0.079555943608284, -0.037910252809524536, 0.0037354230880737305, 0.045381098985672, 0.08702677488327026, 0.12867245078086853, 0.170318141579628, 0.21196381747722626, 0.25360947847366333, 0.295255184173584, 0.33690086007118225, 0.3785465359687805, 0.4201922118663788, 0.46183788776397705, 0.5034835934638977, 0.5451292395591736, 0.5867749452590942, 0.6284205913543701, 0.6700662970542908, 0.7117120027542114, 0.7533577084541321, 0.795003354549408, 0.8366490602493286, 0.8782947063446045, 0.9199404120445251, 0.9615861177444458, 1.0032317638397217, 1.0448774099349976]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 2.0, 5.0, 10.0, 7.0, 16.0, 17.0, 17.0, 19.0, 21.0, 25.0, 20.0, 37.0, 31.0, 35.0, 43.0, 53.0, 43.0, 44.0, 49.0, 50.0, 51.0, 58.0, 47.0, 29.0, 33.0, 20.0, 28.0, 23.0, 26.0, 15.0, 23.0, 10.0, 13.0, 12.0, 11.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.834596574306488, -0.8115134835243225, -0.788430392742157, -0.7653473019599915, -0.7422642111778259, -0.7191811203956604, -0.6960979700088501, -0.6730148792266846, -0.649931788444519, -0.6268486976623535, -0.603765606880188, -0.5806825160980225, -0.5575994253158569, -0.5345163345336914, -0.5114332437515259, -0.48835012316703796, -0.4652670621871948, -0.4421839714050293, -0.41910088062286377, -0.39601778984069824, -0.3729346990585327, -0.3498516082763672, -0.3267684876918793, -0.30368539690971375, -0.2806023061275482, -0.2575192153453827, -0.23443612456321716, -0.21135301887989044, -0.18826992809772491, -0.1651868373155594, -0.14210373163223267, -0.11902064085006714, -0.09593760967254639, -0.07285451889038086, -0.049771420657634735, -0.02668832242488861, -0.0036052316427230835, 0.019477859139442444, 0.042560964822769165, 0.06564405560493469, 0.08872714638710022, 0.11181023716926575, 0.13489332795143127, 0.157976433634758, 0.18105952441692352, 0.20414261519908905, 0.22722572088241577, 0.2503088116645813, 0.2733919024467468, 0.29647499322891235, 0.3195580840110779, 0.3426411747932434, 0.36572426557540894, 0.38880735635757446, 0.4118904769420624, 0.4349735677242279, 0.45805665850639343, 0.48113974928855896, 0.5042228698730469, 0.5273059606552124, 0.5503890514373779, 0.5734721422195435, 0.596555233001709, 0.6196383237838745, 0.64272141456604]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 24.0, 27.0, 36.0, 89.0, 142.0, 224.0, 392.0, 735.0, 1417.0, 3398.0, 10741.0, 49887.0, 2565261.0, 1497441.0, 46888.0, 10646.0, 3518.0, 1538.0, 790.0, 416.0, 243.0, 143.0, 96.0, 58.0, 31.0, 26.0, 19.0, 8.0, 9.0, 6.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.286865234375, -0.27889442443847656, -0.2709236145019531, -0.2629528045654297, -0.25498199462890625, -0.2470111846923828, -0.23904037475585938, -0.23106956481933594, -0.2230987548828125, -0.21512794494628906, -0.20715713500976562, -0.1991863250732422, -0.19121551513671875, -0.1832447052001953, -0.17527389526367188, -0.16730308532714844, -0.159332275390625, -0.15136146545410156, -0.14339065551757812, -0.1354198455810547, -0.12744903564453125, -0.11947822570800781, -0.11150741577148438, -0.10353660583496094, -0.0955657958984375, -0.08759498596191406, -0.07962417602539062, -0.07165336608886719, -0.06368255615234375, -0.05571174621582031, -0.047740936279296875, -0.03977012634277344, -0.03179931640625, -0.023828506469726562, -0.015857696533203125, -0.007886886596679688, 8.392333984375e-05, 0.008054733276367188, 0.016025543212890625, 0.023996353149414062, 0.0319671630859375, 0.03993797302246094, 0.047908782958984375, 0.05587959289550781, 0.06385040283203125, 0.07182121276855469, 0.07979202270507812, 0.08776283264160156, 0.095733642578125, 0.10370445251464844, 0.11167526245117188, 0.11964607238769531, 0.12761688232421875, 0.1355876922607422, 0.14355850219726562, 0.15152931213378906, 0.1595001220703125, 0.16747093200683594, 0.17544174194335938, 0.1834125518798828, 0.19138336181640625, 0.1993541717529297, 0.20732498168945312, 0.21529579162597656, 0.2232666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 18.0, 23.0, 24.0, 30.0, 47.0, 79.0, 68.0, 87.0, 86.0, 82.0, 75.0, 81.0, 75.0, 57.0, 34.0, 30.0, 31.0, 13.0, 15.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.048645973205566406, -0.04715156555175781, -0.04565715789794922, -0.044162750244140625, -0.04266834259033203, -0.04117393493652344, -0.039679527282714844, -0.03818511962890625, -0.036690711975097656, -0.03519630432128906, -0.03370189666748047, -0.032207489013671875, -0.03071308135986328, -0.029218673706054688, -0.027724266052246094, -0.0262298583984375, -0.024735450744628906, -0.023241043090820312, -0.02174663543701172, -0.020252227783203125, -0.01875782012939453, -0.017263412475585938, -0.015769004821777344, -0.01427459716796875, -0.012780189514160156, -0.011285781860351562, -0.009791374206542969, -0.008296966552734375, -0.006802558898925781, -0.0053081512451171875, -0.0038137435913085938, -0.0023193359375, -0.0008249282836914062, 0.0006694793701171875, 0.0021638870239257812, 0.003658294677734375, 0.005152702331542969, 0.0066471099853515625, 0.008141517639160156, 0.00963592529296875, 0.011130332946777344, 0.012624740600585938, 0.014119148254394531, 0.015613555908203125, 0.01710796356201172, 0.018602371215820312, 0.020096778869628906, 0.0215911865234375, 0.023085594177246094, 0.024580001831054688, 0.02607440948486328, 0.027568817138671875, 0.02906322479248047, 0.030557632446289062, 0.032052040100097656, 0.03354644775390625, 0.035040855407714844, 0.03653526306152344, 0.03802967071533203, 0.039524078369140625, 0.04101848602294922, 0.04251289367675781, 0.044007301330566406, 0.045501708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 9.0, 9.0, 11.0, 21.0, 17.0, 37.0, 53.0, 67.0, 109.0, 152.0, 296.0, 514.0, 1062.0, 2448.0, 7246.0, 31867.0, 283341.0, 3710269.0, 128691.0, 19264.0, 5036.0, 1842.0, 800.0, 421.0, 264.0, 133.0, 86.0, 64.0, 36.0, 32.0, 29.0, 18.0, 10.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.23976898193359375, -0.2310028076171875, -0.22223663330078125, -0.213470458984375, -0.20470428466796875, -0.1959381103515625, -0.18717193603515625, -0.17840576171875, -0.16963958740234375, -0.1608734130859375, -0.15210723876953125, -0.143341064453125, -0.13457489013671875, -0.1258087158203125, -0.11704254150390625, -0.1082763671875, -0.09951019287109375, -0.0907440185546875, -0.08197784423828125, -0.073211669921875, -0.06444549560546875, -0.0556793212890625, -0.04691314697265625, -0.03814697265625, -0.02938079833984375, -0.0206146240234375, -0.01184844970703125, -0.003082275390625, 0.00568389892578125, 0.0144500732421875, 0.02321624755859375, 0.031982421875, 0.04074859619140625, 0.0495147705078125, 0.05828094482421875, 0.067047119140625, 0.07581329345703125, 0.0845794677734375, 0.09334564208984375, 0.10211181640625, 0.11087799072265625, 0.1196441650390625, 0.12841033935546875, 0.137176513671875, 0.14594268798828125, 0.1547088623046875, 0.16347503662109375, 0.1722412109375, 0.18100738525390625, 0.1897735595703125, 0.19853973388671875, 0.207305908203125, 0.21607208251953125, 0.2248382568359375, 0.23360443115234375, 0.24237060546875, 0.25113677978515625, 0.2599029541015625, 0.26866912841796875, 0.277435302734375, 0.28620147705078125, 0.2949676513671875, 0.30373382568359375, 0.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 8.0, 10.0, 35.0, 44.0, 74.0, 156.0, 383.0, 2331.0, 609.0, 178.0, 107.0, 68.0, 25.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13791370391845703, -0.13434791564941406, -0.1307821273803711, -0.12721633911132812, -0.12365055084228516, -0.12008476257324219, -0.11651897430419922, -0.11295318603515625, -0.10938739776611328, -0.10582160949707031, -0.10225582122802734, -0.09869003295898438, -0.0951242446899414, -0.09155845642089844, -0.08799266815185547, -0.0844268798828125, -0.08086109161376953, -0.07729530334472656, -0.0737295150756836, -0.07016372680664062, -0.06659793853759766, -0.06303215026855469, -0.05946636199951172, -0.05590057373046875, -0.05233478546142578, -0.04876899719238281, -0.045203208923339844, -0.041637420654296875, -0.038071632385253906, -0.03450584411621094, -0.03094005584716797, -0.027374267578125, -0.02380847930908203, -0.020242691040039062, -0.016676902770996094, -0.013111114501953125, -0.009545326232910156, -0.0059795379638671875, -0.0024137496948242188, 0.00115203857421875, 0.004717826843261719, 0.008283615112304688, 0.011849403381347656, 0.015415191650390625, 0.018980979919433594, 0.022546768188476562, 0.02611255645751953, 0.0296783447265625, 0.03324413299560547, 0.03680992126464844, 0.040375709533691406, 0.043941497802734375, 0.047507286071777344, 0.05107307434082031, 0.05463886260986328, 0.05820465087890625, 0.06177043914794922, 0.06533622741699219, 0.06890201568603516, 0.07246780395507812, 0.0760335922241211, 0.07959938049316406, 0.08316516876220703, 0.08673095703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 17.0, 15.0, 40.0, 60.0, 89.0, 117.0, 162.0, 144.0, 111.0, 98.0, 68.0, 28.0, 11.0, 15.0, 10.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5916775465011597, -0.5743805766105652, -0.5570836663246155, -0.539786696434021, -0.5224897861480713, -0.5051928162574768, -0.4878958463668823, -0.47059890627861023, -0.45330196619033813, -0.43600502610206604, -0.41870808601379395, -0.40141111612319946, -0.38411417603492737, -0.3668172359466553, -0.3495202660560608, -0.3322233259677887, -0.3149263858795166, -0.2976294457912445, -0.2803325057029724, -0.26303553581237793, -0.24573859572410583, -0.22844165563583374, -0.21114470064640045, -0.19384774565696716, -0.17655080556869507, -0.15925386548042297, -0.14195691049098969, -0.124659962952137, -0.1073630154132843, -0.09006606787443161, -0.07276912033557892, -0.05547217279672623, -0.03817516565322876, -0.020878218114376068, -0.0035812705755233765, 0.013715676963329315, 0.031012624502182007, 0.0483095720410347, 0.06560651957988739, 0.08290346711874008, 0.10020041465759277, 0.11749736219644547, 0.13479430973529816, 0.15209126472473145, 0.16938820481300354, 0.18668514490127563, 0.20398209989070892, 0.2212790548801422, 0.2385759949684143, 0.2558729350566864, 0.2731698751449585, 0.290466845035553, 0.3077637851238251, 0.32506072521209717, 0.34235769510269165, 0.35965463519096375, 0.37695157527923584, 0.39424851536750793, 0.41154545545578003, 0.4288424253463745, 0.4461393654346466, 0.4634363055229187, 0.4807332754135132, 0.4980302155017853, 0.5153271555900574]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 5.0, 9.0, 10.0, 9.0, 11.0, 13.0, 12.0, 22.0, 38.0, 31.0, 26.0, 27.0, 31.0, 36.0, 43.0, 43.0, 45.0, 26.0, 47.0, 35.0, 49.0, 41.0, 42.0, 46.0, 32.0, 40.0, 37.0, 41.0, 23.0, 22.0, 13.0, 17.0, 11.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25157982110977173, -0.24420452117919922, -0.2368292212486267, -0.2294539213180542, -0.2220786213874817, -0.21470332145690918, -0.20732800662517548, -0.19995270669460297, -0.19257740676403046, -0.18520210683345795, -0.17782680690288544, -0.17045150697231293, -0.16307619214057922, -0.1557008922100067, -0.1483255922794342, -0.1409502923488617, -0.13357499241828918, -0.12619969248771667, -0.11882439255714417, -0.11144908517599106, -0.10407378524541855, -0.09669848531484604, -0.08932317793369293, -0.08194787800312042, -0.07457257807254791, -0.0671972781419754, -0.059821974486112595, -0.052446670830249786, -0.04507137089967728, -0.03769607096910477, -0.03032076731324196, -0.02294546365737915, -0.01557016372680664, -0.008194861933588982, -0.0008195601403713226, 0.006555741652846336, 0.013931043446063995, 0.021306343376636505, 0.028681647032499313, 0.03605695068836212, 0.04343225061893463, 0.05080755054950714, 0.05818285420536995, 0.06555815786123276, 0.07293345779180527, 0.08030875772237778, 0.08768406510353088, 0.0950593650341034, 0.1024346649646759, 0.10980996489524841, 0.11718526482582092, 0.12456057220697403, 0.13193586468696594, 0.13931116461753845, 0.14668647944927216, 0.15406177937984467, 0.16143707931041718, 0.16881237924098969, 0.1761876791715622, 0.1835629791021347, 0.1909382939338684, 0.19831359386444092, 0.20568889379501343, 0.21306419372558594, 0.22043949365615845]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 8.0, 15.0, 20.0, 20.0, 34.0, 52.0, 68.0, 106.0, 175.0, 289.0, 433.0, 764.0, 1373.0, 2550.0, 5088.0, 10433.0, 23842.0, 59217.0, 156533.0, 389954.0, 244034.0, 89509.0, 34881.0, 14815.0, 6811.0, 3336.0, 1723.0, 1022.0, 551.0, 285.0, 199.0, 145.0, 81.0, 49.0, 38.0, 27.0, 13.0, 18.0, 11.0, 3.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1456298828125, -0.14055824279785156, -0.13548660278320312, -0.1304149627685547, -0.12534332275390625, -0.12027168273925781, -0.11520004272460938, -0.11012840270996094, -0.1050567626953125, -0.09998512268066406, -0.09491348266601562, -0.08984184265136719, -0.08477020263671875, -0.07969856262207031, -0.07462692260742188, -0.06955528259277344, -0.064483642578125, -0.05941200256347656, -0.054340362548828125, -0.04926872253417969, -0.04419708251953125, -0.03912544250488281, -0.034053802490234375, -0.028982162475585938, -0.0239105224609375, -0.018838882446289062, -0.013767242431640625, -0.008695602416992188, -0.00362396240234375, 0.0014476776123046875, 0.006519317626953125, 0.011590957641601562, 0.01666259765625, 0.021734237670898438, 0.026805877685546875, 0.03187751770019531, 0.03694915771484375, 0.04202079772949219, 0.047092437744140625, 0.05216407775878906, 0.0572357177734375, 0.06230735778808594, 0.06737899780273438, 0.07245063781738281, 0.07752227783203125, 0.08259391784667969, 0.08766555786132812, 0.09273719787597656, 0.097808837890625, 0.10288047790527344, 0.10795211791992188, 0.11302375793457031, 0.11809539794921875, 0.12316703796386719, 0.12823867797851562, 0.13331031799316406, 0.1383819580078125, 0.14345359802246094, 0.14852523803710938, 0.1535968780517578, 0.15866851806640625, 0.1637401580810547, 0.16881179809570312, 0.17388343811035156, 0.178955078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 8.0, 21.0, 31.0, 34.0, 37.0, 55.0, 67.0, 58.0, 78.0, 84.0, 73.0, 71.0, 73.0, 53.0, 53.0, 48.0, 37.0, 28.0, 24.0, 16.0, 11.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04705810546875, -0.045607566833496094, -0.04415702819824219, -0.04270648956298828, -0.041255950927734375, -0.03980541229248047, -0.03835487365722656, -0.036904335021972656, -0.03545379638671875, -0.034003257751464844, -0.03255271911621094, -0.03110218048095703, -0.029651641845703125, -0.02820110321044922, -0.026750564575195312, -0.025300025939941406, -0.0238494873046875, -0.022398948669433594, -0.020948410034179688, -0.01949787139892578, -0.018047332763671875, -0.01659679412841797, -0.015146255493164062, -0.013695716857910156, -0.01224517822265625, -0.010794639587402344, -0.009344100952148438, -0.007893562316894531, -0.006443023681640625, -0.004992485046386719, -0.0035419464111328125, -0.0020914077758789062, -0.000640869140625, 0.0008096694946289062, 0.0022602081298828125, 0.0037107467651367188, 0.005161285400390625, 0.006611824035644531, 0.008062362670898438, 0.009512901306152344, 0.01096343994140625, 0.012413978576660156, 0.013864517211914062, 0.015315055847167969, 0.016765594482421875, 0.01821613311767578, 0.019666671752929688, 0.021117210388183594, 0.0225677490234375, 0.024018287658691406, 0.025468826293945312, 0.02691936492919922, 0.028369903564453125, 0.02982044219970703, 0.03127098083496094, 0.032721519470214844, 0.03417205810546875, 0.035622596740722656, 0.03707313537597656, 0.03852367401123047, 0.039974212646484375, 0.04142475128173828, 0.04287528991699219, 0.044325828552246094, 0.0457763671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 10.0, 4.0, 11.0, 13.0, 13.0, 17.0, 25.0, 41.0, 71.0, 79.0, 128.0, 146.0, 246.0, 344.0, 589.0, 1089.0, 2063.0, 4242.0, 9920.0, 25412.0, 71432.0, 212906.0, 424781.0, 190478.0, 63769.0, 23199.0, 9085.0, 3919.0, 1767.0, 989.0, 612.0, 372.0, 226.0, 156.0, 117.0, 81.0, 60.0, 44.0, 24.0, 21.0, 20.0, 15.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.12974929809570312, -0.12534332275390625, -0.12093734741210938, -0.1165313720703125, -0.11212539672851562, -0.10771942138671875, -0.10331344604492188, -0.098907470703125, -0.09450149536132812, -0.09009552001953125, -0.08568954467773438, -0.0812835693359375, -0.07687759399414062, -0.07247161865234375, -0.06806564331054688, -0.06365966796875, -0.059253692626953125, -0.05484771728515625, -0.050441741943359375, -0.0460357666015625, -0.041629791259765625, -0.03722381591796875, -0.032817840576171875, -0.028411865234375, -0.024005889892578125, -0.01959991455078125, -0.015193939208984375, -0.0107879638671875, -0.006381988525390625, -0.00197601318359375, 0.002429962158203125, 0.0068359375, 0.011241912841796875, 0.01564788818359375, 0.020053863525390625, 0.0244598388671875, 0.028865814208984375, 0.03327178955078125, 0.037677764892578125, 0.042083740234375, 0.046489715576171875, 0.05089569091796875, 0.055301666259765625, 0.0597076416015625, 0.06411361694335938, 0.06851959228515625, 0.07292556762695312, 0.07733154296875, 0.08173751831054688, 0.08614349365234375, 0.09054946899414062, 0.0949554443359375, 0.09936141967773438, 0.10376739501953125, 0.10817337036132812, 0.112579345703125, 0.11698532104492188, 0.12139129638671875, 0.12579727172851562, 0.1302032470703125, 0.13460922241210938, 0.13901519775390625, 0.14342117309570312, 0.1478271484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 9.0, 10.0, 14.0, 15.0, 29.0, 18.0, 22.0, 25.0, 27.0, 37.0, 32.0, 20.0, 31.0, 37.0, 44.0, 40.0, 48.0, 47.0, 39.0, 36.0, 39.0, 27.0, 39.0, 36.0, 24.0, 22.0, 20.0, 23.0, 28.0, 21.0, 22.0, 12.0, 13.0, 9.0, 14.0, 10.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 4.0], "bins": [-0.1370849609375, -0.13332366943359375, -0.1295623779296875, -0.12580108642578125, -0.122039794921875, -0.11827850341796875, -0.1145172119140625, -0.11075592041015625, -0.10699462890625, -0.10323333740234375, -0.0994720458984375, -0.09571075439453125, -0.091949462890625, -0.08818817138671875, -0.0844268798828125, -0.08066558837890625, -0.076904296875, -0.07314300537109375, -0.0693817138671875, -0.06562042236328125, -0.061859130859375, -0.05809783935546875, -0.0543365478515625, -0.05057525634765625, -0.04681396484375, -0.04305267333984375, -0.0392913818359375, -0.03553009033203125, -0.031768798828125, -0.02800750732421875, -0.0242462158203125, -0.02048492431640625, -0.0167236328125, -0.01296234130859375, -0.0092010498046875, -0.00543975830078125, -0.001678466796875, 0.00208282470703125, 0.0058441162109375, 0.00960540771484375, 0.01336669921875, 0.01712799072265625, 0.0208892822265625, 0.02465057373046875, 0.028411865234375, 0.03217315673828125, 0.0359344482421875, 0.03969573974609375, 0.04345703125, 0.04721832275390625, 0.0509796142578125, 0.05474090576171875, 0.058502197265625, 0.06226348876953125, 0.0660247802734375, 0.06978607177734375, 0.07354736328125, 0.07730865478515625, 0.0810699462890625, 0.08483123779296875, 0.088592529296875, 0.09235382080078125, 0.0961151123046875, 0.09987640380859375, 0.1036376953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 6.0, 17.0, 14.0, 25.0, 38.0, 65.0, 94.0, 151.0, 267.0, 512.0, 1005.0, 2017.0, 4531.0, 10589.0, 28232.0, 88856.0, 331504.0, 408122.0, 114465.0, 34774.0, 12975.0, 5323.0, 2386.0, 1205.0, 601.0, 320.0, 191.0, 87.0, 66.0, 39.0, 30.0, 14.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09196853637695312, -0.08927154541015625, -0.08657455444335938, -0.0838775634765625, -0.08118057250976562, -0.07848358154296875, -0.07578659057617188, -0.073089599609375, -0.07039260864257812, -0.06769561767578125, -0.06499862670898438, -0.0623016357421875, -0.059604644775390625, -0.05690765380859375, -0.054210662841796875, -0.051513671875, -0.048816680908203125, -0.04611968994140625, -0.043422698974609375, -0.0407257080078125, -0.038028717041015625, -0.03533172607421875, -0.032634735107421875, -0.029937744140625, -0.027240753173828125, -0.02454376220703125, -0.021846771240234375, -0.0191497802734375, -0.016452789306640625, -0.01375579833984375, -0.011058807373046875, -0.00836181640625, -0.005664825439453125, -0.00296783447265625, -0.000270843505859375, 0.0024261474609375, 0.005123138427734375, 0.00782012939453125, 0.010517120361328125, 0.013214111328125, 0.015911102294921875, 0.01860809326171875, 0.021305084228515625, 0.0240020751953125, 0.026699066162109375, 0.02939605712890625, 0.032093048095703125, 0.0347900390625, 0.037487030029296875, 0.04018402099609375, 0.042881011962890625, 0.0455780029296875, 0.048274993896484375, 0.05097198486328125, 0.053668975830078125, 0.056365966796875, 0.059062957763671875, 0.06175994873046875, 0.06445693969726562, 0.0671539306640625, 0.06985092163085938, 0.07254791259765625, 0.07524490356445312, 0.07794189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 7.0, 12.0, 22.0, 24.0, 28.0, 25.0, 30.0, 47.0, 49.0, 58.0, 61.0, 74.0, 53.0, 58.0, 66.0, 69.0, 50.0, 29.0, 28.0, 26.0, 27.0, 22.0, 25.0, 13.0, 11.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-05, -2.2427178919315338e-05, -2.1608546376228333e-05, -2.0789913833141327e-05, -1.997128129005432e-05, -1.9152648746967316e-05, -1.833401620388031e-05, -1.7515383660793304e-05, -1.66967511177063e-05, -1.5878118574619293e-05, -1.5059486031532288e-05, -1.4240853488445282e-05, -1.3422220945358276e-05, -1.260358840227127e-05, -1.1784955859184265e-05, -1.096632331609726e-05, -1.0147690773010254e-05, -9.329058229923248e-06, -8.510425686836243e-06, -7.691793143749237e-06, -6.8731606006622314e-06, -6.054528057575226e-06, -5.23589551448822e-06, -4.417262971401215e-06, -3.598630428314209e-06, -2.7799978852272034e-06, -1.9613653421401978e-06, -1.1427327990531921e-06, -3.241002559661865e-07, 4.945322871208191e-07, 1.3131648302078247e-06, 2.1317973732948303e-06, 2.950429916381836e-06, 3.7690624594688416e-06, 4.587695002555847e-06, 5.406327545642853e-06, 6.224960088729858e-06, 7.043592631816864e-06, 7.86222517490387e-06, 8.680857717990875e-06, 9.499490261077881e-06, 1.0318122804164886e-05, 1.1136755347251892e-05, 1.1955387890338898e-05, 1.2774020433425903e-05, 1.3592652976512909e-05, 1.4411285519599915e-05, 1.522991806268692e-05, 1.6048550605773926e-05, 1.686718314886093e-05, 1.7685815691947937e-05, 1.8504448235034943e-05, 1.9323080778121948e-05, 2.0141713321208954e-05, 2.096034586429596e-05, 2.1778978407382965e-05, 2.259761095046997e-05, 2.3416243493556976e-05, 2.4234876036643982e-05, 2.5053508579730988e-05, 2.5872141122817993e-05, 2.6690773665905e-05, 2.7509406208992004e-05, 2.832803875207901e-05, 2.9146671295166016e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 16.0, 27.0, 29.0, 51.0, 60.0, 106.0, 178.0, 298.0, 527.0, 958.0, 1897.0, 4298.0, 10687.0, 30707.0, 111962.0, 443395.0, 328322.0, 77061.0, 22753.0, 8177.0, 3413.0, 1654.0, 808.0, 424.0, 238.0, 162.0, 109.0, 70.0, 50.0, 25.0, 20.0, 21.0, 8.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07940673828125, -0.07655715942382812, -0.07370758056640625, -0.07085800170898438, -0.0680084228515625, -0.06515884399414062, -0.06230926513671875, -0.059459686279296875, -0.056610107421875, -0.053760528564453125, -0.05091094970703125, -0.048061370849609375, -0.0452117919921875, -0.042362213134765625, -0.03951263427734375, -0.036663055419921875, -0.0338134765625, -0.030963897705078125, -0.02811431884765625, -0.025264739990234375, -0.0224151611328125, -0.019565582275390625, -0.01671600341796875, -0.013866424560546875, -0.011016845703125, -0.008167266845703125, -0.00531768798828125, -0.002468109130859375, 0.0003814697265625, 0.003231048583984375, 0.00608062744140625, 0.008930206298828125, 0.01177978515625, 0.014629364013671875, 0.01747894287109375, 0.020328521728515625, 0.0231781005859375, 0.026027679443359375, 0.02887725830078125, 0.031726837158203125, 0.034576416015625, 0.037425994873046875, 0.04027557373046875, 0.043125152587890625, 0.0459747314453125, 0.048824310302734375, 0.05167388916015625, 0.054523468017578125, 0.057373046875, 0.060222625732421875, 0.06307220458984375, 0.06592178344726562, 0.0687713623046875, 0.07162094116210938, 0.07447052001953125, 0.07732009887695312, 0.080169677734375, 0.08301925659179688, 0.08586883544921875, 0.08871841430664062, 0.0915679931640625, 0.09441757202148438, 0.09726715087890625, 0.10011672973632812, 0.10296630859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 8.0, 12.0, 17.0, 18.0, 20.0, 23.0, 45.0, 40.0, 62.0, 53.0, 49.0, 58.0, 63.0, 77.0, 59.0, 61.0, 54.0, 46.0, 41.0, 32.0, 33.0, 24.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06341552734375, -0.06151771545410156, -0.059619903564453125, -0.05772209167480469, -0.05582427978515625, -0.05392646789550781, -0.052028656005859375, -0.05013084411621094, -0.0482330322265625, -0.04633522033691406, -0.044437408447265625, -0.04253959655761719, -0.04064178466796875, -0.03874397277832031, -0.036846160888671875, -0.03494834899902344, -0.033050537109375, -0.031152725219726562, -0.029254913330078125, -0.027357101440429688, -0.02545928955078125, -0.023561477661132812, -0.021663665771484375, -0.019765853881835938, -0.0178680419921875, -0.015970230102539062, -0.014072418212890625, -0.012174606323242188, -0.01027679443359375, -0.008378982543945312, -0.006481170654296875, -0.0045833587646484375, -0.002685546875, -0.0007877349853515625, 0.001110076904296875, 0.0030078887939453125, 0.00490570068359375, 0.0068035125732421875, 0.008701324462890625, 0.010599136352539062, 0.0124969482421875, 0.014394760131835938, 0.016292572021484375, 0.018190383911132812, 0.02008819580078125, 0.021986007690429688, 0.023883819580078125, 0.025781631469726562, 0.027679443359375, 0.029577255249023438, 0.031475067138671875, 0.03337287902832031, 0.03527069091796875, 0.03716850280761719, 0.039066314697265625, 0.04096412658691406, 0.0428619384765625, 0.04475975036621094, 0.046657562255859375, 0.04855537414550781, 0.05045318603515625, 0.05235099792480469, 0.054248809814453125, 0.05614662170410156, 0.05804443359375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 20.0, 32.0, 60.0, 94.0, 111.0, 162.0, 147.0, 127.0, 91.0, 70.0, 33.0, 20.0, 9.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5653105974197388, -1.519366979598999, -1.4734232425689697, -1.4274795055389404, -1.3815358877182007, -1.335592269897461, -1.2896485328674316, -1.2437047958374023, -1.1977611780166626, -1.1518175601959229, -1.1058738231658936, -1.0599300861358643, -1.0139864683151245, -0.96804279088974, -0.9220991134643555, -0.876155436038971, -0.8302117586135864, -0.7842680811882019, -0.7383244037628174, -0.6923807263374329, -0.6464370489120483, -0.6004933714866638, -0.5545496940612793, -0.5086060166358948, -0.46266233921051025, -0.41671866178512573, -0.3707749843597412, -0.3248313069343567, -0.27888762950897217, -0.23294395208358765, -0.18700027465820312, -0.1410565972328186, -0.09511303901672363, -0.04916936159133911, -0.00322568416595459, 0.04271799325942993, 0.08866167068481445, 0.13460534811019897, 0.1805490255355835, 0.22649270296096802, 0.27243638038635254, 0.31838005781173706, 0.3643237352371216, 0.4102674126625061, 0.4562110900878906, 0.5021547675132751, 0.5480984449386597, 0.5940421223640442, 0.6399857997894287, 0.6859294772148132, 0.7318731546401978, 0.7778168320655823, 0.8237605094909668, 0.8697041869163513, 0.9156478643417358, 0.9615915417671204, 1.0075352191925049, 1.0534789562225342, 1.099422574043274, 1.1453661918640137, 1.191309928894043, 1.2372536659240723, 1.283197283744812, 1.3291409015655518, 1.375084638595581]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 14.0, 23.0, 24.0, 35.0, 35.0, 36.0, 36.0, 36.0, 48.0, 49.0, 51.0, 47.0, 48.0, 41.0, 46.0, 47.0, 34.0, 34.0, 34.0, 34.0, 32.0, 29.0, 23.0, 20.0, 13.0, 14.0, 9.0, 7.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8134320974349976, -0.7879867553710938, -0.7625414133071899, -0.7370960712432861, -0.7116507291793823, -0.6862053871154785, -0.6607600450515747, -0.6353147029876709, -0.6098693609237671, -0.5844240188598633, -0.5589786767959595, -0.5335333347320557, -0.5080879926681519, -0.48264265060424805, -0.4571973383426666, -0.4317519962787628, -0.4063066840171814, -0.3808613419532776, -0.3554159998893738, -0.32997065782546997, -0.30452531576156616, -0.27907997369766235, -0.25363466143608093, -0.22818931937217712, -0.20274397730827332, -0.1772986352443695, -0.1518532931804657, -0.12640796601772308, -0.10096262395381927, -0.07551728188991547, -0.05007195472717285, -0.024626612663269043, 0.000818789005279541, 0.02626412734389305, 0.05170946568250656, 0.07715480029582977, 0.10260014235973358, 0.1280454844236374, 0.15349081158638, 0.1789361536502838, 0.20438149571418762, 0.22982683777809143, 0.25527217984199524, 0.28071749210357666, 0.30616283416748047, 0.3316081762313843, 0.3570535182952881, 0.3824988603591919, 0.4079442024230957, 0.4333895444869995, 0.4588348865509033, 0.48428022861480713, 0.5097255706787109, 0.5351709127426147, 0.5606162548065186, 0.5860615968704224, 0.6115069389343262, 0.63695228099823, 0.6623976230621338, 0.6878429651260376, 0.7132883071899414, 0.7387336492538452, 0.764178991317749, 0.7896243333816528, 0.8150696158409119]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 18.0, 16.0, 27.0, 36.0, 55.0, 85.0, 142.0, 237.0, 389.0, 664.0, 1113.0, 2017.0, 3946.0, 8124.0, 18769.0, 53958.0, 266129.0, 3533598.0, 222291.0, 48472.0, 17263.0, 7733.0, 3820.0, 2037.0, 1126.0, 746.0, 474.0, 294.0, 208.0, 130.0, 77.0, 78.0, 60.0, 33.0, 21.0, 23.0, 18.0, 8.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.1678466796875, -0.16283035278320312, -0.15781402587890625, -0.15279769897460938, -0.1477813720703125, -0.14276504516601562, -0.13774871826171875, -0.13273239135742188, -0.127716064453125, -0.12269973754882812, -0.11768341064453125, -0.11266708374023438, -0.1076507568359375, -0.10263442993164062, -0.09761810302734375, -0.09260177612304688, -0.08758544921875, -0.08256912231445312, -0.07755279541015625, -0.07253646850585938, -0.0675201416015625, -0.06250381469726562, -0.05748748779296875, -0.052471160888671875, -0.047454833984375, -0.042438507080078125, -0.03742218017578125, -0.032405853271484375, -0.0273895263671875, -0.022373199462890625, -0.01735687255859375, -0.012340545654296875, -0.00732421875, -0.002307891845703125, 0.00270843505859375, 0.007724761962890625, 0.0127410888671875, 0.017757415771484375, 0.02277374267578125, 0.027790069580078125, 0.032806396484375, 0.037822723388671875, 0.04283905029296875, 0.047855377197265625, 0.0528717041015625, 0.057888031005859375, 0.06290435791015625, 0.06792068481445312, 0.07293701171875, 0.07795333862304688, 0.08296966552734375, 0.08798599243164062, 0.0930023193359375, 0.09801864624023438, 0.10303497314453125, 0.10805130004882812, 0.113067626953125, 0.11808395385742188, 0.12310028076171875, 0.12811660766601562, 0.1331329345703125, 0.13814926147460938, 0.14316558837890625, 0.14818191528320312, 0.1531982421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 11.0, 8.0, 15.0, 25.0, 37.0, 33.0, 68.0, 59.0, 67.0, 67.0, 91.0, 69.0, 67.0, 61.0, 71.0, 41.0, 55.0, 39.0, 25.0, 21.0, 15.0, 8.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.04212760925292969, -0.040645599365234375, -0.03916358947753906, -0.03768157958984375, -0.03619956970214844, -0.034717559814453125, -0.03323554992675781, -0.0317535400390625, -0.030271530151367188, -0.028789520263671875, -0.027307510375976562, -0.02582550048828125, -0.024343490600585938, -0.022861480712890625, -0.021379470825195312, -0.0198974609375, -0.018415451049804688, -0.016933441162109375, -0.015451431274414062, -0.01396942138671875, -0.012487411499023438, -0.011005401611328125, -0.009523391723632812, -0.0080413818359375, -0.0065593719482421875, -0.005077362060546875, -0.0035953521728515625, -0.00211334228515625, -0.0006313323974609375, 0.000850677490234375, 0.0023326873779296875, 0.003814697265625, 0.0052967071533203125, 0.006778717041015625, 0.008260726928710938, 0.00974273681640625, 0.011224746704101562, 0.012706756591796875, 0.014188766479492188, 0.0156707763671875, 0.017152786254882812, 0.018634796142578125, 0.020116806030273438, 0.02159881591796875, 0.023080825805664062, 0.024562835693359375, 0.026044845581054688, 0.02752685546875, 0.029008865356445312, 0.030490875244140625, 0.03197288513183594, 0.03345489501953125, 0.03493690490722656, 0.036418914794921875, 0.03790092468261719, 0.0393829345703125, 0.04086494445800781, 0.042346954345703125, 0.04382896423339844, 0.04531097412109375, 0.04679298400878906, 0.048274993896484375, 0.04975700378417969, 0.051239013671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 8.0, 9.0, 17.0, 23.0, 36.0, 49.0, 89.0, 128.0, 199.0, 334.0, 559.0, 958.0, 1670.0, 3036.0, 6347.0, 14384.0, 36850.0, 119816.0, 1028056.0, 2739306.0, 163639.0, 45781.0, 17267.0, 7518.0, 3621.0, 1919.0, 1029.0, 620.0, 369.0, 235.0, 153.0, 78.0, 61.0, 24.0, 32.0, 12.0, 13.0, 16.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.177734375, -0.17281150817871094, -0.16788864135742188, -0.1629657745361328, -0.15804290771484375, -0.1531200408935547, -0.14819717407226562, -0.14327430725097656, -0.1383514404296875, -0.13342857360839844, -0.12850570678710938, -0.12358283996582031, -0.11865997314453125, -0.11373710632324219, -0.10881423950195312, -0.10389137268066406, -0.098968505859375, -0.09404563903808594, -0.08912277221679688, -0.08419990539550781, -0.07927703857421875, -0.07435417175292969, -0.06943130493164062, -0.06450843811035156, -0.0595855712890625, -0.05466270446777344, -0.049739837646484375, -0.04481697082519531, -0.03989410400390625, -0.03497123718261719, -0.030048370361328125, -0.025125503540039062, -0.02020263671875, -0.015279769897460938, -0.010356903076171875, -0.0054340362548828125, -0.00051116943359375, 0.0044116973876953125, 0.009334564208984375, 0.014257431030273438, 0.0191802978515625, 0.024103164672851562, 0.029026031494140625, 0.03394889831542969, 0.03887176513671875, 0.04379463195800781, 0.048717498779296875, 0.05364036560058594, 0.058563232421875, 0.06348609924316406, 0.06840896606445312, 0.07333183288574219, 0.07825469970703125, 0.08317756652832031, 0.08810043334960938, 0.09302330017089844, 0.0979461669921875, 0.10286903381347656, 0.10779190063476562, 0.11271476745605469, 0.11763763427734375, 0.12256050109863281, 0.12748336791992188, 0.13240623474121094, 0.1373291015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 8.0, 9.0, 14.0, 9.0, 22.0, 28.0, 41.0, 56.0, 71.0, 145.0, 244.0, 674.0, 1650.0, 475.0, 206.0, 139.0, 64.0, 56.0, 41.0, 22.0, 24.0, 15.0, 12.0, 9.0, 5.0, 10.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09368896484375, -0.09118175506591797, -0.08867454528808594, -0.0861673355102539, -0.08366012573242188, -0.08115291595458984, -0.07864570617675781, -0.07613849639892578, -0.07363128662109375, -0.07112407684326172, -0.06861686706542969, -0.06610965728759766, -0.06360244750976562, -0.061095237731933594, -0.05858802795410156, -0.05608081817626953, -0.0535736083984375, -0.05106639862060547, -0.04855918884277344, -0.046051979064941406, -0.043544769287109375, -0.041037559509277344, -0.03853034973144531, -0.03602313995361328, -0.03351593017578125, -0.03100872039794922, -0.028501510620117188, -0.025994300842285156, -0.023487091064453125, -0.020979881286621094, -0.018472671508789062, -0.01596546173095703, -0.013458251953125, -0.010951042175292969, -0.008443832397460938, -0.005936622619628906, -0.003429412841796875, -0.0009222030639648438, 0.0015850067138671875, 0.004092216491699219, 0.00659942626953125, 0.009106636047363281, 0.011613845825195312, 0.014121055603027344, 0.016628265380859375, 0.019135475158691406, 0.021642684936523438, 0.02414989471435547, 0.0266571044921875, 0.02916431427001953, 0.03167152404785156, 0.034178733825683594, 0.036685943603515625, 0.039193153381347656, 0.04170036315917969, 0.04420757293701172, 0.04671478271484375, 0.04922199249267578, 0.05172920227050781, 0.054236412048339844, 0.056743621826171875, 0.059250831604003906, 0.06175804138183594, 0.06426525115966797, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 19.0, 11.0, 21.0, 39.0, 39.0, 78.0, 87.0, 94.0, 119.0, 114.0, 111.0, 83.0, 55.0, 38.0, 30.0, 20.0, 14.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5666863918304443, -0.5516281723976135, -0.5365700125694275, -0.5215117931365967, -0.5064535737037659, -0.49139538407325745, -0.476337194442749, -0.4612789750099182, -0.4462207853794098, -0.43116259574890137, -0.41610437631607056, -0.40104618668556213, -0.3859879970550537, -0.3709297776222229, -0.3558715879917145, -0.34081339836120605, -0.32575517892837524, -0.3106969892978668, -0.295638769865036, -0.2805805802345276, -0.2655223608016968, -0.25046417117118835, -0.23540598154067993, -0.22034777700901031, -0.2052895724773407, -0.19023136794567108, -0.17517316341400146, -0.16011497378349304, -0.14505676925182343, -0.1299985647201538, -0.11494036763906479, -0.09988217055797577, -0.08482396602630615, -0.06976576149463654, -0.054707564413547516, -0.0396493636071682, -0.02459116280078888, -0.009532958269119263, 0.005525238811969757, 0.020583435893058777, 0.035641640424728394, 0.05069984123110771, 0.06575804203748703, 0.08081623911857605, 0.09587444365024567, 0.11093264818191528, 0.1259908378124237, 0.14104904234409332, 0.15610724687576294, 0.17116545140743256, 0.18622365593910217, 0.2012818455696106, 0.2163400501012802, 0.23139825463294983, 0.24645644426345825, 0.26151466369628906, 0.2765728533267975, 0.2916310429573059, 0.3066892623901367, 0.32174745202064514, 0.33680564165115356, 0.3518638610839844, 0.3669220507144928, 0.3819802403450012, 0.39703845977783203]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 10.0, 9.0, 13.0, 19.0, 30.0, 33.0, 21.0, 34.0, 42.0, 45.0, 34.0, 40.0, 37.0, 48.0, 40.0, 40.0, 50.0, 44.0, 34.0, 44.0, 33.0, 54.0, 32.0, 21.0, 25.0, 24.0, 13.0, 20.0, 11.0, 12.0, 9.0, 6.0, 6.0, 11.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2719373106956482, -0.26371222734451294, -0.2554871439933777, -0.24726206064224243, -0.23903697729110718, -0.23081189393997192, -0.22258679568767548, -0.21436171233654022, -0.20613662898540497, -0.19791154563426971, -0.18968646228313446, -0.1814613789319992, -0.17323628067970276, -0.1650111973285675, -0.15678611397743225, -0.148561030626297, -0.14033594727516174, -0.1321108639240265, -0.12388578057289124, -0.11566068977117538, -0.10743560642004013, -0.09921052306890488, -0.09098543226718903, -0.08276034891605377, -0.07453526556491852, -0.06631018221378326, -0.05808509513735771, -0.04986000806093216, -0.041634924709796906, -0.03340984135866165, -0.0251847542822361, -0.016959667205810547, -0.008734583854675293, -0.0005094986408948898, 0.007715586572885513, 0.015940671786665916, 0.02416575700044632, 0.032390840351581573, 0.040615927428007126, 0.04884101450443268, 0.05706609785556793, 0.06529118120670319, 0.07351626455783844, 0.08174135535955429, 0.08996643871068954, 0.0981915220618248, 0.10641661286354065, 0.1146416962146759, 0.12286677956581116, 0.1310918629169464, 0.13931694626808167, 0.14754202961921692, 0.15576711297035217, 0.16399219632148743, 0.17221729457378387, 0.18044237792491913, 0.18866746127605438, 0.19689254462718964, 0.2051176279783249, 0.21334271132946014, 0.2215678095817566, 0.22979289293289185, 0.2380179762840271, 0.24624305963516235, 0.2544681429862976]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 13.0, 14.0, 21.0, 36.0, 65.0, 132.0, 220.0, 356.0, 761.0, 1626.0, 3701.0, 9836.0, 28742.0, 103420.0, 655218.0, 180032.0, 41640.0, 13604.0, 5064.0, 2061.0, 945.0, 491.0, 224.0, 113.0, 86.0, 42.0, 34.0, 22.0, 13.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24778366088867188, -0.24019622802734375, -0.23260879516601562, -0.2250213623046875, -0.21743392944335938, -0.20984649658203125, -0.20225906372070312, -0.194671630859375, -0.18708419799804688, -0.17949676513671875, -0.17190933227539062, -0.1643218994140625, -0.15673446655273438, -0.14914703369140625, -0.14155960083007812, -0.13397216796875, -0.12638473510742188, -0.11879730224609375, -0.11120986938476562, -0.1036224365234375, -0.09603500366210938, -0.08844757080078125, -0.08086013793945312, -0.073272705078125, -0.06568527221679688, -0.05809783935546875, -0.050510406494140625, -0.0429229736328125, -0.035335540771484375, -0.02774810791015625, -0.020160675048828125, -0.0125732421875, -0.004985809326171875, 0.00260162353515625, 0.010189056396484375, 0.0177764892578125, 0.025363922119140625, 0.03295135498046875, 0.040538787841796875, 0.048126220703125, 0.055713653564453125, 0.06330108642578125, 0.07088851928710938, 0.0784759521484375, 0.08606338500976562, 0.09365081787109375, 0.10123825073242188, 0.10882568359375, 0.11641311645507812, 0.12400054931640625, 0.13158798217773438, 0.1391754150390625, 0.14676284790039062, 0.15435028076171875, 0.16193771362304688, 0.169525146484375, 0.17711257934570312, 0.18470001220703125, 0.19228744506835938, 0.1998748779296875, 0.20746231079101562, 0.21504974365234375, 0.22263717651367188, 0.230224609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 9.0, 25.0, 22.0, 30.0, 54.0, 57.0, 86.0, 79.0, 87.0, 79.0, 85.0, 70.0, 71.0, 54.0, 47.0, 32.0, 28.0, 21.0, 10.0, 9.0, 9.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0537109375, -0.0520625114440918, -0.050414085388183594, -0.04876565933227539, -0.04711723327636719, -0.045468807220458984, -0.04382038116455078, -0.04217195510864258, -0.040523529052734375, -0.03887510299682617, -0.03722667694091797, -0.035578250885009766, -0.03392982482910156, -0.03228139877319336, -0.030632972717285156, -0.028984546661376953, -0.02733612060546875, -0.025687694549560547, -0.024039268493652344, -0.02239084243774414, -0.020742416381835938, -0.019093990325927734, -0.01744556427001953, -0.015797138214111328, -0.014148712158203125, -0.012500286102294922, -0.010851860046386719, -0.009203433990478516, -0.0075550079345703125, -0.005906581878662109, -0.004258155822753906, -0.002609729766845703, -0.0009613037109375, 0.0006871223449707031, 0.0023355484008789062, 0.003983974456787109, 0.0056324005126953125, 0.007280826568603516, 0.008929252624511719, 0.010577678680419922, 0.012226104736328125, 0.013874530792236328, 0.015522956848144531, 0.017171382904052734, 0.018819808959960938, 0.02046823501586914, 0.022116661071777344, 0.023765087127685547, 0.02541351318359375, 0.027061939239501953, 0.028710365295410156, 0.03035879135131836, 0.03200721740722656, 0.033655643463134766, 0.03530406951904297, 0.03695249557495117, 0.038600921630859375, 0.04024934768676758, 0.04189777374267578, 0.043546199798583984, 0.04519462585449219, 0.04684305191040039, 0.048491477966308594, 0.0501399040222168, 0.051788330078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 5.0, 9.0, 8.0, 11.0, 14.0, 26.0, 16.0, 36.0, 64.0, 105.0, 134.0, 196.0, 309.0, 564.0, 937.0, 1689.0, 3060.0, 6924.0, 18865.0, 68212.0, 492802.0, 368684.0, 56488.0, 16322.0, 6233.0, 3060.0, 1501.0, 877.0, 483.0, 307.0, 197.0, 120.0, 79.0, 55.0, 40.0, 39.0, 19.0, 13.0, 13.0, 7.0, 12.0, 1.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.2152099609375, -0.20922088623046875, -0.2032318115234375, -0.19724273681640625, -0.191253662109375, -0.18526458740234375, -0.1792755126953125, -0.17328643798828125, -0.16729736328125, -0.16130828857421875, -0.1553192138671875, -0.14933013916015625, -0.143341064453125, -0.13735198974609375, -0.1313629150390625, -0.12537384033203125, -0.119384765625, -0.11339569091796875, -0.1074066162109375, -0.10141754150390625, -0.095428466796875, -0.08943939208984375, -0.0834503173828125, -0.07746124267578125, -0.07147216796875, -0.06548309326171875, -0.0594940185546875, -0.05350494384765625, -0.047515869140625, -0.04152679443359375, -0.0355377197265625, -0.02954864501953125, -0.0235595703125, -0.01757049560546875, -0.0115814208984375, -0.00559234619140625, 0.000396728515625, 0.00638580322265625, 0.0123748779296875, 0.01836395263671875, 0.02435302734375, 0.03034210205078125, 0.0363311767578125, 0.04232025146484375, 0.048309326171875, 0.05429840087890625, 0.0602874755859375, 0.06627655029296875, 0.072265625, 0.07825469970703125, 0.0842437744140625, 0.09023284912109375, 0.096221923828125, 0.10221099853515625, 0.1082000732421875, 0.11418914794921875, 0.12017822265625, 0.12616729736328125, 0.1321563720703125, 0.13814544677734375, 0.144134521484375, 0.15012359619140625, 0.1561126708984375, 0.16210174560546875, 0.1680908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 1.0, 7.0, 10.0, 10.0, 20.0, 21.0, 19.0, 24.0, 28.0, 48.0, 44.0, 51.0, 52.0, 64.0, 70.0, 63.0, 66.0, 57.0, 50.0, 44.0, 52.0, 38.0, 35.0, 32.0, 23.0, 21.0, 10.0, 8.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.15790748596191406, -0.15211868286132812, -0.1463298797607422, -0.14054107666015625, -0.1347522735595703, -0.12896347045898438, -0.12317466735839844, -0.1173858642578125, -0.11159706115722656, -0.10580825805664062, -0.10001945495605469, -0.09423065185546875, -0.08844184875488281, -0.08265304565429688, -0.07686424255371094, -0.071075439453125, -0.06528663635253906, -0.059497833251953125, -0.05370903015136719, -0.04792022705078125, -0.04213142395019531, -0.036342620849609375, -0.030553817749023438, -0.0247650146484375, -0.018976211547851562, -0.013187408447265625, -0.0073986053466796875, -0.00160980224609375, 0.0041790008544921875, 0.009967803955078125, 0.015756607055664062, 0.02154541015625, 0.027334213256835938, 0.033123016357421875, 0.03891181945800781, 0.04470062255859375, 0.05048942565917969, 0.056278228759765625, 0.06206703186035156, 0.0678558349609375, 0.07364463806152344, 0.07943344116210938, 0.08522224426269531, 0.09101104736328125, 0.09679985046386719, 0.10258865356445312, 0.10837745666503906, 0.114166259765625, 0.11995506286621094, 0.12574386596679688, 0.1315326690673828, 0.13732147216796875, 0.1431102752685547, 0.14889907836914062, 0.15468788146972656, 0.1604766845703125, 0.16626548767089844, 0.17205429077148438, 0.1778430938720703, 0.18363189697265625, 0.1894207000732422, 0.19520950317382812, 0.20099830627441406, 0.206787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 18.0, 25.0, 33.0, 57.0, 113.0, 198.0, 341.0, 757.0, 1688.0, 4978.0, 17465.0, 84205.0, 786537.0, 120351.0, 22052.0, 5862.0, 2028.0, 881.0, 409.0, 205.0, 138.0, 65.0, 36.0, 27.0, 18.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.1829833984375, -0.17824077606201172, -0.17349815368652344, -0.16875553131103516, -0.16401290893554688, -0.1592702865600586, -0.1545276641845703, -0.14978504180908203, -0.14504241943359375, -0.14029979705810547, -0.1355571746826172, -0.1308145523071289, -0.12607192993164062, -0.12132930755615234, -0.11658668518066406, -0.11184406280517578, -0.1071014404296875, -0.10235881805419922, -0.09761619567871094, -0.09287357330322266, -0.08813095092773438, -0.0833883285522461, -0.07864570617675781, -0.07390308380126953, -0.06916046142578125, -0.06441783905029297, -0.05967521667480469, -0.054932594299316406, -0.050189971923828125, -0.045447349548339844, -0.04070472717285156, -0.03596210479736328, -0.031219482421875, -0.02647686004638672, -0.021734237670898438, -0.016991615295410156, -0.012248992919921875, -0.007506370544433594, -0.0027637481689453125, 0.0019788742065429688, 0.00672149658203125, 0.011464118957519531, 0.016206741333007812, 0.020949363708496094, 0.025691986083984375, 0.030434608459472656, 0.03517723083496094, 0.03991985321044922, 0.0446624755859375, 0.04940509796142578, 0.05414772033691406, 0.058890342712402344, 0.06363296508789062, 0.0683755874633789, 0.07311820983886719, 0.07786083221435547, 0.08260345458984375, 0.08734607696533203, 0.09208869934082031, 0.0968313217163086, 0.10157394409179688, 0.10631656646728516, 0.11105918884277344, 0.11580181121826172, 0.12054443359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 15.0, 11.0, 17.0, 35.0, 36.0, 66.0, 88.0, 119.0, 135.0, 125.0, 91.0, 69.0, 46.0, 46.0, 30.0, 16.0, 9.0, 14.0, 6.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.37905502319336e-05, -7.21421092748642e-05, -7.04936683177948e-05, -6.88452273607254e-05, -6.7196786403656e-05, -6.554834544658661e-05, -6.389990448951721e-05, -6.225146353244781e-05, -6.060302257537842e-05, -5.895458161830902e-05, -5.7306140661239624e-05, -5.565769970417023e-05, -5.400925874710083e-05, -5.236081779003143e-05, -5.0712376832962036e-05, -4.906393587589264e-05, -4.741549491882324e-05, -4.5767053961753845e-05, -4.411861300468445e-05, -4.247017204761505e-05, -4.0821731090545654e-05, -3.917329013347626e-05, -3.752484917640686e-05, -3.587640821933746e-05, -3.4227967262268066e-05, -3.257952630519867e-05, -3.093108534812927e-05, -2.9282644391059875e-05, -2.763420343399048e-05, -2.598576247692108e-05, -2.4337321519851685e-05, -2.2688880562782288e-05, -2.104043960571289e-05, -1.9391998648643494e-05, -1.7743557691574097e-05, -1.60951167345047e-05, -1.4446675777435303e-05, -1.2798234820365906e-05, -1.1149793863296509e-05, -9.501352906227112e-06, -7.852911949157715e-06, -6.204470992088318e-06, -4.556030035018921e-06, -2.907589077949524e-06, -1.259148120880127e-06, 3.8929283618927e-07, 2.037733793258667e-06, 3.686174750328064e-06, 5.334615707397461e-06, 6.983056664466858e-06, 8.631497621536255e-06, 1.0279938578605652e-05, 1.1928379535675049e-05, 1.3576820492744446e-05, 1.5225261449813843e-05, 1.687370240688324e-05, 1.8522143363952637e-05, 2.0170584321022034e-05, 2.181902527809143e-05, 2.3467466235160828e-05, 2.5115907192230225e-05, 2.676434814929962e-05, 2.841278910636902e-05, 3.0061230063438416e-05, 3.170967102050781e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 10.0, 10.0, 7.0, 14.0, 17.0, 21.0, 50.0, 60.0, 75.0, 128.0, 230.0, 378.0, 763.0, 1654.0, 3824.0, 10677.0, 37318.0, 289773.0, 626041.0, 54570.0, 14077.0, 4716.0, 2033.0, 957.0, 466.0, 272.0, 133.0, 83.0, 52.0, 34.0, 24.0, 34.0, 16.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1181640625, -0.11410713195800781, -0.11005020141601562, -0.10599327087402344, -0.10193634033203125, -0.09787940979003906, -0.09382247924804688, -0.08976554870605469, -0.0857086181640625, -0.08165168762207031, -0.07759475708007812, -0.07353782653808594, -0.06948089599609375, -0.06542396545410156, -0.061367034912109375, -0.05731010437011719, -0.053253173828125, -0.04919624328613281, -0.045139312744140625, -0.04108238220214844, -0.03702545166015625, -0.03296852111816406, -0.028911590576171875, -0.024854660034179688, -0.0207977294921875, -0.016740798950195312, -0.012683868408203125, -0.008626937866210938, -0.00457000732421875, -0.0005130767822265625, 0.003543853759765625, 0.0076007843017578125, 0.01165771484375, 0.015714645385742188, 0.019771575927734375, 0.023828506469726562, 0.02788543701171875, 0.03194236755371094, 0.035999298095703125, 0.04005622863769531, 0.0441131591796875, 0.04817008972167969, 0.052227020263671875, 0.05628395080566406, 0.06034088134765625, 0.06439781188964844, 0.06845474243164062, 0.07251167297363281, 0.076568603515625, 0.08062553405761719, 0.08468246459960938, 0.08873939514160156, 0.09279632568359375, 0.09685325622558594, 0.10091018676757812, 0.10496711730957031, 0.1090240478515625, 0.11308097839355469, 0.11713790893554688, 0.12119483947753906, 0.12525177001953125, 0.12930870056152344, 0.13336563110351562, 0.1374225616455078, 0.1414794921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 15.0, 17.0, 23.0, 30.0, 60.0, 110.0, 218.0, 203.0, 125.0, 59.0, 47.0, 16.0, 21.0, 10.0, 6.0, 11.0, 5.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.1105508804321289, -0.10721015930175781, -0.10386943817138672, -0.10052871704101562, -0.09718799591064453, -0.09384727478027344, -0.09050655364990234, -0.08716583251953125, -0.08382511138916016, -0.08048439025878906, -0.07714366912841797, -0.07380294799804688, -0.07046222686767578, -0.06712150573730469, -0.0637807846069336, -0.0604400634765625, -0.057099342346191406, -0.05375862121582031, -0.05041790008544922, -0.047077178955078125, -0.04373645782470703, -0.04039573669433594, -0.037055015563964844, -0.03371429443359375, -0.030373573303222656, -0.027032852172851562, -0.02369213104248047, -0.020351409912109375, -0.01701068878173828, -0.013669967651367188, -0.010329246520996094, -0.006988525390625, -0.0036478042602539062, -0.0003070831298828125, 0.0030336380004882812, 0.006374359130859375, 0.009715080261230469, 0.013055801391601562, 0.016396522521972656, 0.01973724365234375, 0.023077964782714844, 0.026418685913085938, 0.02975940704345703, 0.033100128173828125, 0.03644084930419922, 0.03978157043457031, 0.043122291564941406, 0.0464630126953125, 0.049803733825683594, 0.05314445495605469, 0.05648517608642578, 0.059825897216796875, 0.06316661834716797, 0.06650733947753906, 0.06984806060791016, 0.07318878173828125, 0.07652950286865234, 0.07987022399902344, 0.08321094512939453, 0.08655166625976562, 0.08989238739013672, 0.09323310852050781, 0.0965738296508789, 0.09991455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 22.0, 35.0, 118.0, 195.0, 223.0, 219.0, 109.0, 46.0, 23.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.665393352508545, -3.5882980823516846, -3.511202573776245, -3.4341073036193848, -3.3570117950439453, -3.279916524887085, -3.2028210163116455, -3.125725746154785, -3.0486302375793457, -2.9715349674224854, -2.894439458847046, -2.8173441886901855, -2.740248680114746, -2.6631534099578857, -2.5860579013824463, -2.508962631225586, -2.4318673610687256, -2.3547720909118652, -2.277676582336426, -2.2005813121795654, -2.123485803604126, -2.0463905334472656, -1.9692951440811157, -1.8921997547149658, -1.815104365348816, -1.738008975982666, -1.6609135866165161, -1.5838181972503662, -1.5067229270935059, -1.4296274185180664, -1.352532148361206, -1.2754367589950562, -1.1983413696289062, -1.1212459802627563, -1.0441505908966064, -0.9670552611351013, -0.8899598717689514, -0.8128644824028015, -0.7357691526412964, -0.6586737632751465, -0.5815783739089966, -0.5044829845428467, -0.42738762497901917, -0.35029226541519165, -0.27319687604904175, -0.19610148668289185, -0.11900612711906433, -0.041910767555236816, 0.035184621810913086, 0.1122799962759018, 0.1893753707408905, 0.266470730304718, 0.3435661196708679, 0.4206615090370178, 0.49775686860084534, 0.5748522281646729, 0.6519476175308228, 0.7290430068969727, 0.8061383962631226, 0.8832337260246277, 0.9603291153907776, 1.0374245643615723, 1.1145198345184326, 1.1916152238845825, 1.2687106132507324]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 8.0, 7.0, 13.0, 14.0, 11.0, 18.0, 30.0, 18.0, 27.0, 25.0, 26.0, 36.0, 28.0, 46.0, 37.0, 44.0, 38.0, 46.0, 30.0, 33.0, 45.0, 40.0, 33.0, 29.0, 28.0, 34.0, 23.0, 35.0, 19.0, 24.0, 23.0, 21.0, 21.0, 12.0, 14.0, 18.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6341946125030518, -0.6144767999649048, -0.5947589874267578, -0.5750411748886108, -0.5553233027458191, -0.5356054902076721, -0.5158876776695251, -0.4961698651313782, -0.4764520525932312, -0.45673424005508423, -0.43701639771461487, -0.4172985851764679, -0.3975807726383209, -0.37786293029785156, -0.3581451177597046, -0.3384273052215576, -0.31870946288108826, -0.2989916503429413, -0.2792738080024719, -0.25955599546432495, -0.23983818292617798, -0.2201203554868698, -0.20040252804756165, -0.18068471550941467, -0.1609668880701065, -0.14124906063079834, -0.12153124809265137, -0.1018134206533432, -0.08209560066461563, -0.06237778067588806, -0.042659953236579895, -0.022942140698432922, -0.003224313259124756, 0.016493508592247963, 0.03621133044362068, 0.05592915415763855, 0.07564697414636612, 0.09536479413509369, 0.11508262157440186, 0.13480043411254883, 0.154518261551857, 0.17423608899116516, 0.19395390152931213, 0.2136717289686203, 0.23338955640792847, 0.25310736894607544, 0.2728251814842224, 0.2925429940223694, 0.31226083636283875, 0.3319786489009857, 0.3516964912414551, 0.37141430377960205, 0.391132116317749, 0.410849928855896, 0.43056777119636536, 0.45028558373451233, 0.4700034260749817, 0.48972123861312866, 0.5094390511512756, 0.5291569232940674, 0.5488747358322144, 0.5685925483703613, 0.5883103609085083, 0.6080281734466553, 0.6277459859848022]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 12.0, 6.0, 8.0, 10.0, 30.0, 32.0, 46.0, 63.0, 119.0, 189.0, 268.0, 515.0, 936.0, 1744.0, 3344.0, 7053.0, 17439.0, 56789.0, 483919.0, 3480138.0, 97432.0, 24990.0, 9582.0, 4376.0, 2267.0, 1163.0, 724.0, 386.0, 224.0, 153.0, 106.0, 65.0, 59.0, 32.0, 14.0, 14.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17600440979003906, -0.16975784301757812, -0.1635112762451172, -0.15726470947265625, -0.1510181427001953, -0.14477157592773438, -0.13852500915527344, -0.1322784423828125, -0.12603187561035156, -0.11978530883789062, -0.11353874206542969, -0.10729217529296875, -0.10104560852050781, -0.09479904174804688, -0.08855247497558594, -0.082305908203125, -0.07605934143066406, -0.06981277465820312, -0.06356620788574219, -0.05731964111328125, -0.05107307434082031, -0.044826507568359375, -0.03857994079589844, -0.0323333740234375, -0.026086807250976562, -0.019840240478515625, -0.013593673706054688, -0.00734710693359375, -0.0011005401611328125, 0.005146026611328125, 0.011392593383789062, 0.01763916015625, 0.023885726928710938, 0.030132293701171875, 0.03637886047363281, 0.04262542724609375, 0.04887199401855469, 0.055118560791015625, 0.06136512756347656, 0.0676116943359375, 0.07385826110839844, 0.08010482788085938, 0.08635139465332031, 0.09259796142578125, 0.09884452819824219, 0.10509109497070312, 0.11133766174316406, 0.117584228515625, 0.12383079528808594, 0.13007736206054688, 0.1363239288330078, 0.14257049560546875, 0.1488170623779297, 0.15506362915039062, 0.16131019592285156, 0.1675567626953125, 0.17380332946777344, 0.18004989624023438, 0.1862964630126953, 0.19254302978515625, 0.1987895965576172, 0.20503616333007812, 0.21128273010253906, 0.217529296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 7.0, 12.0, 24.0, 20.0, 27.0, 57.0, 69.0, 69.0, 67.0, 71.0, 88.0, 64.0, 67.0, 74.0, 69.0, 46.0, 39.0, 43.0, 26.0, 12.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054901123046875, -0.05318927764892578, -0.05147743225097656, -0.049765586853027344, -0.048053741455078125, -0.046341896057128906, -0.04463005065917969, -0.04291820526123047, -0.04120635986328125, -0.03949451446533203, -0.03778266906738281, -0.036070823669433594, -0.034358978271484375, -0.032647132873535156, -0.030935287475585938, -0.02922344207763672, -0.0275115966796875, -0.02579975128173828, -0.024087905883789062, -0.022376060485839844, -0.020664215087890625, -0.018952369689941406, -0.017240524291992188, -0.015528678894042969, -0.01381683349609375, -0.012104988098144531, -0.010393142700195312, -0.008681297302246094, -0.006969451904296875, -0.005257606506347656, -0.0035457611083984375, -0.0018339157104492188, -0.0001220703125, 0.0015897750854492188, 0.0033016204833984375, 0.005013465881347656, 0.006725311279296875, 0.008437156677246094, 0.010149002075195312, 0.011860847473144531, 0.01357269287109375, 0.015284538269042969, 0.016996383666992188, 0.018708229064941406, 0.020420074462890625, 0.022131919860839844, 0.023843765258789062, 0.02555561065673828, 0.0272674560546875, 0.02897930145263672, 0.030691146850585938, 0.032402992248535156, 0.034114837646484375, 0.035826683044433594, 0.03753852844238281, 0.03925037384033203, 0.04096221923828125, 0.04267406463623047, 0.04438591003417969, 0.046097755432128906, 0.047809600830078125, 0.049521446228027344, 0.05123329162597656, 0.05294513702392578, 0.054656982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 14.0, 14.0, 17.0, 28.0, 45.0, 51.0, 80.0, 91.0, 131.0, 212.0, 287.0, 455.0, 687.0, 1176.0, 2066.0, 3939.0, 9040.0, 23641.0, 77256.0, 793258.0, 3117565.0, 111864.0, 29770.0, 11495.0, 4957.0, 2401.0, 1371.0, 816.0, 513.0, 310.0, 223.0, 142.0, 102.0, 72.0, 38.0, 40.0, 28.0, 22.0, 15.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.2106800079345703, -0.20431900024414062, -0.19795799255371094, -0.19159698486328125, -0.18523597717285156, -0.17887496948242188, -0.1725139617919922, -0.1661529541015625, -0.1597919464111328, -0.15343093872070312, -0.14706993103027344, -0.14070892333984375, -0.13434791564941406, -0.12798690795898438, -0.12162590026855469, -0.115264892578125, -0.10890388488769531, -0.10254287719726562, -0.09618186950683594, -0.08982086181640625, -0.08345985412597656, -0.07709884643554688, -0.07073783874511719, -0.0643768310546875, -0.05801582336425781, -0.051654815673828125, -0.04529380798339844, -0.03893280029296875, -0.03257179260253906, -0.026210784912109375, -0.019849777221679688, -0.01348876953125, -0.0071277618408203125, -0.000766754150390625, 0.0055942535400390625, 0.01195526123046875, 0.018316268920898438, 0.024677276611328125, 0.031038284301757812, 0.0373992919921875, 0.04376029968261719, 0.050121307373046875, 0.05648231506347656, 0.06284332275390625, 0.06920433044433594, 0.07556533813476562, 0.08192634582519531, 0.088287353515625, 0.09464836120605469, 0.10100936889648438, 0.10737037658691406, 0.11373138427734375, 0.12009239196777344, 0.12645339965820312, 0.1328144073486328, 0.1391754150390625, 0.1455364227294922, 0.15189743041992188, 0.15825843811035156, 0.16461944580078125, 0.17098045349121094, 0.17734146118164062, 0.1837024688720703, 0.1900634765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 11.0, 11.0, 11.0, 26.0, 27.0, 43.0, 62.0, 164.0, 392.0, 2082.0, 747.0, 218.0, 98.0, 49.0, 38.0, 23.0, 16.0, 8.0, 12.0, 9.0, 6.0, 6.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.1113576889038086, -0.10815238952636719, -0.10494709014892578, -0.10174179077148438, -0.09853649139404297, -0.09533119201660156, -0.09212589263916016, -0.08892059326171875, -0.08571529388427734, -0.08250999450683594, -0.07930469512939453, -0.07609939575195312, -0.07289409637451172, -0.06968879699707031, -0.0664834976196289, -0.0632781982421875, -0.060072898864746094, -0.05686759948730469, -0.05366230010986328, -0.050457000732421875, -0.04725170135498047, -0.04404640197753906, -0.040841102600097656, -0.03763580322265625, -0.034430503845214844, -0.031225204467773438, -0.02801990509033203, -0.024814605712890625, -0.02160930633544922, -0.018404006958007812, -0.015198707580566406, -0.011993408203125, -0.008788108825683594, -0.0055828094482421875, -0.0023775100708007812, 0.000827789306640625, 0.004033088684082031, 0.0072383880615234375, 0.010443687438964844, 0.01364898681640625, 0.016854286193847656, 0.020059585571289062, 0.02326488494873047, 0.026470184326171875, 0.02967548370361328, 0.03288078308105469, 0.036086082458496094, 0.0392913818359375, 0.042496681213378906, 0.04570198059082031, 0.04890727996826172, 0.052112579345703125, 0.05531787872314453, 0.05852317810058594, 0.061728477478027344, 0.06493377685546875, 0.06813907623291016, 0.07134437561035156, 0.07454967498779297, 0.07775497436523438, 0.08096027374267578, 0.08416557312011719, 0.0873708724975586, 0.090576171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 13.0, 15.0, 21.0, 45.0, 64.0, 88.0, 112.0, 141.0, 144.0, 118.0, 104.0, 45.0, 31.0, 25.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5436254143714905, -0.526502788066864, -0.5093802213668823, -0.49225762486457825, -0.47513502836227417, -0.4580124020576477, -0.44088980555534363, -0.42376720905303955, -0.4066446125507355, -0.3895220160484314, -0.3723994195461273, -0.35527682304382324, -0.3381541967391968, -0.3210316300392151, -0.3039090037345886, -0.28678640723228455, -0.26966381072998047, -0.2525412142276764, -0.23541861772537231, -0.21829600632190704, -0.20117340981960297, -0.1840508133172989, -0.16692820191383362, -0.14980560541152954, -0.13268300890922546, -0.11556041240692139, -0.09843780845403671, -0.08131520450115204, -0.06419260799884796, -0.047070011496543884, -0.02994740754365921, -0.012824803590774536, 0.004297852516174316, 0.021420452743768692, 0.03854305297136307, 0.05566565319895744, 0.07278825342655182, 0.0899108499288559, 0.10703345388174057, 0.12415605783462524, 0.14127865433692932, 0.1584012508392334, 0.17552384734153748, 0.19264645874500275, 0.20976905524730682, 0.2268916517496109, 0.24401426315307617, 0.26113685965538025, 0.2782594561576843, 0.2953820526599884, 0.3125046491622925, 0.32962724566459656, 0.34674984216690063, 0.3638724684715271, 0.3809950649738312, 0.39811766147613525, 0.41524025797843933, 0.4323628544807434, 0.4494854509830475, 0.46660804748535156, 0.483730673789978, 0.5008532404899597, 0.5179758667945862, 0.5350984334945679, 0.5522210597991943]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 10.0, 16.0, 14.0, 10.0, 18.0, 23.0, 34.0, 26.0, 24.0, 28.0, 36.0, 40.0, 34.0, 28.0, 28.0, 47.0, 32.0, 38.0, 43.0, 46.0, 40.0, 22.0, 39.0, 31.0, 30.0, 41.0, 30.0, 20.0, 28.0, 17.0, 15.0, 18.0, 14.0, 11.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.20087182521820068, -0.19409941136837006, -0.18732699751853943, -0.1805545836687088, -0.17378216981887817, -0.16700975596904755, -0.16023734211921692, -0.1534649133682251, -0.14669251441955566, -0.13992010056972504, -0.1331476867198944, -0.12637527287006378, -0.11960285902023315, -0.11283044517040253, -0.1060580238699913, -0.09928561002016068, -0.09251318871974945, -0.08574077486991882, -0.0789683610200882, -0.07219594717025757, -0.06542353332042694, -0.058651115745306015, -0.05187869817018509, -0.04510628432035446, -0.038333870470523834, -0.03156145662069321, -0.02478904090821743, -0.018016625195741653, -0.011244211345911026, -0.0044717974960803986, 0.0023006200790405273, 0.009073033928871155, 0.015845447778701782, 0.02261786162853241, 0.029390277341008186, 0.03616269305348396, 0.04293510690331459, 0.04970752075314522, 0.056479938328266144, 0.06325235217809677, 0.0700247660279274, 0.07679717987775803, 0.08356959372758865, 0.09034201502799988, 0.0971144288778305, 0.10388684272766113, 0.11065925657749176, 0.11743167042732239, 0.12420408427715302, 0.13097649812698364, 0.13774891197681427, 0.1445213258266449, 0.15129373967647552, 0.15806615352630615, 0.16483858227729797, 0.1716109812259674, 0.17838340997695923, 0.18515582382678986, 0.19192823767662048, 0.1987006515264511, 0.20547306537628174, 0.21224547922611237, 0.219017893075943, 0.22579032182693481, 0.23256272077560425]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 12.0, 35.0, 53.0, 79.0, 140.0, 315.0, 619.0, 1513.0, 3970.0, 11566.0, 39863.0, 219009.0, 650165.0, 87400.0, 22470.0, 7053.0, 2485.0, 879.0, 426.0, 204.0, 115.0, 64.0, 37.0, 30.0, 15.0, 11.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.2386474609375, -0.23168373107910156, -0.22472000122070312, -0.2177562713623047, -0.21079254150390625, -0.2038288116455078, -0.19686508178710938, -0.18990135192871094, -0.1829376220703125, -0.17597389221191406, -0.16901016235351562, -0.1620464324951172, -0.15508270263671875, -0.1481189727783203, -0.14115524291992188, -0.13419151306152344, -0.127227783203125, -0.12026405334472656, -0.11330032348632812, -0.10633659362792969, -0.09937286376953125, -0.09240913391113281, -0.08544540405273438, -0.07848167419433594, -0.0715179443359375, -0.06455421447753906, -0.057590484619140625, -0.05062675476074219, -0.04366302490234375, -0.03669929504394531, -0.029735565185546875, -0.022771835327148438, -0.01580810546875, -0.008844375610351562, -0.001880645751953125, 0.0050830841064453125, 0.01204681396484375, 0.019010543823242188, 0.025974273681640625, 0.03293800354003906, 0.0399017333984375, 0.04686546325683594, 0.053829193115234375, 0.06079292297363281, 0.06775665283203125, 0.07472038269042969, 0.08168411254882812, 0.08864784240722656, 0.095611572265625, 0.10257530212402344, 0.10953903198242188, 0.11650276184082031, 0.12346649169921875, 0.1304302215576172, 0.13739395141601562, 0.14435768127441406, 0.1513214111328125, 0.15828514099121094, 0.16524887084960938, 0.1722126007080078, 0.17917633056640625, 0.1861400604248047, 0.19310379028320312, 0.20006752014160156, 0.20703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 24.0, 19.0, 27.0, 50.0, 54.0, 60.0, 55.0, 88.0, 77.0, 65.0, 82.0, 77.0, 73.0, 46.0, 52.0, 35.0, 23.0, 16.0, 14.0, 13.0, 6.0, 5.0, 7.0, 0.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.060821533203125, -0.059103965759277344, -0.05738639831542969, -0.05566883087158203, -0.053951263427734375, -0.05223369598388672, -0.05051612854003906, -0.048798561096191406, -0.04708099365234375, -0.045363426208496094, -0.04364585876464844, -0.04192829132080078, -0.040210723876953125, -0.03849315643310547, -0.03677558898925781, -0.035058021545410156, -0.0333404541015625, -0.031622886657714844, -0.029905319213867188, -0.02818775177001953, -0.026470184326171875, -0.02475261688232422, -0.023035049438476562, -0.021317481994628906, -0.01959991455078125, -0.017882347106933594, -0.016164779663085938, -0.014447212219238281, -0.012729644775390625, -0.011012077331542969, -0.009294509887695312, -0.007576942443847656, -0.005859375, -0.004141807556152344, -0.0024242401123046875, -0.0007066726684570312, 0.001010894775390625, 0.0027284622192382812, 0.0044460296630859375, 0.006163597106933594, 0.00788116455078125, 0.009598731994628906, 0.011316299438476562, 0.013033866882324219, 0.014751434326171875, 0.01646900177001953, 0.018186569213867188, 0.019904136657714844, 0.0216217041015625, 0.023339271545410156, 0.025056838989257812, 0.02677440643310547, 0.028491973876953125, 0.03020954132080078, 0.03192710876464844, 0.033644676208496094, 0.03536224365234375, 0.037079811096191406, 0.03879737854003906, 0.04051494598388672, 0.042232513427734375, 0.04395008087158203, 0.04566764831542969, 0.047385215759277344, 0.049102783203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 19.0, 27.0, 50.0, 107.0, 148.0, 324.0, 704.0, 1514.0, 3723.0, 9594.0, 28763.0, 121474.0, 753297.0, 90183.0, 24438.0, 8393.0, 3203.0, 1320.0, 573.0, 283.0, 158.0, 90.0, 59.0, 29.0, 24.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.22017860412597656, -0.21269607543945312, -0.2052135467529297, -0.19773101806640625, -0.1902484893798828, -0.18276596069335938, -0.17528343200683594, -0.1678009033203125, -0.16031837463378906, -0.15283584594726562, -0.1453533172607422, -0.13787078857421875, -0.1303882598876953, -0.12290573120117188, -0.11542320251464844, -0.107940673828125, -0.10045814514160156, -0.09297561645507812, -0.08549308776855469, -0.07801055908203125, -0.07052803039550781, -0.06304550170898438, -0.05556297302246094, -0.0480804443359375, -0.04059791564941406, -0.033115386962890625, -0.025632858276367188, -0.01815032958984375, -0.010667800903320312, -0.003185272216796875, 0.0042972564697265625, 0.01177978515625, 0.019262313842773438, 0.026744842529296875, 0.03422737121582031, 0.04170989990234375, 0.04919242858886719, 0.056674957275390625, 0.06415748596191406, 0.0716400146484375, 0.07912254333496094, 0.08660507202148438, 0.09408760070800781, 0.10157012939453125, 0.10905265808105469, 0.11653518676757812, 0.12401771545410156, 0.131500244140625, 0.13898277282714844, 0.14646530151367188, 0.1539478302001953, 0.16143035888671875, 0.1689128875732422, 0.17639541625976562, 0.18387794494628906, 0.1913604736328125, 0.19884300231933594, 0.20632553100585938, 0.2138080596923828, 0.22129058837890625, 0.2287731170654297, 0.23625564575195312, 0.24373817443847656, 0.251220703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 8.0, 11.0, 20.0, 23.0, 37.0, 30.0, 46.0, 42.0, 63.0, 63.0, 78.0, 75.0, 65.0, 67.0, 62.0, 63.0, 41.0, 46.0, 22.0, 27.0, 24.0, 23.0, 12.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.277587890625, -0.2702445983886719, -0.26290130615234375, -0.2555580139160156, -0.2482147216796875, -0.24087142944335938, -0.23352813720703125, -0.22618484497070312, -0.218841552734375, -0.21149826049804688, -0.20415496826171875, -0.19681167602539062, -0.1894683837890625, -0.18212509155273438, -0.17478179931640625, -0.16743850708007812, -0.16009521484375, -0.15275192260742188, -0.14540863037109375, -0.13806533813476562, -0.1307220458984375, -0.12337875366210938, -0.11603546142578125, -0.10869216918945312, -0.101348876953125, -0.09400558471679688, -0.08666229248046875, -0.07931900024414062, -0.0719757080078125, -0.06463241577148438, -0.05728912353515625, -0.049945831298828125, -0.0426025390625, -0.035259246826171875, -0.02791595458984375, -0.020572662353515625, -0.0132293701171875, -0.005886077880859375, 0.00145721435546875, 0.008800506591796875, 0.016143798828125, 0.023487091064453125, 0.03083038330078125, 0.038173675537109375, 0.0455169677734375, 0.052860260009765625, 0.06020355224609375, 0.06754684448242188, 0.07489013671875, 0.08223342895507812, 0.08957672119140625, 0.09692001342773438, 0.1042633056640625, 0.11160659790039062, 0.11894989013671875, 0.12629318237304688, 0.133636474609375, 0.14097976684570312, 0.14832305908203125, 0.15566635131835938, 0.1630096435546875, 0.17035293579101562, 0.17769622802734375, 0.18503952026367188, 0.1923828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 5.0, 9.0, 17.0, 17.0, 23.0, 31.0, 56.0, 102.0, 122.0, 203.0, 287.0, 505.0, 931.0, 1755.0, 3780.0, 9428.0, 30452.0, 245933.0, 688643.0, 43933.0, 12698.0, 4802.0, 2144.0, 1053.0, 628.0, 341.0, 208.0, 134.0, 99.0, 64.0, 39.0, 32.0, 23.0, 13.0, 19.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14453125, -0.1395702362060547, -0.13460922241210938, -0.12964820861816406, -0.12468719482421875, -0.11972618103027344, -0.11476516723632812, -0.10980415344238281, -0.1048431396484375, -0.09988212585449219, -0.09492111206054688, -0.08996009826660156, -0.08499908447265625, -0.08003807067871094, -0.07507705688476562, -0.07011604309082031, -0.065155029296875, -0.06019401550292969, -0.055233001708984375, -0.05027198791503906, -0.04531097412109375, -0.04034996032714844, -0.035388946533203125, -0.030427932739257812, -0.0254669189453125, -0.020505905151367188, -0.015544891357421875, -0.010583877563476562, -0.00562286376953125, -0.0006618499755859375, 0.004299163818359375, 0.009260177612304688, 0.01422119140625, 0.019182205200195312, 0.024143218994140625, 0.029104232788085938, 0.03406524658203125, 0.03902626037597656, 0.043987274169921875, 0.04894828796386719, 0.0539093017578125, 0.05887031555175781, 0.06383132934570312, 0.06879234313964844, 0.07375335693359375, 0.07871437072753906, 0.08367538452148438, 0.08863639831542969, 0.093597412109375, 0.09855842590332031, 0.10351943969726562, 0.10848045349121094, 0.11344146728515625, 0.11840248107910156, 0.12336349487304688, 0.1283245086669922, 0.1332855224609375, 0.1382465362548828, 0.14320755004882812, 0.14816856384277344, 0.15312957763671875, 0.15809059143066406, 0.16305160522460938, 0.1680126190185547, 0.1729736328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 6.0, 17.0, 22.0, 37.0, 56.0, 59.0, 81.0, 120.0, 91.0, 103.0, 110.0, 60.0, 52.0, 36.0, 28.0, 25.0, 26.0, 13.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-05, -2.7223490178585052e-05, -2.5836750864982605e-05, -2.4450011551380157e-05, -2.306327223777771e-05, -2.1676532924175262e-05, -2.0289793610572815e-05, -1.8903054296970367e-05, -1.751631498336792e-05, -1.6129575669765472e-05, -1.4742836356163025e-05, -1.3356097042560577e-05, -1.196935772895813e-05, -1.0582618415355682e-05, -9.195879101753235e-06, -7.809139788150787e-06, -6.42240047454834e-06, -5.035661160945892e-06, -3.648921847343445e-06, -2.2621825337409973e-06, -8.754432201385498e-07, 5.112960934638977e-07, 1.8980354070663452e-06, 3.2847747206687927e-06, 4.67151403427124e-06, 6.058253347873688e-06, 7.444992661476135e-06, 8.831731975078583e-06, 1.021847128868103e-05, 1.1605210602283478e-05, 1.2991949915885925e-05, 1.4378689229488373e-05, 1.576542854309082e-05, 1.7152167856693268e-05, 1.8538907170295715e-05, 1.9925646483898163e-05, 2.131238579750061e-05, 2.2699125111103058e-05, 2.4085864424705505e-05, 2.5472603738307953e-05, 2.68593430519104e-05, 2.8246082365512848e-05, 2.9632821679115295e-05, 3.101956099271774e-05, 3.240630030632019e-05, 3.379303961992264e-05, 3.5179778933525085e-05, 3.656651824712753e-05, 3.795325756072998e-05, 3.933999687433243e-05, 4.0726736187934875e-05, 4.211347550153732e-05, 4.350021481513977e-05, 4.488695412874222e-05, 4.6273693442344666e-05, 4.766043275594711e-05, 4.904717206954956e-05, 5.043391138315201e-05, 5.1820650696754456e-05, 5.32073900103569e-05, 5.459412932395935e-05, 5.59808686375618e-05, 5.7367607951164246e-05, 5.875434726476669e-05, 6.014108657836914e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 18.0, 14.0, 23.0, 42.0, 63.0, 88.0, 174.0, 258.0, 483.0, 1031.0, 2180.0, 5203.0, 14883.0, 53522.0, 780202.0, 149692.0, 26030.0, 8193.0, 3275.0, 1515.0, 678.0, 407.0, 217.0, 130.0, 80.0, 52.0, 26.0, 22.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.1596698760986328, -0.15430068969726562, -0.14893150329589844, -0.14356231689453125, -0.13819313049316406, -0.13282394409179688, -0.1274547576904297, -0.1220855712890625, -0.11671638488769531, -0.11134719848632812, -0.10597801208496094, -0.10060882568359375, -0.09523963928222656, -0.08987045288085938, -0.08450126647949219, -0.079132080078125, -0.07376289367675781, -0.06839370727539062, -0.06302452087402344, -0.05765533447265625, -0.05228614807128906, -0.046916961669921875, -0.04154777526855469, -0.0361785888671875, -0.030809402465820312, -0.025440216064453125, -0.020071029663085938, -0.01470184326171875, -0.009332656860351562, -0.003963470458984375, 0.0014057159423828125, 0.00677490234375, 0.012144088745117188, 0.017513275146484375, 0.022882461547851562, 0.02825164794921875, 0.03362083435058594, 0.038990020751953125, 0.04435920715332031, 0.0497283935546875, 0.05509757995605469, 0.060466766357421875, 0.06583595275878906, 0.07120513916015625, 0.07657432556152344, 0.08194351196289062, 0.08731269836425781, 0.092681884765625, 0.09805107116699219, 0.10342025756835938, 0.10878944396972656, 0.11415863037109375, 0.11952781677246094, 0.12489700317382812, 0.1302661895751953, 0.1356353759765625, 0.1410045623779297, 0.14637374877929688, 0.15174293518066406, 0.15711212158203125, 0.16248130798339844, 0.16785049438476562, 0.1732196807861328, 0.1785888671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 26.0, 32.0, 53.0, 110.0, 264.0, 219.0, 103.0, 36.0, 18.0, 21.0, 18.0, 14.0, 5.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.08849048614501953, -0.08378028869628906, -0.0790700912475586, -0.07435989379882812, -0.06964969635009766, -0.06493949890136719, -0.06022930145263672, -0.05551910400390625, -0.05080890655517578, -0.04609870910644531, -0.041388511657714844, -0.036678314208984375, -0.031968116760253906, -0.027257919311523438, -0.02254772186279297, -0.0178375244140625, -0.013127326965332031, -0.008417129516601562, -0.0037069320678710938, 0.001003265380859375, 0.005713462829589844, 0.010423660278320312, 0.015133857727050781, 0.01984405517578125, 0.02455425262451172, 0.029264450073242188, 0.033974647521972656, 0.038684844970703125, 0.043395042419433594, 0.04810523986816406, 0.05281543731689453, 0.057525634765625, 0.06223583221435547, 0.06694602966308594, 0.0716562271118164, 0.07636642456054688, 0.08107662200927734, 0.08578681945800781, 0.09049701690673828, 0.09520721435546875, 0.09991741180419922, 0.10462760925292969, 0.10933780670166016, 0.11404800415039062, 0.1187582015991211, 0.12346839904785156, 0.12817859649658203, 0.1328887939453125, 0.13759899139404297, 0.14230918884277344, 0.1470193862915039, 0.15172958374023438, 0.15643978118896484, 0.1611499786376953, 0.16586017608642578, 0.17057037353515625, 0.17528057098388672, 0.1799907684326172, 0.18470096588134766, 0.18941116333007812, 0.1941213607788086, 0.19883155822753906, 0.20354175567626953, 0.208251953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 18.0, 21.0, 26.0, 40.0, 60.0, 98.0, 95.0, 115.0, 109.0, 108.0, 92.0, 69.0, 40.0, 27.0, 26.0, 14.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2618948221206665, -1.2237956523895264, -1.1856964826583862, -1.1475971937179565, -1.1094980239868164, -1.0713988542556763, -1.0332996845245361, -0.995200514793396, -0.9571012854576111, -0.919002115726471, -0.880902886390686, -0.8428037166595459, -0.8047045469284058, -0.7666053175926208, -0.7285061478614807, -0.6904069185256958, -0.6523077487945557, -0.6142085790634155, -0.5761093497276306, -0.5380101799964905, -0.49991098046302795, -0.46181178092956543, -0.4237126111984253, -0.38561341166496277, -0.34751421213150024, -0.3094150125980377, -0.2713158130645752, -0.23321664333343506, -0.19511744379997253, -0.15701824426651, -0.11891905963420868, -0.08081987500190735, -0.042720675468444824, -0.004621483385562897, 0.03347770869731903, 0.07157690078020096, 0.10967609286308289, 0.1477752923965454, 0.18587447702884674, 0.22397366166114807, 0.2620728611946106, 0.3001720607280731, 0.33827126026153564, 0.3763704299926758, 0.4144696295261383, 0.45256882905960083, 0.49066799879074097, 0.5287672281265259, 0.566866397857666, 0.6049655675888062, 0.6430647969245911, 0.6811639666557312, 0.7192631959915161, 0.7573623657226562, 0.7954615354537964, 0.8335607051849365, 0.8716599345207214, 0.9097591042518616, 0.9478583335876465, 0.9859575033187866, 1.0240566730499268, 1.0621559619903564, 1.1002551317214966, 1.1383543014526367, 1.1764534711837769]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 8.0, 8.0, 18.0, 25.0, 25.0, 13.0, 25.0, 29.0, 23.0, 29.0, 41.0, 30.0, 40.0, 39.0, 36.0, 43.0, 37.0, 41.0, 38.0, 42.0, 40.0, 35.0, 30.0, 34.0, 27.0, 24.0, 29.0, 20.0, 22.0, 18.0, 14.0, 20.0, 17.0, 8.0, 10.0, 10.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.7505302429199219, -0.727845311164856, -0.7051604390144348, -0.6824755072593689, -0.659790575504303, -0.6371057033538818, -0.6144207715988159, -0.59173583984375, -0.5690509080886841, -0.5463659763336182, -0.523681104183197, -0.5009961724281311, -0.4783112406730652, -0.45562633872032166, -0.4329414367675781, -0.4102565050125122, -0.38757163286209106, -0.36488673090934753, -0.3422017991542816, -0.3195168972015381, -0.29683196544647217, -0.27414706349372864, -0.2514621615409851, -0.22877724468708038, -0.20609232783317566, -0.18340741097927094, -0.1607224941253662, -0.13803759217262268, -0.11535267531871796, -0.09266775846481323, -0.0699828565120697, -0.04729793965816498, -0.024613022804260254, -0.0019281096756458282, 0.020756803452968597, 0.043441712856292725, 0.06612662971019745, 0.08881154656410217, 0.1114964485168457, 0.13418136537075043, 0.15686628222465515, 0.17955119907855988, 0.2022361159324646, 0.22492101788520813, 0.24760593473911285, 0.2702908515930176, 0.2929757535457611, 0.31566065549850464, 0.33834558725357056, 0.3610304892063141, 0.38371542096138, 0.40640032291412354, 0.42908525466918945, 0.451770156621933, 0.4744550585746765, 0.49713999032974243, 0.5198248624801636, 0.5425097942352295, 0.5651946663856506, 0.5878795981407166, 0.6105645298957825, 0.6332494020462036, 0.6559343338012695, 0.6786192655563354, 0.7013041973114014]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 12.0, 18.0, 21.0, 41.0, 52.0, 84.0, 159.0, 239.0, 391.0, 648.0, 1203.0, 2378.0, 5116.0, 11864.0, 31627.0, 123389.0, 3584981.0, 344376.0, 54658.0, 17906.0, 7440.0, 3432.0, 1784.0, 937.0, 558.0, 361.0, 212.0, 140.0, 81.0, 69.0, 33.0, 26.0, 21.0, 7.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2828559875488281, -0.27494049072265625, -0.2670249938964844, -0.2591094970703125, -0.2511940002441406, -0.24327850341796875, -0.23536300659179688, -0.227447509765625, -0.21953201293945312, -0.21161651611328125, -0.20370101928710938, -0.1957855224609375, -0.18787002563476562, -0.17995452880859375, -0.17203903198242188, -0.16412353515625, -0.15620803833007812, -0.14829254150390625, -0.14037704467773438, -0.1324615478515625, -0.12454605102539062, -0.11663055419921875, -0.10871505737304688, -0.100799560546875, -0.09288406372070312, -0.08496856689453125, -0.07705307006835938, -0.0691375732421875, -0.061222076416015625, -0.05330657958984375, -0.045391082763671875, -0.0374755859375, -0.029560089111328125, -0.02164459228515625, -0.013729095458984375, -0.0058135986328125, 0.002101898193359375, 0.01001739501953125, 0.017932891845703125, 0.025848388671875, 0.033763885498046875, 0.04167938232421875, 0.049594879150390625, 0.0575103759765625, 0.06542587280273438, 0.07334136962890625, 0.08125686645507812, 0.08917236328125, 0.09708786010742188, 0.10500335693359375, 0.11291885375976562, 0.1208343505859375, 0.12874984741210938, 0.13666534423828125, 0.14458084106445312, 0.152496337890625, 0.16041183471679688, 0.16832733154296875, 0.17624282836914062, 0.1841583251953125, 0.19207382202148438, 0.19998931884765625, 0.20790481567382812, 0.2158203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 9.0, 19.0, 23.0, 30.0, 35.0, 49.0, 53.0, 61.0, 71.0, 64.0, 69.0, 77.0, 63.0, 57.0, 63.0, 61.0, 45.0, 32.0, 22.0, 21.0, 25.0, 10.0, 8.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0576171875, -0.05589008331298828, -0.05416297912597656, -0.052435874938964844, -0.050708770751953125, -0.048981666564941406, -0.04725456237792969, -0.04552745819091797, -0.04380035400390625, -0.04207324981689453, -0.04034614562988281, -0.038619041442871094, -0.036891937255859375, -0.035164833068847656, -0.03343772888183594, -0.03171062469482422, -0.0299835205078125, -0.02825641632080078, -0.026529312133789062, -0.024802207946777344, -0.023075103759765625, -0.021347999572753906, -0.019620895385742188, -0.01789379119873047, -0.01616668701171875, -0.014439582824707031, -0.012712478637695312, -0.010985374450683594, -0.009258270263671875, -0.007531166076660156, -0.0058040618896484375, -0.004076957702636719, -0.002349853515625, -0.0006227493286132812, 0.0011043548583984375, 0.0028314590454101562, 0.004558563232421875, 0.006285667419433594, 0.008012771606445312, 0.009739875793457031, 0.01146697998046875, 0.013194084167480469, 0.014921188354492188, 0.016648292541503906, 0.018375396728515625, 0.020102500915527344, 0.021829605102539062, 0.02355670928955078, 0.0252838134765625, 0.02701091766357422, 0.028738021850585938, 0.030465126037597656, 0.032192230224609375, 0.033919334411621094, 0.03564643859863281, 0.03737354278564453, 0.03910064697265625, 0.04082775115966797, 0.04255485534667969, 0.044281959533691406, 0.046009063720703125, 0.047736167907714844, 0.04946327209472656, 0.05119037628173828, 0.05291748046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 13.0, 21.0, 33.0, 48.0, 60.0, 69.0, 126.0, 145.0, 217.0, 266.0, 432.0, 621.0, 919.0, 1389.0, 2478.0, 4353.0, 8451.0, 17294.0, 39472.0, 113366.0, 743228.0, 3003607.0, 163094.0, 50243.0, 21279.0, 9958.0, 5121.0, 2954.0, 1634.0, 1085.0, 733.0, 451.0, 323.0, 213.0, 174.0, 115.0, 83.0, 68.0, 41.0, 36.0, 16.0, 17.0, 8.0, 12.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2142333984375, -0.2075672149658203, -0.20090103149414062, -0.19423484802246094, -0.18756866455078125, -0.18090248107910156, -0.17423629760742188, -0.1675701141357422, -0.1609039306640625, -0.1542377471923828, -0.14757156372070312, -0.14090538024902344, -0.13423919677734375, -0.12757301330566406, -0.12090682983398438, -0.11424064636230469, -0.107574462890625, -0.10090827941894531, -0.09424209594726562, -0.08757591247558594, -0.08090972900390625, -0.07424354553222656, -0.06757736206054688, -0.06091117858886719, -0.0542449951171875, -0.04757881164550781, -0.040912628173828125, -0.03424644470214844, -0.02758026123046875, -0.020914077758789062, -0.014247894287109375, -0.0075817108154296875, -0.00091552734375, 0.0057506561279296875, 0.012416839599609375, 0.019083023071289062, 0.02574920654296875, 0.03241539001464844, 0.039081573486328125, 0.04574775695800781, 0.0524139404296875, 0.05908012390136719, 0.06574630737304688, 0.07241249084472656, 0.07907867431640625, 0.08574485778808594, 0.09241104125976562, 0.09907722473144531, 0.105743408203125, 0.11240959167480469, 0.11907577514648438, 0.12574195861816406, 0.13240814208984375, 0.13907432556152344, 0.14574050903320312, 0.1524066925048828, 0.1590728759765625, 0.1657390594482422, 0.17240524291992188, 0.17907142639160156, 0.18573760986328125, 0.19240379333496094, 0.19906997680664062, 0.2057361602783203, 0.21240234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 12.0, 17.0, 10.0, 26.0, 30.0, 34.0, 50.0, 92.0, 142.0, 318.0, 2118.0, 687.0, 215.0, 101.0, 63.0, 43.0, 27.0, 21.0, 21.0, 13.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12115478515625, -0.11722278594970703, -0.11329078674316406, -0.1093587875366211, -0.10542678833007812, -0.10149478912353516, -0.09756278991699219, -0.09363079071044922, -0.08969879150390625, -0.08576679229736328, -0.08183479309082031, -0.07790279388427734, -0.07397079467773438, -0.0700387954711914, -0.06610679626464844, -0.06217479705810547, -0.0582427978515625, -0.05431079864501953, -0.05037879943847656, -0.046446800231933594, -0.042514801025390625, -0.038582801818847656, -0.03465080261230469, -0.03071880340576172, -0.02678680419921875, -0.02285480499267578, -0.018922805786132812, -0.014990806579589844, -0.011058807373046875, -0.007126808166503906, -0.0031948089599609375, 0.0007371902465820312, 0.004669189453125, 0.008601188659667969, 0.012533187866210938, 0.016465187072753906, 0.020397186279296875, 0.024329185485839844, 0.028261184692382812, 0.03219318389892578, 0.03612518310546875, 0.04005718231201172, 0.04398918151855469, 0.047921180725097656, 0.051853179931640625, 0.055785179138183594, 0.05971717834472656, 0.06364917755126953, 0.0675811767578125, 0.07151317596435547, 0.07544517517089844, 0.0793771743774414, 0.08330917358398438, 0.08724117279052734, 0.09117317199707031, 0.09510517120361328, 0.09903717041015625, 0.10296916961669922, 0.10690116882324219, 0.11083316802978516, 0.11476516723632812, 0.1186971664428711, 0.12262916564941406, 0.12656116485595703, 0.1304931640625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 12.0, 23.0, 32.0, 58.0, 68.0, 149.0, 152.0, 155.0, 128.0, 93.0, 50.0, 34.0, 20.0, 12.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.161692500114441, -1.1336348056793213, -1.1055772304534912, -1.0775195360183716, -1.0494619607925415, -1.0214042663574219, -0.9933466911315918, -0.9652889966964722, -0.9372313618659973, -0.9091737270355225, -0.8811160922050476, -0.8530584573745728, -0.8250008225440979, -0.796943187713623, -0.7688854932785034, -0.7408278584480286, -0.7127702236175537, -0.6847125887870789, -0.656654953956604, -0.6285973191261292, -0.6005396842956543, -0.5724819898605347, -0.5444244146347046, -0.516366720199585, -0.4883091449737549, -0.46025151014328003, -0.4321938753128052, -0.4041362404823303, -0.3760785758495331, -0.3480209410190582, -0.3199633061885834, -0.29190564155578613, -0.2638480067253113, -0.23579037189483643, -0.20773272216320038, -0.17967508733272552, -0.15161743760108948, -0.12355980277061462, -0.09550216794013977, -0.06744451820850372, -0.03938688337802887, -0.011329242959618568, 0.016728397458791733, 0.044786036014556885, 0.07284367829561234, 0.10090132057666779, 0.12895895540714264, 0.1570166051387787, 0.18507423996925354, 0.2131318747997284, 0.24118952453136444, 0.2692471742630005, 0.29730480909347534, 0.3253624439239502, 0.35342007875442505, 0.3814777135848999, 0.40953534841537476, 0.4375929832458496, 0.46565061807632446, 0.4937082529067993, 0.5217658877372742, 0.549823522567749, 0.5778812170028687, 0.6059388518333435, 0.6339964866638184]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 16.0, 8.0, 13.0, 13.0, 16.0, 18.0, 28.0, 29.0, 30.0, 36.0, 41.0, 30.0, 30.0, 33.0, 44.0, 39.0, 44.0, 24.0, 43.0, 39.0, 41.0, 46.0, 32.0, 32.0, 34.0, 35.0, 27.0, 12.0, 23.0, 20.0, 17.0, 20.0, 11.0, 13.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31650543212890625, -0.3055785298347473, -0.29465165734291077, -0.28372475504875183, -0.2727978527545929, -0.26187095046043396, -0.2509440779685974, -0.24001717567443848, -0.22909027338027954, -0.2181633859872818, -0.20723648369312286, -0.19630959630012512, -0.1853826940059662, -0.17445580661296844, -0.1635289192199707, -0.15260201692581177, -0.14167512953281403, -0.13074824213981628, -0.11982133984565735, -0.1088944524526596, -0.09796755015850067, -0.08704066276550293, -0.07611376792192459, -0.06518687307834625, -0.054259978234767914, -0.043333083391189575, -0.03240618854761124, -0.021479297429323196, -0.010552402585744858, 0.00037449225783348083, 0.011301383376121521, 0.02222827821969986, 0.0331551730632782, 0.04408206790685654, 0.055008962750434875, 0.06593585014343262, 0.07686275243759155, 0.0877896398305893, 0.09871653467416763, 0.10964342951774597, 0.12057032436132431, 0.13149721920490265, 0.1424241065979004, 0.15335100889205933, 0.16427789628505707, 0.175204798579216, 0.18613168597221375, 0.19705858826637268, 0.20798547565937042, 0.21891236305236816, 0.2298392653465271, 0.24076615273952484, 0.2516930401325226, 0.2626199424266815, 0.27354684472084045, 0.284473717212677, 0.29540061950683594, 0.3063275218009949, 0.3172543942928314, 0.32818129658699036, 0.3391081988811493, 0.3500351011753082, 0.3609619736671448, 0.3718888759613037, 0.38281577825546265]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 7.0, 20.0, 35.0, 45.0, 83.0, 114.0, 190.0, 340.0, 628.0, 1089.0, 1839.0, 3468.0, 6724.0, 13066.0, 25445.0, 51796.0, 109006.0, 252804.0, 312747.0, 138824.0, 64764.0, 31834.0, 15997.0, 8267.0, 4160.0, 2236.0, 1230.0, 684.0, 407.0, 237.0, 136.0, 119.0, 62.0, 52.0, 25.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12616539001464844, -0.12183761596679688, -0.11750984191894531, -0.11318206787109375, -0.10885429382324219, -0.10452651977539062, -0.10019874572753906, -0.0958709716796875, -0.09154319763183594, -0.08721542358398438, -0.08288764953613281, -0.07855987548828125, -0.07423210144042969, -0.06990432739257812, -0.06557655334472656, -0.061248779296875, -0.05692100524902344, -0.052593231201171875, -0.04826545715332031, -0.04393768310546875, -0.03960990905761719, -0.035282135009765625, -0.030954360961914062, -0.0266265869140625, -0.022298812866210938, -0.017971038818359375, -0.013643264770507812, -0.00931549072265625, -0.0049877166748046875, -0.000659942626953125, 0.0036678314208984375, 0.00799560546875, 0.012323379516601562, 0.016651153564453125, 0.020978927612304688, 0.02530670166015625, 0.029634475708007812, 0.033962249755859375, 0.03829002380371094, 0.0426177978515625, 0.04694557189941406, 0.051273345947265625, 0.05560111999511719, 0.05992889404296875, 0.06425666809082031, 0.06858444213867188, 0.07291221618652344, 0.077239990234375, 0.08156776428222656, 0.08589553833007812, 0.09022331237792969, 0.09455108642578125, 0.09887886047363281, 0.10320663452148438, 0.10753440856933594, 0.1118621826171875, 0.11618995666503906, 0.12051773071289062, 0.12484550476074219, 0.12917327880859375, 0.1335010528564453, 0.13782882690429688, 0.14215660095214844, 0.146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 26.0, 28.0, 45.0, 32.0, 45.0, 43.0, 42.0, 45.0, 60.0, 59.0, 57.0, 51.0, 50.0, 55.0, 53.0, 50.0, 43.0, 27.0, 31.0, 22.0, 18.0, 25.0, 12.0, 8.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.054351806640625, -0.05274486541748047, -0.05113792419433594, -0.049530982971191406, -0.047924041748046875, -0.046317100524902344, -0.04471015930175781, -0.04310321807861328, -0.04149627685546875, -0.03988933563232422, -0.03828239440917969, -0.036675453186035156, -0.035068511962890625, -0.033461570739746094, -0.03185462951660156, -0.03024768829345703, -0.0286407470703125, -0.02703380584716797, -0.025426864624023438, -0.023819923400878906, -0.022212982177734375, -0.020606040954589844, -0.018999099731445312, -0.01739215850830078, -0.01578521728515625, -0.014178276062011719, -0.012571334838867188, -0.010964393615722656, -0.009357452392578125, -0.007750511169433594, -0.0061435699462890625, -0.004536628723144531, -0.0029296875, -0.0013227462768554688, 0.0002841949462890625, 0.0018911361694335938, 0.003498077392578125, 0.005105018615722656, 0.0067119598388671875, 0.008318901062011719, 0.00992584228515625, 0.011532783508300781, 0.013139724731445312, 0.014746665954589844, 0.016353607177734375, 0.017960548400878906, 0.019567489624023438, 0.02117443084716797, 0.0227813720703125, 0.02438831329345703, 0.025995254516601562, 0.027602195739746094, 0.029209136962890625, 0.030816078186035156, 0.03242301940917969, 0.03402996063232422, 0.03563690185546875, 0.03724384307861328, 0.03885078430175781, 0.040457725524902344, 0.042064666748046875, 0.043671607971191406, 0.04527854919433594, 0.04688549041748047, 0.048492431640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 5.0, 10.0, 14.0, 25.0, 36.0, 53.0, 71.0, 127.0, 210.0, 351.0, 600.0, 1218.0, 2775.0, 7222.0, 24065.0, 91723.0, 486394.0, 334972.0, 69317.0, 18767.0, 5924.0, 2254.0, 970.0, 524.0, 301.0, 214.0, 128.0, 86.0, 50.0, 37.0, 26.0, 22.0, 17.0, 11.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24074363708496094, -0.23319625854492188, -0.2256488800048828, -0.21810150146484375, -0.2105541229248047, -0.20300674438476562, -0.19545936584472656, -0.1879119873046875, -0.18036460876464844, -0.17281723022460938, -0.1652698516845703, -0.15772247314453125, -0.1501750946044922, -0.14262771606445312, -0.13508033752441406, -0.127532958984375, -0.11998558044433594, -0.11243820190429688, -0.10489082336425781, -0.09734344482421875, -0.08979606628417969, -0.08224868774414062, -0.07470130920410156, -0.0671539306640625, -0.05960655212402344, -0.052059173583984375, -0.04451179504394531, -0.03696441650390625, -0.029417037963867188, -0.021869659423828125, -0.014322280883789062, -0.00677490234375, 0.0007724761962890625, 0.008319854736328125, 0.015867233276367188, 0.02341461181640625, 0.030961990356445312, 0.038509368896484375, 0.04605674743652344, 0.0536041259765625, 0.06115150451660156, 0.06869888305664062, 0.07624626159667969, 0.08379364013671875, 0.09134101867675781, 0.09888839721679688, 0.10643577575683594, 0.113983154296875, 0.12153053283691406, 0.12907791137695312, 0.1366252899169922, 0.14417266845703125, 0.1517200469970703, 0.15926742553710938, 0.16681480407714844, 0.1743621826171875, 0.18190956115722656, 0.18945693969726562, 0.1970043182373047, 0.20455169677734375, 0.2120990753173828, 0.21964645385742188, 0.22719383239746094, 0.2347412109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 8.0, 12.0, 10.0, 7.0, 19.0, 12.0, 25.0, 23.0, 26.0, 37.0, 57.0, 40.0, 35.0, 52.0, 58.0, 51.0, 47.0, 45.0, 33.0, 45.0, 40.0, 43.0, 31.0, 49.0, 29.0, 29.0, 24.0, 14.0, 20.0, 14.0, 14.0, 10.0, 5.0, 2.0, 8.0, 4.0, 2.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2196044921875, -0.21320533752441406, -0.20680618286132812, -0.2004070281982422, -0.19400787353515625, -0.1876087188720703, -0.18120956420898438, -0.17481040954589844, -0.1684112548828125, -0.16201210021972656, -0.15561294555664062, -0.1492137908935547, -0.14281463623046875, -0.1364154815673828, -0.13001632690429688, -0.12361717224121094, -0.117218017578125, -0.11081886291503906, -0.10441970825195312, -0.09802055358886719, -0.09162139892578125, -0.08522224426269531, -0.07882308959960938, -0.07242393493652344, -0.0660247802734375, -0.05962562561035156, -0.053226470947265625, -0.04682731628417969, -0.04042816162109375, -0.03402900695800781, -0.027629852294921875, -0.021230697631835938, -0.01483154296875, -0.008432388305664062, -0.002033233642578125, 0.0043659210205078125, 0.01076507568359375, 0.017164230346679688, 0.023563385009765625, 0.029962539672851562, 0.0363616943359375, 0.04276084899902344, 0.049160003662109375, 0.05555915832519531, 0.06195831298828125, 0.06835746765136719, 0.07475662231445312, 0.08115577697753906, 0.087554931640625, 0.09395408630371094, 0.10035324096679688, 0.10675239562988281, 0.11315155029296875, 0.11955070495605469, 0.12594985961914062, 0.13234901428222656, 0.1387481689453125, 0.14514732360839844, 0.15154647827148438, 0.1579456329345703, 0.16434478759765625, 0.1707439422607422, 0.17714309692382812, 0.18354225158691406, 0.18994140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 9.0, 19.0, 27.0, 40.0, 59.0, 106.0, 152.0, 253.0, 388.0, 727.0, 1181.0, 2038.0, 4223.0, 11128.0, 41627.0, 227062.0, 613252.0, 109024.0, 22895.0, 7258.0, 3009.0, 1662.0, 944.0, 541.0, 349.0, 224.0, 121.0, 69.0, 61.0, 29.0, 20.0, 9.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13259315490722656, -0.12773513793945312, -0.12287712097167969, -0.11801910400390625, -0.11316108703613281, -0.10830307006835938, -0.10344505310058594, -0.0985870361328125, -0.09372901916503906, -0.08887100219726562, -0.08401298522949219, -0.07915496826171875, -0.07429695129394531, -0.06943893432617188, -0.06458091735839844, -0.059722900390625, -0.05486488342285156, -0.050006866455078125, -0.04514884948730469, -0.04029083251953125, -0.03543281555175781, -0.030574798583984375, -0.025716781616210938, -0.0208587646484375, -0.016000747680664062, -0.011142730712890625, -0.0062847137451171875, -0.00142669677734375, 0.0034313201904296875, 0.008289337158203125, 0.013147354125976562, 0.01800537109375, 0.022863388061523438, 0.027721405029296875, 0.03257942199707031, 0.03743743896484375, 0.04229545593261719, 0.047153472900390625, 0.05201148986816406, 0.0568695068359375, 0.06172752380371094, 0.06658554077148438, 0.07144355773925781, 0.07630157470703125, 0.08115959167480469, 0.08601760864257812, 0.09087562561035156, 0.095733642578125, 0.10059165954589844, 0.10544967651367188, 0.11030769348144531, 0.11516571044921875, 0.12002372741699219, 0.12488174438476562, 0.12973976135253906, 0.1345977783203125, 0.13945579528808594, 0.14431381225585938, 0.1491718292236328, 0.15402984619140625, 0.1588878631591797, 0.16374588012695312, 0.16860389709472656, 0.1734619140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 9.0, 14.0, 15.0, 23.0, 37.0, 51.0, 43.0, 94.0, 97.0, 148.0, 124.0, 106.0, 73.0, 40.0, 37.0, 33.0, 16.0, 13.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.898143768310547e-05, -3.726687282323837e-05, -3.555230796337128e-05, -3.383774310350418e-05, -3.2123178243637085e-05, -3.040861338376999e-05, -2.8694048523902893e-05, -2.6979483664035797e-05, -2.52649188041687e-05, -2.3550353944301605e-05, -2.183578908443451e-05, -2.0121224224567413e-05, -1.8406659364700317e-05, -1.669209450483322e-05, -1.4977529644966125e-05, -1.326296478509903e-05, -1.1548399925231934e-05, -9.833835065364838e-06, -8.119270205497742e-06, -6.404705345630646e-06, -4.69014048576355e-06, -2.975575625896454e-06, -1.261010766029358e-06, 4.5355409383773804e-07, 2.168118953704834e-06, 3.88268381357193e-06, 5.597248673439026e-06, 7.311813533306122e-06, 9.026378393173218e-06, 1.0740943253040314e-05, 1.245550811290741e-05, 1.4170072972774506e-05, 1.58846378326416e-05, 1.7599202692508698e-05, 1.9313767552375793e-05, 2.102833241224289e-05, 2.2742897272109985e-05, 2.445746213197708e-05, 2.6172026991844177e-05, 2.7886591851711273e-05, 2.960115671157837e-05, 3.1315721571445465e-05, 3.303028643131256e-05, 3.474485129117966e-05, 3.645941615104675e-05, 3.817398101091385e-05, 3.9888545870780945e-05, 4.160311073064804e-05, 4.331767559051514e-05, 4.503224045038223e-05, 4.674680531024933e-05, 4.8461370170116425e-05, 5.017593502998352e-05, 5.1890499889850616e-05, 5.360506474971771e-05, 5.531962960958481e-05, 5.7034194469451904e-05, 5.8748759329319e-05, 6.0463324189186096e-05, 6.217788904905319e-05, 6.389245390892029e-05, 6.560701876878738e-05, 6.732158362865448e-05, 6.903614848852158e-05, 7.075071334838867e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 9.0, 23.0, 36.0, 36.0, 58.0, 95.0, 149.0, 291.0, 466.0, 890.0, 1909.0, 4732.0, 15789.0, 103154.0, 708570.0, 178361.0, 23384.0, 5978.0, 2238.0, 1040.0, 523.0, 284.0, 163.0, 119.0, 63.0, 51.0, 40.0, 28.0, 17.0, 9.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.20532989501953125, -0.1986236572265625, -0.19191741943359375, -0.185211181640625, -0.17850494384765625, -0.1717987060546875, -0.16509246826171875, -0.15838623046875, -0.15167999267578125, -0.1449737548828125, -0.13826751708984375, -0.131561279296875, -0.12485504150390625, -0.1181488037109375, -0.11144256591796875, -0.104736328125, -0.09803009033203125, -0.0913238525390625, -0.08461761474609375, -0.077911376953125, -0.07120513916015625, -0.0644989013671875, -0.05779266357421875, -0.05108642578125, -0.04438018798828125, -0.0376739501953125, -0.03096771240234375, -0.024261474609375, -0.01755523681640625, -0.0108489990234375, -0.00414276123046875, 0.0025634765625, 0.00926971435546875, 0.0159759521484375, 0.02268218994140625, 0.029388427734375, 0.03609466552734375, 0.0428009033203125, 0.04950714111328125, 0.05621337890625, 0.06291961669921875, 0.0696258544921875, 0.07633209228515625, 0.083038330078125, 0.08974456787109375, 0.0964508056640625, 0.10315704345703125, 0.10986328125, 0.11656951904296875, 0.1232757568359375, 0.12998199462890625, 0.136688232421875, 0.14339447021484375, 0.1501007080078125, 0.15680694580078125, 0.16351318359375, 0.17021942138671875, 0.1769256591796875, 0.18363189697265625, 0.190338134765625, 0.19704437255859375, 0.2037506103515625, 0.21045684814453125, 0.2171630859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 9.0, 9.0, 21.0, 32.0, 45.0, 66.0, 111.0, 178.0, 192.0, 117.0, 74.0, 56.0, 20.0, 23.0, 9.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27978515625, -0.2729530334472656, -0.26612091064453125, -0.2592887878417969, -0.2524566650390625, -0.24562454223632812, -0.23879241943359375, -0.23196029663085938, -0.225128173828125, -0.21829605102539062, -0.21146392822265625, -0.20463180541992188, -0.1977996826171875, -0.19096755981445312, -0.18413543701171875, -0.17730331420898438, -0.17047119140625, -0.16363906860351562, -0.15680694580078125, -0.14997482299804688, -0.1431427001953125, -0.13631057739257812, -0.12947845458984375, -0.12264633178710938, -0.115814208984375, -0.10898208618164062, -0.10214996337890625, -0.09531784057617188, -0.0884857177734375, -0.08165359497070312, -0.07482147216796875, -0.06798934936523438, -0.0611572265625, -0.054325103759765625, -0.04749298095703125, -0.040660858154296875, -0.0338287353515625, -0.026996612548828125, -0.02016448974609375, -0.013332366943359375, -0.006500244140625, 0.000331878662109375, 0.00716400146484375, 0.013996124267578125, 0.0208282470703125, 0.027660369873046875, 0.03449249267578125, 0.041324615478515625, 0.04815673828125, 0.054988861083984375, 0.06182098388671875, 0.06865310668945312, 0.0754852294921875, 0.08231735229492188, 0.08914947509765625, 0.09598159790039062, 0.102813720703125, 0.10964584350585938, 0.11647796630859375, 0.12331008911132812, 0.1301422119140625, 0.13697433471679688, 0.14380645751953125, 0.15063858032226562, 0.157470703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 11.0, 4.0, 19.0, 28.0, 68.0, 98.0, 130.0, 153.0, 170.0, 121.0, 97.0, 53.0, 21.0, 17.0, 10.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9270260334014893, -0.8544597625732422, -0.7818934321403503, -0.7093271017074585, -0.6367608308792114, -0.5641945600509644, -0.4916282296180725, -0.41906189918518066, -0.3464956283569336, -0.27392932772636414, -0.20136302709579468, -0.12879672646522522, -0.05623042583465576, 0.016335874795913696, 0.08890217542648315, 0.161468505859375, 0.23403477668762207, 0.30660107731819153, 0.379167377948761, 0.45173367857933044, 0.5242999792098999, 0.596866250038147, 0.6694325804710388, 0.7419989109039307, 0.8145651817321777, 0.8871314525604248, 0.9596977829933167, 1.0322641134262085, 1.1048303842544556, 1.1773966550827026, 1.2499630451202393, 1.3225293159484863, 1.3950955867767334, 1.4676618576049805, 1.5402281284332275, 1.6127945184707642, 1.6853607892990112, 1.7579270601272583, 1.830493450164795, 1.903059720993042, 1.975625991821289, 2.048192262649536, 2.120758533477783, 2.1933248043060303, 2.2658910751342773, 2.3384575843811035, 2.4110238552093506, 2.4835901260375977, 2.5561563968658447, 2.628722667694092, 2.701288938522339, 2.773855209350586, 2.846421718597412, 2.918987989425659, 2.9915542602539062, 3.0641205310821533, 3.1366868019104004, 3.2092530727386475, 3.2818193435668945, 3.3543856143951416, 3.4269518852233887, 3.499518394470215, 3.572084665298462, 3.644650936126709, 3.717217206954956]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 15.0, 7.0, 18.0, 14.0, 17.0, 26.0, 26.0, 24.0, 34.0, 39.0, 42.0, 42.0, 45.0, 37.0, 45.0, 31.0, 43.0, 37.0, 51.0, 45.0, 39.0, 43.0, 31.0, 37.0, 25.0, 29.0, 19.0, 16.0, 13.0, 14.0, 11.0, 8.0, 10.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9620654582977295, -0.9291619658470154, -0.8962584733963013, -0.8633549213409424, -0.8304514288902283, -0.7975479364395142, -0.7646444439888, -0.7317409515380859, -0.698837399482727, -0.6659339070320129, -0.6330304145812988, -0.6001268625259399, -0.5672233700752258, -0.5343198776245117, -0.5014163851737976, -0.4685128927230835, -0.4356094002723694, -0.4027059078216553, -0.3698023855686188, -0.33689889311790466, -0.30399537086486816, -0.27109187841415405, -0.23818838596343994, -0.20528487861156464, -0.17238137125968933, -0.13947786390781403, -0.10657436400651932, -0.07367086410522461, -0.040767356753349304, -0.007863849401473999, 0.025039643049240112, 0.05794315040111542, 0.09084665775299072, 0.12375016510486603, 0.15665367245674133, 0.18955716490745544, 0.22246067225933075, 0.25536417961120605, 0.28826767206192017, 0.3211711645126343, 0.3540746867656708, 0.3869781792163849, 0.4198817014694214, 0.4527851939201355, 0.4856886863708496, 0.5185922384262085, 0.5514956712722778, 0.5843992233276367, 0.6173027157783508, 0.6502062082290649, 0.683109700679779, 0.7160131931304932, 0.748916745185852, 0.7818202376365662, 0.8147237300872803, 0.8476272225379944, 0.8805307149887085, 0.9134342074394226, 0.9463376998901367, 0.9792412519454956, 1.012144684791565, 1.0450482368469238, 1.0779516696929932, 1.110855221748352, 1.143758773803711]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 16.0, 16.0, 17.0, 28.0, 42.0, 56.0, 107.0, 162.0, 234.0, 376.0, 664.0, 1021.0, 1724.0, 3162.0, 6151.0, 12557.0, 28354.0, 82759.0, 571115.0, 3267357.0, 143995.0, 40657.0, 16332.0, 7868.0, 4061.0, 2180.0, 1252.0, 746.0, 436.0, 292.0, 199.0, 104.0, 81.0, 54.0, 35.0, 16.0, 17.0, 15.0, 8.0, 11.0, 4.0, 3.0, 2.0, 4.0], "bins": [-0.255126953125, -0.24861717224121094, -0.24210739135742188, -0.2355976104736328, -0.22908782958984375, -0.2225780487060547, -0.21606826782226562, -0.20955848693847656, -0.2030487060546875, -0.19653892517089844, -0.19002914428710938, -0.1835193634033203, -0.17700958251953125, -0.1704998016357422, -0.16399002075195312, -0.15748023986816406, -0.150970458984375, -0.14446067810058594, -0.13795089721679688, -0.1314411163330078, -0.12493133544921875, -0.11842155456542969, -0.11191177368164062, -0.10540199279785156, -0.0988922119140625, -0.09238243103027344, -0.08587265014648438, -0.07936286926269531, -0.07285308837890625, -0.06634330749511719, -0.059833526611328125, -0.05332374572753906, -0.04681396484375, -0.04030418395996094, -0.033794403076171875, -0.027284622192382812, -0.02077484130859375, -0.014265060424804688, -0.007755279541015625, -0.0012454986572265625, 0.0052642822265625, 0.011774063110351562, 0.018283843994140625, 0.024793624877929688, 0.03130340576171875, 0.03781318664550781, 0.044322967529296875, 0.05083274841308594, 0.057342529296875, 0.06385231018066406, 0.07036209106445312, 0.07687187194824219, 0.08338165283203125, 0.08989143371582031, 0.09640121459960938, 0.10291099548339844, 0.1094207763671875, 0.11593055725097656, 0.12244033813476562, 0.1289501190185547, 0.13545989990234375, 0.1419696807861328, 0.14847946166992188, 0.15498924255371094, 0.1614990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 19.0, 16.0, 25.0, 12.0, 25.0, 40.0, 46.0, 43.0, 63.0, 56.0, 55.0, 49.0, 58.0, 79.0, 64.0, 56.0, 39.0, 42.0, 40.0, 30.0, 36.0, 24.0, 18.0, 11.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061676025390625, -0.05984067916870117, -0.058005332946777344, -0.056169986724853516, -0.05433464050292969, -0.05249929428100586, -0.05066394805908203, -0.0488286018371582, -0.046993255615234375, -0.04515790939331055, -0.04332256317138672, -0.04148721694946289, -0.03965187072753906, -0.037816524505615234, -0.035981178283691406, -0.03414583206176758, -0.03231048583984375, -0.030475139617919922, -0.028639793395996094, -0.026804447174072266, -0.024969100952148438, -0.02313375473022461, -0.02129840850830078, -0.019463062286376953, -0.017627716064453125, -0.015792369842529297, -0.013957023620605469, -0.01212167739868164, -0.010286331176757812, -0.008450984954833984, -0.006615638732910156, -0.004780292510986328, -0.0029449462890625, -0.0011096000671386719, 0.0007257461547851562, 0.0025610923767089844, 0.0043964385986328125, 0.006231784820556641, 0.008067131042480469, 0.009902477264404297, 0.011737823486328125, 0.013573169708251953, 0.015408515930175781, 0.01724386215209961, 0.019079208374023438, 0.020914554595947266, 0.022749900817871094, 0.024585247039794922, 0.02642059326171875, 0.028255939483642578, 0.030091285705566406, 0.031926631927490234, 0.03376197814941406, 0.03559732437133789, 0.03743267059326172, 0.03926801681518555, 0.041103363037109375, 0.0429387092590332, 0.04477405548095703, 0.04660940170288086, 0.04844474792480469, 0.050280094146728516, 0.052115440368652344, 0.05395078659057617, 0.0557861328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 12.0, 10.0, 12.0, 8.0, 16.0, 21.0, 25.0, 42.0, 40.0, 69.0, 131.0, 192.0, 305.0, 625.0, 1363.0, 3455.0, 9920.0, 35411.0, 200222.0, 3631619.0, 252758.0, 40050.0, 11123.0, 3675.0, 1568.0, 657.0, 370.0, 192.0, 128.0, 70.0, 46.0, 29.0, 32.0, 20.0, 9.0, 16.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.455078125, -0.4422760009765625, -0.429473876953125, -0.4166717529296875, -0.40386962890625, -0.3910675048828125, -0.378265380859375, -0.3654632568359375, -0.3526611328125, -0.3398590087890625, -0.327056884765625, -0.3142547607421875, -0.30145263671875, -0.2886505126953125, -0.275848388671875, -0.2630462646484375, -0.250244140625, -0.2374420166015625, -0.224639892578125, -0.2118377685546875, -0.19903564453125, -0.1862335205078125, -0.173431396484375, -0.1606292724609375, -0.1478271484375, -0.1350250244140625, -0.122222900390625, -0.1094207763671875, -0.09661865234375, -0.0838165283203125, -0.071014404296875, -0.0582122802734375, -0.04541015625, -0.0326080322265625, -0.019805908203125, -0.0070037841796875, 0.00579833984375, 0.0186004638671875, 0.031402587890625, 0.0442047119140625, 0.0570068359375, 0.0698089599609375, 0.082611083984375, 0.0954132080078125, 0.10821533203125, 0.1210174560546875, 0.133819580078125, 0.1466217041015625, 0.159423828125, 0.1722259521484375, 0.185028076171875, 0.1978302001953125, 0.21063232421875, 0.2234344482421875, 0.236236572265625, 0.2490386962890625, 0.2618408203125, 0.2746429443359375, 0.287445068359375, 0.3002471923828125, 0.31304931640625, 0.3258514404296875, 0.338653564453125, 0.3514556884765625, 0.3642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 10.0, 17.0, 24.0, 28.0, 37.0, 53.0, 93.0, 226.0, 715.0, 2069.0, 362.0, 173.0, 99.0, 53.0, 37.0, 28.0, 15.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11446571350097656, -0.10820388793945312, -0.10194206237792969, -0.09568023681640625, -0.08941841125488281, -0.08315658569335938, -0.07689476013183594, -0.0706329345703125, -0.06437110900878906, -0.058109283447265625, -0.05184745788574219, -0.04558563232421875, -0.03932380676269531, -0.033061981201171875, -0.026800155639648438, -0.020538330078125, -0.014276504516601562, -0.008014678955078125, -0.0017528533935546875, 0.00450897216796875, 0.010770797729492188, 0.017032623291015625, 0.023294448852539062, 0.0295562744140625, 0.03581809997558594, 0.042079925537109375, 0.04834175109863281, 0.05460357666015625, 0.06086540222167969, 0.06712722778320312, 0.07338905334472656, 0.07965087890625, 0.08591270446777344, 0.09217453002929688, 0.09843635559082031, 0.10469818115234375, 0.11096000671386719, 0.11722183227539062, 0.12348365783691406, 0.1297454833984375, 0.13600730895996094, 0.14226913452148438, 0.1485309600830078, 0.15479278564453125, 0.1610546112060547, 0.16731643676757812, 0.17357826232910156, 0.179840087890625, 0.18610191345214844, 0.19236373901367188, 0.1986255645751953, 0.20488739013671875, 0.2111492156982422, 0.21741104125976562, 0.22367286682128906, 0.2299346923828125, 0.23619651794433594, 0.24245834350585938, 0.2487201690673828, 0.25498199462890625, 0.2612438201904297, 0.2675056457519531, 0.27376747131347656, 0.280029296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 16.0, 24.0, 50.0, 65.0, 96.0, 108.0, 140.0, 148.0, 101.0, 77.0, 41.0, 44.0, 25.0, 20.0, 10.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3025517463684082, -1.2696025371551514, -1.2366533279418945, -1.2037042379379272, -1.1707550287246704, -1.1378058195114136, -1.1048566102981567, -1.0719074010849, -1.0389583110809326, -1.0060091018676758, -0.9730599522590637, -0.9401107430458069, -0.9071615934371948, -0.874212384223938, -0.8412631750106812, -0.8083139657974243, -0.7753647565841675, -0.7424155473709106, -0.7094663977622986, -0.6765171885490417, -0.6435680389404297, -0.6106188297271729, -0.577669620513916, -0.5447204113006592, -0.5117712616920471, -0.47882208228111267, -0.4458729028701782, -0.4129236936569214, -0.37997451424598694, -0.3470253348350525, -0.31407612562179565, -0.2811269462108612, -0.2481778860092163, -0.21522870659828186, -0.18227951228618622, -0.14933031797409058, -0.11638113856315613, -0.08343195915222168, -0.05048276484012604, -0.017533570528030396, 0.015415608882904053, 0.0483647957444191, 0.08131398260593414, 0.11426316946744919, 0.14721235632896423, 0.18016153573989868, 0.21311073005199432, 0.24605992436408997, 0.2790091037750244, 0.31195828318595886, 0.3449074625968933, 0.37785667181015015, 0.4108058512210846, 0.44375503063201904, 0.4767042398452759, 0.5096534490585327, 0.5426025986671448, 0.5755518078804016, 0.6085009574890137, 0.6414501667022705, 0.6743993759155273, 0.7073485255241394, 0.7402977347373962, 0.7732468843460083, 0.8061960935592651]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 14.0, 11.0, 16.0, 27.0, 20.0, 30.0, 19.0, 23.0, 29.0, 30.0, 35.0, 49.0, 46.0, 32.0, 40.0, 44.0, 45.0, 53.0, 36.0, 39.0, 52.0, 40.0, 46.0, 28.0, 18.0, 19.0, 14.0, 17.0, 25.0, 18.0, 12.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5119866728782654, -0.49630919098854065, -0.4806317090988159, -0.4649542570114136, -0.44927677512168884, -0.4335992932319641, -0.41792184114456177, -0.40224435925483704, -0.3865668773651123, -0.3708893954753876, -0.35521191358566284, -0.3395344614982605, -0.32385697960853577, -0.30817949771881104, -0.2925020456314087, -0.27682456374168396, -0.26114708185195923, -0.2454695999622345, -0.22979213297367096, -0.21411466598510742, -0.1984371840953827, -0.18275970220565796, -0.16708223521709442, -0.15140476822853088, -0.13572728633880615, -0.12004981189966202, -0.10437233746051788, -0.08869486302137375, -0.07301738858222961, -0.05733991414308548, -0.041662439703941345, -0.02598496526479721, -0.010307550430297852, 0.005369924008846283, 0.021047398447990417, 0.03672487288713455, 0.052402347326278687, 0.06807982176542282, 0.08375729620456696, 0.09943477064371109, 0.11511224508285522, 0.13078972697257996, 0.1464671939611435, 0.16214466094970703, 0.17782214283943176, 0.1934996247291565, 0.20917709171772003, 0.22485455870628357, 0.2405320405960083, 0.25620952248573303, 0.27188700437545776, 0.2875644564628601, 0.30324193835258484, 0.31891942024230957, 0.3345968723297119, 0.35027435421943665, 0.3659518361091614, 0.3816293179988861, 0.39730679988861084, 0.4129842519760132, 0.4286617338657379, 0.44433921575546265, 0.460016667842865, 0.4756941497325897, 0.49137163162231445]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 10.0, 26.0, 37.0, 65.0, 111.0, 172.0, 314.0, 422.0, 814.0, 1410.0, 2691.0, 5175.0, 10372.0, 21409.0, 46179.0, 104629.0, 225853.0, 295772.0, 181743.0, 80579.0, 36095.0, 16982.0, 8356.0, 4206.0, 2260.0, 1201.0, 674.0, 394.0, 240.0, 140.0, 93.0, 52.0, 31.0, 15.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1383838653564453, -0.13382339477539062, -0.12926292419433594, -0.12470245361328125, -0.12014198303222656, -0.11558151245117188, -0.11102104187011719, -0.1064605712890625, -0.10190010070800781, -0.09733963012695312, -0.09277915954589844, -0.08821868896484375, -0.08365821838378906, -0.07909774780273438, -0.07453727722167969, -0.069976806640625, -0.06541633605957031, -0.060855865478515625, -0.05629539489746094, -0.05173492431640625, -0.04717445373535156, -0.042613983154296875, -0.03805351257324219, -0.0334930419921875, -0.028932571411132812, -0.024372100830078125, -0.019811630249023438, -0.01525115966796875, -0.010690689086914062, -0.006130218505859375, -0.0015697479248046875, 0.00299072265625, 0.0075511932373046875, 0.012111663818359375, 0.016672134399414062, 0.02123260498046875, 0.025793075561523438, 0.030353546142578125, 0.03491401672363281, 0.0394744873046875, 0.04403495788574219, 0.048595428466796875, 0.05315589904785156, 0.05771636962890625, 0.06227684020996094, 0.06683731079101562, 0.07139778137207031, 0.075958251953125, 0.08051872253417969, 0.08507919311523438, 0.08963966369628906, 0.09420013427734375, 0.09876060485839844, 0.10332107543945312, 0.10788154602050781, 0.1124420166015625, 0.11700248718261719, 0.12156295776367188, 0.12612342834472656, 0.13068389892578125, 0.13524436950683594, 0.13980484008789062, 0.1443653106689453, 0.14892578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 9.0, 10.0, 11.0, 18.0, 14.0, 16.0, 22.0, 22.0, 35.0, 44.0, 54.0, 47.0, 47.0, 48.0, 52.0, 64.0, 62.0, 47.0, 52.0, 61.0, 47.0, 29.0, 30.0, 28.0, 22.0, 23.0, 16.0, 22.0, 7.0, 9.0, 11.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053253173828125, -0.0514674186706543, -0.049681663513183594, -0.04789590835571289, -0.04611015319824219, -0.044324398040771484, -0.04253864288330078, -0.04075288772583008, -0.038967132568359375, -0.03718137741088867, -0.03539562225341797, -0.033609867095947266, -0.03182411193847656, -0.03003835678100586, -0.028252601623535156, -0.026466846466064453, -0.02468109130859375, -0.022895336151123047, -0.021109580993652344, -0.01932382583618164, -0.017538070678710938, -0.015752315521240234, -0.013966560363769531, -0.012180805206298828, -0.010395050048828125, -0.008609294891357422, -0.006823539733886719, -0.005037784576416016, -0.0032520294189453125, -0.0014662742614746094, 0.00031948089599609375, 0.002105236053466797, 0.0038909912109375, 0.005676746368408203, 0.007462501525878906, 0.00924825668334961, 0.011034011840820312, 0.012819766998291016, 0.014605522155761719, 0.016391277313232422, 0.018177032470703125, 0.019962787628173828, 0.02174854278564453, 0.023534297943115234, 0.025320053100585938, 0.02710580825805664, 0.028891563415527344, 0.030677318572998047, 0.03246307373046875, 0.03424882888793945, 0.036034584045410156, 0.03782033920288086, 0.03960609436035156, 0.041391849517822266, 0.04317760467529297, 0.04496335983276367, 0.046749114990234375, 0.04853487014770508, 0.05032062530517578, 0.052106380462646484, 0.05389213562011719, 0.05567789077758789, 0.057463645935058594, 0.0592494010925293, 0.06103515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 12.0, 18.0, 11.0, 20.0, 27.0, 34.0, 53.0, 71.0, 118.0, 206.0, 386.0, 593.0, 1374.0, 3443.0, 10386.0, 39918.0, 193196.0, 556755.0, 186670.0, 38916.0, 10153.0, 3300.0, 1325.0, 642.0, 327.0, 209.0, 118.0, 68.0, 53.0, 37.0, 29.0, 10.0, 15.0, 12.0, 3.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.2097339630126953, -0.20181655883789062, -0.19389915466308594, -0.18598175048828125, -0.17806434631347656, -0.17014694213867188, -0.1622295379638672, -0.1543121337890625, -0.1463947296142578, -0.13847732543945312, -0.13055992126464844, -0.12264251708984375, -0.11472511291503906, -0.10680770874023438, -0.09889030456542969, -0.090972900390625, -0.08305549621582031, -0.07513809204101562, -0.06722068786621094, -0.05930328369140625, -0.05138587951660156, -0.043468475341796875, -0.03555107116699219, -0.0276336669921875, -0.019716262817382812, -0.011798858642578125, -0.0038814544677734375, 0.00403594970703125, 0.011953353881835938, 0.019870758056640625, 0.027788162231445312, 0.03570556640625, 0.04362297058105469, 0.051540374755859375, 0.05945777893066406, 0.06737518310546875, 0.07529258728027344, 0.08320999145507812, 0.09112739562988281, 0.0990447998046875, 0.10696220397949219, 0.11487960815429688, 0.12279701232910156, 0.13071441650390625, 0.13863182067871094, 0.14654922485351562, 0.1544666290283203, 0.162384033203125, 0.1703014373779297, 0.17821884155273438, 0.18613624572753906, 0.19405364990234375, 0.20197105407714844, 0.20988845825195312, 0.2178058624267578, 0.2257232666015625, 0.2336406707763672, 0.24155807495117188, 0.24947547912597656, 0.25739288330078125, 0.26531028747558594, 0.2732276916503906, 0.2811450958251953, 0.2890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 15.0, 15.0, 19.0, 20.0, 21.0, 31.0, 29.0, 31.0, 40.0, 40.0, 49.0, 41.0, 49.0, 42.0, 52.0, 46.0, 39.0, 50.0, 30.0, 36.0, 27.0, 40.0, 33.0, 34.0, 27.0, 18.0, 13.0, 11.0, 12.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23513412475585938, -0.22734832763671875, -0.21956253051757812, -0.2117767333984375, -0.20399093627929688, -0.19620513916015625, -0.18841934204101562, -0.180633544921875, -0.17284774780273438, -0.16506195068359375, -0.15727615356445312, -0.1494903564453125, -0.14170455932617188, -0.13391876220703125, -0.12613296508789062, -0.11834716796875, -0.11056137084960938, -0.10277557373046875, -0.09498977661132812, -0.0872039794921875, -0.07941818237304688, -0.07163238525390625, -0.06384658813476562, -0.056060791015625, -0.048274993896484375, -0.04048919677734375, -0.032703399658203125, -0.0249176025390625, -0.017131805419921875, -0.00934600830078125, -0.001560211181640625, 0.0062255859375, 0.014011383056640625, 0.02179718017578125, 0.029582977294921875, 0.0373687744140625, 0.045154571533203125, 0.05294036865234375, 0.060726165771484375, 0.068511962890625, 0.07629776000976562, 0.08408355712890625, 0.09186935424804688, 0.0996551513671875, 0.10744094848632812, 0.11522674560546875, 0.12301254272460938, 0.13079833984375, 0.13858413696289062, 0.14636993408203125, 0.15415573120117188, 0.1619415283203125, 0.16972732543945312, 0.17751312255859375, 0.18529891967773438, 0.193084716796875, 0.20087051391601562, 0.20865631103515625, 0.21644210815429688, 0.2242279052734375, 0.23201370239257812, 0.23979949951171875, 0.24758529663085938, 0.25537109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 4.0, 14.0, 30.0, 40.0, 51.0, 116.0, 145.0, 393.0, 753.0, 2008.0, 7241.0, 71258.0, 848331.0, 105513.0, 8549.0, 2347.0, 897.0, 377.0, 204.0, 91.0, 79.0, 50.0, 14.0, 15.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2839851379394531, -0.27329254150390625, -0.2625999450683594, -0.2519073486328125, -0.24121475219726562, -0.23052215576171875, -0.21982955932617188, -0.209136962890625, -0.19844436645507812, -0.18775177001953125, -0.17705917358398438, -0.1663665771484375, -0.15567398071289062, -0.14498138427734375, -0.13428878784179688, -0.12359619140625, -0.11290359497070312, -0.10221099853515625, -0.09151840209960938, -0.0808258056640625, -0.07013320922851562, -0.05944061279296875, -0.048748016357421875, -0.038055419921875, -0.027362823486328125, -0.01667022705078125, -0.005977630615234375, 0.0047149658203125, 0.015407562255859375, 0.02610015869140625, 0.036792755126953125, 0.0474853515625, 0.058177947998046875, 0.06887054443359375, 0.07956314086914062, 0.0902557373046875, 0.10094833374023438, 0.11164093017578125, 0.12233352661132812, 0.133026123046875, 0.14371871948242188, 0.15441131591796875, 0.16510391235351562, 0.1757965087890625, 0.18648910522460938, 0.19718170166015625, 0.20787429809570312, 0.21856689453125, 0.22925949096679688, 0.23995208740234375, 0.2506446838378906, 0.2613372802734375, 0.2720298767089844, 0.28272247314453125, 0.2934150695800781, 0.304107666015625, 0.3148002624511719, 0.32549285888671875, 0.3361854553222656, 0.3468780517578125, 0.3575706481933594, 0.36826324462890625, 0.3789558410644531, 0.3896484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 14.0, 15.0, 32.0, 35.0, 27.0, 51.0, 47.0, 63.0, 75.0, 80.0, 96.0, 87.0, 68.0, 62.0, 52.0, 38.0, 42.0, 23.0, 18.0, 13.0, 8.0, 11.0, 7.0, 3.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.060434341430664e-05, -4.932191222906113e-05, -4.803948104381561e-05, -4.67570498585701e-05, -4.5474618673324585e-05, -4.419218748807907e-05, -4.290975630283356e-05, -4.162732511758804e-05, -4.034489393234253e-05, -3.9062462747097015e-05, -3.77800315618515e-05, -3.649760037660599e-05, -3.5215169191360474e-05, -3.393273800611496e-05, -3.2650306820869446e-05, -3.136787563562393e-05, -3.0085444450378418e-05, -2.8803013265132904e-05, -2.752058207988739e-05, -2.6238150894641876e-05, -2.4955719709396362e-05, -2.367328852415085e-05, -2.2390857338905334e-05, -2.110842615365982e-05, -1.9825994968414307e-05, -1.8543563783168793e-05, -1.726113259792328e-05, -1.5978701412677765e-05, -1.4696270227432251e-05, -1.3413839042186737e-05, -1.2131407856941223e-05, -1.084897667169571e-05, -9.566545486450195e-06, -8.284114301204681e-06, -7.0016831159591675e-06, -5.7192519307136536e-06, -4.43682074546814e-06, -3.1543895602226257e-06, -1.8719583749771118e-06, -5.895271897315979e-07, 6.92903995513916e-07, 1.97533518075943e-06, 3.257766366004944e-06, 4.540197551250458e-06, 5.822628736495972e-06, 7.105059921741486e-06, 8.387491106987e-06, 9.669922292232513e-06, 1.0952353477478027e-05, 1.2234784662723541e-05, 1.3517215847969055e-05, 1.4799647033214569e-05, 1.6082078218460083e-05, 1.7364509403705597e-05, 1.864694058895111e-05, 1.9929371774196625e-05, 2.121180295944214e-05, 2.2494234144687653e-05, 2.3776665329933167e-05, 2.505909651517868e-05, 2.6341527700424194e-05, 2.7623958885669708e-05, 2.8906390070915222e-05, 3.0188821256160736e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 9.0, 17.0, 24.0, 30.0, 31.0, 59.0, 77.0, 109.0, 170.0, 211.0, 322.0, 439.0, 705.0, 1216.0, 1959.0, 3881.0, 10919.0, 56263.0, 503543.0, 406065.0, 44109.0, 9611.0, 3729.0, 1842.0, 1075.0, 690.0, 445.0, 298.0, 195.0, 121.0, 98.0, 72.0, 41.0, 43.0, 28.0, 15.0, 16.0, 16.0, 11.0, 6.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2283935546875, -0.22124290466308594, -0.21409225463867188, -0.2069416046142578, -0.19979095458984375, -0.1926403045654297, -0.18548965454101562, -0.17833900451660156, -0.1711883544921875, -0.16403770446777344, -0.15688705444335938, -0.1497364044189453, -0.14258575439453125, -0.1354351043701172, -0.12828445434570312, -0.12113380432128906, -0.113983154296875, -0.10683250427246094, -0.09968185424804688, -0.09253120422363281, -0.08538055419921875, -0.07822990417480469, -0.07107925415039062, -0.06392860412597656, -0.0567779541015625, -0.04962730407714844, -0.042476654052734375, -0.03532600402832031, -0.02817535400390625, -0.021024703979492188, -0.013874053955078125, -0.0067234039306640625, 0.00042724609375, 0.0075778961181640625, 0.014728546142578125, 0.021879196166992188, 0.02902984619140625, 0.03618049621582031, 0.043331146240234375, 0.05048179626464844, 0.0576324462890625, 0.06478309631347656, 0.07193374633789062, 0.07908439636230469, 0.08623504638671875, 0.09338569641113281, 0.10053634643554688, 0.10768699645996094, 0.114837646484375, 0.12198829650878906, 0.12913894653320312, 0.1362895965576172, 0.14344024658203125, 0.1505908966064453, 0.15774154663085938, 0.16489219665527344, 0.1720428466796875, 0.17919349670410156, 0.18634414672851562, 0.1934947967529297, 0.20064544677734375, 0.2077960968017578, 0.21494674682617188, 0.22209739685058594, 0.229248046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 29.0, 30.0, 36.0, 55.0, 88.0, 106.0, 151.0, 134.0, 122.0, 68.0, 59.0, 33.0, 19.0, 18.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.16943931579589844, -0.16285324096679688, -0.1562671661376953, -0.14968109130859375, -0.1430950164794922, -0.13650894165039062, -0.12992286682128906, -0.1233367919921875, -0.11675071716308594, -0.11016464233398438, -0.10357856750488281, -0.09699249267578125, -0.09040641784667969, -0.08382034301757812, -0.07723426818847656, -0.070648193359375, -0.06406211853027344, -0.057476043701171875, -0.05088996887207031, -0.04430389404296875, -0.03771781921386719, -0.031131744384765625, -0.024545669555664062, -0.0179595947265625, -0.011373519897460938, -0.004787445068359375, 0.0017986297607421875, 0.00838470458984375, 0.014970779418945312, 0.021556854248046875, 0.028142929077148438, 0.03472900390625, 0.04131507873535156, 0.047901153564453125, 0.05448722839355469, 0.06107330322265625, 0.06765937805175781, 0.07424545288085938, 0.08083152770996094, 0.0874176025390625, 0.09400367736816406, 0.10058975219726562, 0.10717582702636719, 0.11376190185546875, 0.12034797668457031, 0.12693405151367188, 0.13352012634277344, 0.140106201171875, 0.14669227600097656, 0.15327835083007812, 0.1598644256591797, 0.16645050048828125, 0.1730365753173828, 0.17962265014648438, 0.18620872497558594, 0.1927947998046875, 0.19938087463378906, 0.20596694946289062, 0.2125530242919922, 0.21913909912109375, 0.2257251739501953, 0.23231124877929688, 0.23889732360839844, 0.2454833984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 43.0, 66.0, 169.0, 262.0, 242.0, 125.0, 50.0, 27.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.215538501739502, -3.074989080429077, -2.9344396591186523, -2.7938902378082275, -2.6533408164978027, -2.512791395187378, -2.372241973876953, -2.2316925525665283, -2.0911431312561035, -1.9505937099456787, -1.810044288635254, -1.669494867324829, -1.5289454460144043, -1.3883960247039795, -1.2478466033935547, -1.1072971820831299, -0.9667477607727051, -0.8261983394622803, -0.6856489181518555, -0.5450994968414307, -0.40455007553100586, -0.26400065422058105, -0.12345123291015625, 0.017098188400268555, 0.15764760971069336, 0.29819703102111816, 0.43874645233154297, 0.5792958736419678, 0.7198452949523926, 0.8603947162628174, 1.0009441375732422, 1.141493558883667, 1.28204345703125, 1.4225928783416748, 1.5631422996520996, 1.7036917209625244, 1.8442411422729492, 1.984790563583374, 2.125339984893799, 2.2658894062042236, 2.4064388275146484, 2.5469882488250732, 2.687537670135498, 2.828087091445923, 2.9686365127563477, 3.1091859340667725, 3.2497353553771973, 3.390284776687622, 3.530834197998047, 3.6713836193084717, 3.8119330406188965, 3.9524824619293213, 4.093031883239746, 4.23358154296875, 4.374130725860596, 4.514679908752441, 4.655229568481445, 4.795779228210449, 4.936328411102295, 5.076877593994141, 5.2174272537231445, 5.357976913452148, 5.498526096343994, 5.63907527923584, 5.779624938964844]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 10.0, 5.0, 6.0, 14.0, 13.0, 16.0, 11.0, 24.0, 28.0, 16.0, 21.0, 23.0, 19.0, 30.0, 34.0, 25.0, 26.0, 39.0, 34.0, 46.0, 40.0, 41.0, 40.0, 33.0, 37.0, 47.0, 38.0, 28.0, 31.0, 30.0, 30.0, 25.0, 14.0, 17.0, 13.0, 13.0, 8.0, 14.0, 10.0, 8.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0228466987609863, -0.9889925718307495, -0.9551385045051575, -0.9212844371795654, -0.8874303102493286, -0.8535761833190918, -0.8197221159934998, -0.7858680486679077, -0.7520139217376709, -0.7181597948074341, -0.684305727481842, -0.65045166015625, -0.6165975332260132, -0.5827434062957764, -0.5488893389701843, -0.5150352716445923, -0.48118114471435547, -0.44732704758644104, -0.4134729504585266, -0.3796188533306122, -0.34576475620269775, -0.3119106590747833, -0.2780565619468689, -0.24420246481895447, -0.21034836769104004, -0.1764942705631256, -0.14264017343521118, -0.10878607630729675, -0.07493197917938232, -0.041077882051467896, -0.007223784923553467, 0.026630312204360962, 0.06048452854156494, 0.09433862566947937, 0.1281927227973938, 0.16204681992530823, 0.19590091705322266, 0.22975501418113708, 0.2636091113090515, 0.29746320843696594, 0.33131730556488037, 0.3651714026927948, 0.39902549982070923, 0.43287959694862366, 0.4667336940765381, 0.5005878210067749, 0.5344418883323669, 0.568295955657959, 0.6021500825881958, 0.6360042095184326, 0.6698582768440247, 0.7037123441696167, 0.7375664710998535, 0.7714205980300903, 0.8052746653556824, 0.8391287326812744, 0.8729828596115112, 0.906836986541748, 0.9406910538673401, 0.9745451211929321, 1.008399248123169, 1.0422533750534058, 1.0761075019836426, 1.1099615097045898, 1.1438156366348267]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 20.0, 20.0, 23.0, 32.0, 30.0, 59.0, 69.0, 90.0, 115.0, 173.0, 214.0, 289.0, 452.0, 635.0, 1102.0, 2431.0, 6842.0, 32377.0, 4075820.0, 57591.0, 9001.0, 3015.0, 1366.0, 734.0, 467.0, 336.0, 224.0, 172.0, 140.0, 103.0, 63.0, 54.0, 49.0, 38.0, 28.0, 12.0, 12.0, 12.0, 12.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.482421875, -0.4671630859375, -0.451904296875, -0.4366455078125, -0.42138671875, -0.4061279296875, -0.390869140625, -0.3756103515625, -0.3603515625, -0.3450927734375, -0.329833984375, -0.3145751953125, -0.29931640625, -0.2840576171875, -0.268798828125, -0.2535400390625, -0.23828125, -0.2230224609375, -0.207763671875, -0.1925048828125, -0.17724609375, -0.1619873046875, -0.146728515625, -0.1314697265625, -0.1162109375, -0.1009521484375, -0.085693359375, -0.0704345703125, -0.05517578125, -0.0399169921875, -0.024658203125, -0.0093994140625, 0.005859375, 0.0211181640625, 0.036376953125, 0.0516357421875, 0.06689453125, 0.0821533203125, 0.097412109375, 0.1126708984375, 0.1279296875, 0.1431884765625, 0.158447265625, 0.1737060546875, 0.18896484375, 0.2042236328125, 0.219482421875, 0.2347412109375, 0.25, 0.2652587890625, 0.280517578125, 0.2957763671875, 0.31103515625, 0.3262939453125, 0.341552734375, 0.3568115234375, 0.3720703125, 0.3873291015625, 0.402587890625, 0.4178466796875, 0.43310546875, 0.4483642578125, 0.463623046875, 0.4788818359375, 0.494140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 8.0, 13.0, 12.0, 23.0, 16.0, 22.0, 32.0, 41.0, 50.0, 48.0, 39.0, 55.0, 57.0, 69.0, 55.0, 47.0, 52.0, 53.0, 47.0, 40.0, 26.0, 37.0, 35.0, 16.0, 13.0, 18.0, 16.0, 13.0, 12.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.0563507080078125, -0.054351806640625, -0.0523529052734375, -0.05035400390625, -0.0483551025390625, -0.046356201171875, -0.0443572998046875, -0.0423583984375, -0.0403594970703125, -0.038360595703125, -0.0363616943359375, -0.03436279296875, -0.0323638916015625, -0.030364990234375, -0.0283660888671875, -0.0263671875, -0.0243682861328125, -0.022369384765625, -0.0203704833984375, -0.01837158203125, -0.0163726806640625, -0.014373779296875, -0.0123748779296875, -0.0103759765625, -0.0083770751953125, -0.006378173828125, -0.0043792724609375, -0.00238037109375, -0.0003814697265625, 0.001617431640625, 0.0036163330078125, 0.005615234375, 0.0076141357421875, 0.009613037109375, 0.0116119384765625, 0.01361083984375, 0.0156097412109375, 0.017608642578125, 0.0196075439453125, 0.0216064453125, 0.0236053466796875, 0.025604248046875, 0.0276031494140625, 0.02960205078125, 0.0316009521484375, 0.033599853515625, 0.0355987548828125, 0.03759765625, 0.0395965576171875, 0.041595458984375, 0.0435943603515625, 0.04559326171875, 0.0475921630859375, 0.049591064453125, 0.0515899658203125, 0.0535888671875, 0.0555877685546875, 0.057586669921875, 0.0595855712890625, 0.06158447265625, 0.0635833740234375, 0.065582275390625, 0.0675811767578125, 0.069580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 10.0, 12.0, 12.0, 15.0, 19.0, 24.0, 34.0, 39.0, 52.0, 66.0, 76.0, 131.0, 162.0, 248.0, 382.0, 707.0, 1570.0, 4907.0, 33642.0, 4114129.0, 29877.0, 4634.0, 1429.0, 720.0, 407.0, 265.0, 172.0, 113.0, 109.0, 72.0, 53.0, 37.0, 35.0, 22.0, 24.0, 15.0, 10.0, 15.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.82904052734375, -0.7977294921875, -0.76641845703125, -0.735107421875, -0.70379638671875, -0.6724853515625, -0.64117431640625, -0.60986328125, -0.57855224609375, -0.5472412109375, -0.51593017578125, -0.484619140625, -0.45330810546875, -0.4219970703125, -0.39068603515625, -0.359375, -0.32806396484375, -0.2967529296875, -0.26544189453125, -0.234130859375, -0.20281982421875, -0.1715087890625, -0.14019775390625, -0.10888671875, -0.07757568359375, -0.0462646484375, -0.01495361328125, 0.016357421875, 0.04766845703125, 0.0789794921875, 0.11029052734375, 0.1416015625, 0.17291259765625, 0.2042236328125, 0.23553466796875, 0.266845703125, 0.29815673828125, 0.3294677734375, 0.36077880859375, 0.39208984375, 0.42340087890625, 0.4547119140625, 0.48602294921875, 0.517333984375, 0.54864501953125, 0.5799560546875, 0.61126708984375, 0.642578125, 0.67388916015625, 0.7052001953125, 0.73651123046875, 0.767822265625, 0.79913330078125, 0.8304443359375, 0.86175537109375, 0.89306640625, 0.92437744140625, 0.9556884765625, 0.98699951171875, 1.018310546875, 1.04962158203125, 1.0809326171875, 1.11224365234375, 1.1435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 14.0, 20.0, 57.0, 383.0, 3450.0, 81.0, 29.0, 15.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.07790851593017578, -0.07238197326660156, -0.06685543060302734, -0.061328887939453125, -0.055802345275878906, -0.05027580261230469, -0.04474925994873047, -0.03922271728515625, -0.03369617462158203, -0.028169631958007812, -0.022643089294433594, -0.017116546630859375, -0.011590003967285156, -0.0060634613037109375, -0.0005369186401367188, 0.0049896240234375, 0.010516166687011719, 0.016042709350585938, 0.021569252014160156, 0.027095794677734375, 0.032622337341308594, 0.03814888000488281, 0.04367542266845703, 0.04920196533203125, 0.05472850799560547, 0.06025505065917969, 0.0657815933227539, 0.07130813598632812, 0.07683467864990234, 0.08236122131347656, 0.08788776397705078, 0.093414306640625, 0.09894084930419922, 0.10446739196777344, 0.10999393463134766, 0.11552047729492188, 0.1210470199584961, 0.1265735626220703, 0.13210010528564453, 0.13762664794921875, 0.14315319061279297, 0.1486797332763672, 0.1542062759399414, 0.15973281860351562, 0.16525936126708984, 0.17078590393066406, 0.17631244659423828, 0.1818389892578125, 0.18736553192138672, 0.19289207458496094, 0.19841861724853516, 0.20394515991210938, 0.2094717025756836, 0.2149982452392578, 0.22052478790283203, 0.22605133056640625, 0.23157787322998047, 0.2371044158935547, 0.2426309585571289, 0.24815750122070312, 0.25368404388427734, 0.25921058654785156, 0.2647371292114258, 0.270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 23.0, 35.0, 60.0, 93.0, 115.0, 142.0, 145.0, 100.0, 74.0, 47.0, 39.0, 31.0, 19.0, 12.0, 13.0, 10.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5047615766525269, -0.4841006398200989, -0.4634397327899933, -0.4427787959575653, -0.42211785912513733, -0.40145695209503174, -0.38079601526260376, -0.3601350784301758, -0.3394741415977478, -0.3188132047653198, -0.29815229773521423, -0.27749136090278625, -0.2568304240703583, -0.2361695021390915, -0.2155085802078247, -0.19484764337539673, -0.17418673634529114, -0.15352581441402435, -0.13286487758159637, -0.11220395565032959, -0.09154302626848221, -0.07088209688663483, -0.05022117495536804, -0.029560238122940063, -0.008899316191673279, 0.011761611327528954, 0.032422538846731186, 0.05308346450328827, 0.07374439388513565, 0.09440532326698303, 0.11506624519824982, 0.1357271820306778, 0.15638810396194458, 0.17704902589321136, 0.19770996272563934, 0.21837088465690613, 0.2390318214893341, 0.2596927285194397, 0.2803536653518677, 0.30101460218429565, 0.32167553901672363, 0.3423364758491516, 0.3629973828792572, 0.3836583197116852, 0.40431925654411316, 0.42498016357421875, 0.44564110040664673, 0.4663020372390747, 0.4869629442691803, 0.5076238512992859, 0.5282847881317139, 0.5489457249641418, 0.5696066617965698, 0.5902675986289978, 0.6109285354614258, 0.631589412689209, 0.652250349521637, 0.6729112863540649, 0.6935722231864929, 0.7142331600189209, 0.7348940372467041, 0.7555549740791321, 0.7762159109115601, 0.796876847743988, 0.817537784576416]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 11.0, 10.0, 11.0, 14.0, 15.0, 15.0, 20.0, 24.0, 23.0, 13.0, 25.0, 35.0, 23.0, 39.0, 28.0, 34.0, 35.0, 48.0, 37.0, 31.0, 37.0, 35.0, 25.0, 33.0, 28.0, 33.0, 30.0, 19.0, 26.0, 30.0, 24.0, 25.0, 26.0, 24.0, 16.0, 15.0, 19.0, 12.0, 9.0, 9.0, 8.0, 7.0, 3.0, 3.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26647669076919556, -0.2576553225517273, -0.24883392453193665, -0.2400125414133072, -0.23119115829467773, -0.22236977517604828, -0.21354839205741882, -0.20472700893878937, -0.1959056258201599, -0.18708424270153046, -0.178262859582901, -0.16944147646427155, -0.1606200933456421, -0.15179871022701263, -0.14297732710838318, -0.13415594398975372, -0.12533456087112427, -0.11651317775249481, -0.10769179463386536, -0.0988704115152359, -0.09004902839660645, -0.08122764527797699, -0.07240626215934753, -0.06358487904071808, -0.05476349592208862, -0.04594211280345917, -0.03712072968482971, -0.028299346566200256, -0.0194779634475708, -0.010656580328941345, -0.0018351972103118896, 0.006986185908317566, 0.01580756902694702, 0.024628952145576477, 0.03345033526420593, 0.04227171838283539, 0.051093101501464844, 0.0599144846200943, 0.06873586773872375, 0.07755725085735321, 0.08637863397598267, 0.09520001709461212, 0.10402140021324158, 0.11284278333187103, 0.12166416645050049, 0.13048554956912994, 0.1393069326877594, 0.14812831580638885, 0.1569496989250183, 0.16577108204364777, 0.17459246516227722, 0.18341384828090668, 0.19223523139953613, 0.2010566145181656, 0.20987799763679504, 0.2186993807554245, 0.22752076387405396, 0.2363421469926834, 0.24516353011131287, 0.2539849281311035, 0.2628062963485718, 0.27162766456604004, 0.2804490625858307, 0.28927046060562134, 0.2980918288230896]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 6.0, 10.0, 14.0, 16.0, 18.0, 34.0, 41.0, 43.0, 63.0, 101.0, 154.0, 169.0, 218.0, 302.0, 422.0, 567.0, 792.0, 1166.0, 1913.0, 3396.0, 6975.0, 17413.0, 51179.0, 174831.0, 428342.0, 245726.0, 71790.0, 23090.0, 8846.0, 4049.0, 2272.0, 1308.0, 897.0, 634.0, 432.0, 322.0, 266.0, 196.0, 144.0, 91.0, 67.0, 55.0, 44.0, 33.0, 30.0, 18.0, 15.0, 14.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.24755859375, -0.23947906494140625, -0.2313995361328125, -0.22332000732421875, -0.215240478515625, -0.20716094970703125, -0.1990814208984375, -0.19100189208984375, -0.18292236328125, -0.17484283447265625, -0.1667633056640625, -0.15868377685546875, -0.150604248046875, -0.14252471923828125, -0.1344451904296875, -0.12636566162109375, -0.1182861328125, -0.11020660400390625, -0.1021270751953125, -0.09404754638671875, -0.085968017578125, -0.07788848876953125, -0.0698089599609375, -0.06172943115234375, -0.05364990234375, -0.04557037353515625, -0.0374908447265625, -0.02941131591796875, -0.021331787109375, -0.01325225830078125, -0.0051727294921875, 0.00290679931640625, 0.010986328125, 0.01906585693359375, 0.0271453857421875, 0.03522491455078125, 0.043304443359375, 0.05138397216796875, 0.0594635009765625, 0.06754302978515625, 0.07562255859375, 0.08370208740234375, 0.0917816162109375, 0.09986114501953125, 0.107940673828125, 0.11602020263671875, 0.1240997314453125, 0.13217926025390625, 0.1402587890625, 0.14833831787109375, 0.1564178466796875, 0.16449737548828125, 0.172576904296875, 0.18065643310546875, 0.1887359619140625, 0.19681549072265625, 0.20489501953125, 0.21297454833984375, 0.2210540771484375, 0.22913360595703125, 0.237213134765625, 0.24529266357421875, 0.2533721923828125, 0.26145172119140625, 0.26953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 1.0, 4.0, 10.0, 13.0, 7.0, 8.0, 16.0, 19.0, 24.0, 21.0, 26.0, 29.0, 41.0, 29.0, 52.0, 50.0, 59.0, 49.0, 56.0, 53.0, 46.0, 35.0, 48.0, 41.0, 37.0, 40.0, 39.0, 15.0, 29.0, 21.0, 13.0, 11.0, 11.0, 13.0, 5.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06689453125, -0.06449222564697266, -0.06208992004394531, -0.05968761444091797, -0.057285308837890625, -0.05488300323486328, -0.05248069763183594, -0.050078392028808594, -0.04767608642578125, -0.045273780822753906, -0.04287147521972656, -0.04046916961669922, -0.038066864013671875, -0.03566455841064453, -0.03326225280761719, -0.030859947204589844, -0.0284576416015625, -0.026055335998535156, -0.023653030395507812, -0.02125072479248047, -0.018848419189453125, -0.01644611358642578, -0.014043807983398438, -0.011641502380371094, -0.00923919677734375, -0.006836891174316406, -0.0044345855712890625, -0.0020322799682617188, 0.000370025634765625, 0.0027723312377929688, 0.0051746368408203125, 0.007576942443847656, 0.009979248046875, 0.012381553649902344, 0.014783859252929688, 0.01718616485595703, 0.019588470458984375, 0.02199077606201172, 0.024393081665039062, 0.026795387268066406, 0.02919769287109375, 0.031599998474121094, 0.03400230407714844, 0.03640460968017578, 0.038806915283203125, 0.04120922088623047, 0.04361152648925781, 0.046013832092285156, 0.0484161376953125, 0.050818443298339844, 0.05322074890136719, 0.05562305450439453, 0.058025360107421875, 0.06042766571044922, 0.06282997131347656, 0.0652322769165039, 0.06763458251953125, 0.0700368881225586, 0.07243919372558594, 0.07484149932861328, 0.07724380493164062, 0.07964611053466797, 0.08204841613769531, 0.08445072174072266, 0.08685302734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 9.0, 10.0, 18.0, 30.0, 33.0, 61.0, 77.0, 114.0, 157.0, 241.0, 387.0, 667.0, 1085.0, 2051.0, 4188.0, 10835.0, 42503.0, 293717.0, 577867.0, 84894.0, 17471.0, 5859.0, 2651.0, 1446.0, 779.0, 467.0, 276.0, 183.0, 134.0, 92.0, 83.0, 50.0, 33.0, 24.0, 11.0, 8.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.348388671875, -0.336456298828125, -0.32452392578125, -0.312591552734375, -0.3006591796875, -0.288726806640625, -0.27679443359375, -0.264862060546875, -0.2529296875, -0.240997314453125, -0.22906494140625, -0.217132568359375, -0.2052001953125, -0.193267822265625, -0.18133544921875, -0.169403076171875, -0.157470703125, -0.145538330078125, -0.13360595703125, -0.121673583984375, -0.1097412109375, -0.097808837890625, -0.08587646484375, -0.073944091796875, -0.06201171875, -0.050079345703125, -0.03814697265625, -0.026214599609375, -0.0142822265625, -0.002349853515625, 0.00958251953125, 0.021514892578125, 0.033447265625, 0.045379638671875, 0.05731201171875, 0.069244384765625, 0.0811767578125, 0.093109130859375, 0.10504150390625, 0.116973876953125, 0.12890625, 0.140838623046875, 0.15277099609375, 0.164703369140625, 0.1766357421875, 0.188568115234375, 0.20050048828125, 0.212432861328125, 0.224365234375, 0.236297607421875, 0.24822998046875, 0.260162353515625, 0.2720947265625, 0.284027099609375, 0.29595947265625, 0.307891845703125, 0.31982421875, 0.331756591796875, 0.34368896484375, 0.355621337890625, 0.3675537109375, 0.379486083984375, 0.39141845703125, 0.403350830078125, 0.415283203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 1.0, 8.0, 11.0, 10.0, 11.0, 18.0, 22.0, 14.0, 33.0, 36.0, 36.0, 41.0, 49.0, 43.0, 43.0, 45.0, 46.0, 58.0, 56.0, 44.0, 49.0, 52.0, 49.0, 26.0, 39.0, 36.0, 23.0, 22.0, 12.0, 14.0, 8.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40478515625, -0.3912239074707031, -0.37766265869140625, -0.3641014099121094, -0.3505401611328125, -0.3369789123535156, -0.32341766357421875, -0.3098564147949219, -0.296295166015625, -0.2827339172363281, -0.26917266845703125, -0.2556114196777344, -0.2420501708984375, -0.22848892211914062, -0.21492767333984375, -0.20136642456054688, -0.18780517578125, -0.17424392700195312, -0.16068267822265625, -0.14712142944335938, -0.1335601806640625, -0.11999893188476562, -0.10643768310546875, -0.09287643432617188, -0.079315185546875, -0.06575393676757812, -0.05219268798828125, -0.038631439208984375, -0.0250701904296875, -0.011508941650390625, 0.00205230712890625, 0.015613555908203125, 0.0291748046875, 0.042736053466796875, 0.05629730224609375, 0.06985855102539062, 0.0834197998046875, 0.09698104858398438, 0.11054229736328125, 0.12410354614257812, 0.137664794921875, 0.15122604370117188, 0.16478729248046875, 0.17834854125976562, 0.1919097900390625, 0.20547103881835938, 0.21903228759765625, 0.23259353637695312, 0.24615478515625, 0.2597160339355469, 0.27327728271484375, 0.2868385314941406, 0.3003997802734375, 0.3139610290527344, 0.32752227783203125, 0.3410835266113281, 0.354644775390625, 0.3682060241699219, 0.38176727294921875, 0.3953285217285156, 0.4088897705078125, 0.4224510192871094, 0.43601226806640625, 0.4495735168457031, 0.463134765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 11.0, 22.0, 23.0, 35.0, 51.0, 79.0, 111.0, 188.0, 320.0, 589.0, 1358.0, 3203.0, 11584.0, 122810.0, 836472.0, 58445.0, 8056.0, 2714.0, 1123.0, 533.0, 319.0, 152.0, 92.0, 81.0, 41.0, 26.0, 18.0, 18.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3408203125, -0.3302955627441406, -0.31977081298828125, -0.3092460632324219, -0.2987213134765625, -0.2881965637207031, -0.27767181396484375, -0.2671470642089844, -0.256622314453125, -0.24609756469726562, -0.23557281494140625, -0.22504806518554688, -0.2145233154296875, -0.20399856567382812, -0.19347381591796875, -0.18294906616210938, -0.17242431640625, -0.16189956665039062, -0.15137481689453125, -0.14085006713867188, -0.1303253173828125, -0.11980056762695312, -0.10927581787109375, -0.09875106811523438, -0.088226318359375, -0.07770156860351562, -0.06717681884765625, -0.056652069091796875, -0.0461273193359375, -0.035602569580078125, -0.02507781982421875, -0.014553070068359375, -0.0040283203125, 0.006496429443359375, 0.01702117919921875, 0.027545928955078125, 0.0380706787109375, 0.048595428466796875, 0.05912017822265625, 0.06964492797851562, 0.080169677734375, 0.09069442749023438, 0.10121917724609375, 0.11174392700195312, 0.1222686767578125, 0.13279342651367188, 0.14331817626953125, 0.15384292602539062, 0.16436767578125, 0.17489242553710938, 0.18541717529296875, 0.19594192504882812, 0.2064666748046875, 0.21699142456054688, 0.22751617431640625, 0.23804092407226562, 0.248565673828125, 0.2590904235839844, 0.26961517333984375, 0.2801399230957031, 0.2906646728515625, 0.3011894226074219, 0.31171417236328125, 0.3222389221191406, 0.332763671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 21.0, 46.0, 73.0, 135.0, 167.0, 187.0, 135.0, 102.0, 59.0, 28.0, 24.0, 15.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012093782424926758, -0.00011814013123512268, -0.00011534243822097778, -0.00011254474520683289, -0.00010974705219268799, -0.00010694935917854309, -0.0001041516661643982, -0.0001013539731502533, -9.85562801361084e-05, -9.57585871219635e-05, -9.29608941078186e-05, -9.01632010936737e-05, -8.736550807952881e-05, -8.456781506538391e-05, -8.177012205123901e-05, -7.897242903709412e-05, -7.617473602294922e-05, -7.337704300880432e-05, -7.057934999465942e-05, -6.778165698051453e-05, -6.498396396636963e-05, -6.218627095222473e-05, -5.9388577938079834e-05, -5.6590884923934937e-05, -5.379319190979004e-05, -5.099549889564514e-05, -4.8197805881500244e-05, -4.540011286735535e-05, -4.260241985321045e-05, -3.980472683906555e-05, -3.7007033824920654e-05, -3.420934081077576e-05, -3.141164779663086e-05, -2.8613954782485962e-05, -2.5816261768341064e-05, -2.3018568754196167e-05, -2.022087574005127e-05, -1.7423182725906372e-05, -1.4625489711761475e-05, -1.1827796697616577e-05, -9.03010368347168e-06, -6.232410669326782e-06, -3.4347176551818848e-06, -6.370246410369873e-07, 2.16066837310791e-06, 4.958361387252808e-06, 7.756054401397705e-06, 1.0553747415542603e-05, 1.33514404296875e-05, 1.6149133443832397e-05, 1.8946826457977295e-05, 2.1744519472122192e-05, 2.454221248626709e-05, 2.7339905500411987e-05, 3.0137598514556885e-05, 3.293529152870178e-05, 3.573298454284668e-05, 3.853067755699158e-05, 4.1328370571136475e-05, 4.412606358528137e-05, 4.692375659942627e-05, 4.972144961357117e-05, 5.2519142627716064e-05, 5.531683564186096e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 15.0, 11.0, 27.0, 26.0, 45.0, 71.0, 108.0, 178.0, 407.0, 860.0, 2465.0, 10992.0, 242324.0, 764658.0, 20549.0, 3617.0, 1136.0, 489.0, 223.0, 140.0, 72.0, 47.0, 26.0, 24.0, 7.0, 12.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.387451171875, -0.3726387023925781, -0.35782623291015625, -0.3430137634277344, -0.3282012939453125, -0.3133888244628906, -0.29857635498046875, -0.2837638854980469, -0.268951416015625, -0.2541389465332031, -0.23932647705078125, -0.22451400756835938, -0.2097015380859375, -0.19488906860351562, -0.18007659912109375, -0.16526412963867188, -0.15045166015625, -0.13563919067382812, -0.12082672119140625, -0.10601425170898438, -0.0912017822265625, -0.07638931274414062, -0.06157684326171875, -0.046764373779296875, -0.031951904296875, -0.017139434814453125, -0.00232696533203125, 0.012485504150390625, 0.0272979736328125, 0.042110443115234375, 0.05692291259765625, 0.07173538208007812, 0.0865478515625, 0.10136032104492188, 0.11617279052734375, 0.13098526000976562, 0.1457977294921875, 0.16061019897460938, 0.17542266845703125, 0.19023513793945312, 0.205047607421875, 0.21986007690429688, 0.23467254638671875, 0.24948501586914062, 0.2642974853515625, 0.2791099548339844, 0.29392242431640625, 0.3087348937988281, 0.32354736328125, 0.3383598327636719, 0.35317230224609375, 0.3679847717285156, 0.3827972412109375, 0.3976097106933594, 0.41242218017578125, 0.4272346496582031, 0.442047119140625, 0.4568595886230469, 0.47167205810546875, 0.4864845275878906, 0.5012969970703125, 0.5161094665527344, 0.5309219360351562, 0.5457344055175781, 0.560546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 14.0, 23.0, 46.0, 84.0, 149.0, 171.0, 201.0, 129.0, 69.0, 30.0, 17.0, 12.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2186279296875, -0.2075939178466797, -0.19655990600585938, -0.18552589416503906, -0.17449188232421875, -0.16345787048339844, -0.15242385864257812, -0.1413898468017578, -0.1303558349609375, -0.11932182312011719, -0.10828781127929688, -0.09725379943847656, -0.08621978759765625, -0.07518577575683594, -0.06415176391601562, -0.05311775207519531, -0.042083740234375, -0.031049728393554688, -0.020015716552734375, -0.008981704711914062, 0.00205230712890625, 0.013086318969726562, 0.024120330810546875, 0.03515434265136719, 0.0461883544921875, 0.05722236633300781, 0.06825637817382812, 0.07929039001464844, 0.09032440185546875, 0.10135841369628906, 0.11239242553710938, 0.12342643737792969, 0.13446044921875, 0.1454944610595703, 0.15652847290039062, 0.16756248474121094, 0.17859649658203125, 0.18963050842285156, 0.20066452026367188, 0.2116985321044922, 0.2227325439453125, 0.2337665557861328, 0.24480056762695312, 0.25583457946777344, 0.26686859130859375, 0.27790260314941406, 0.2889366149902344, 0.2999706268310547, 0.311004638671875, 0.3220386505126953, 0.3330726623535156, 0.34410667419433594, 0.35514068603515625, 0.36617469787597656, 0.3772087097167969, 0.3882427215576172, 0.3992767333984375, 0.4103107452392578, 0.4213447570800781, 0.43237876892089844, 0.44341278076171875, 0.45444679260253906, 0.4654808044433594, 0.4765148162841797, 0.487548828125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 7.0, 20.0, 32.0, 62.0, 104.0, 171.0, 180.0, 150.0, 116.0, 49.0, 51.0, 21.0, 17.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.660822868347168, -6.519661903381348, -6.3785014152526855, -6.237340927124023, -6.096179962158203, -5.955018997192383, -5.813858509063721, -5.672698020935059, -5.531537055969238, -5.390376091003418, -5.249215602874756, -5.108055114746094, -4.966894149780273, -4.825733184814453, -4.684572696685791, -4.543412208557129, -4.402251243591309, -4.261090278625488, -4.119929790496826, -3.978769063949585, -3.8376083374023438, -3.6964476108551025, -3.5552868843078613, -3.41412615776062, -3.272965431213379, -3.1318047046661377, -2.9906439781188965, -2.8494832515716553, -2.708322525024414, -2.567161798477173, -2.4260010719299316, -2.2848403453826904, -2.143679141998291, -2.00251841545105, -1.8613576889038086, -1.7201969623565674, -1.5790362358093262, -1.437875509262085, -1.2967147827148438, -1.1555540561676025, -1.0143933296203613, -0.8732326030731201, -0.7320718765258789, -0.5909111499786377, -0.4497504234313965, -0.3085896968841553, -0.16742897033691406, -0.02626824378967285, 0.11489248275756836, 0.25605320930480957, 0.3972139358520508, 0.538374662399292, 0.6795353889465332, 0.8206961154937744, 0.9618568420410156, 1.1030175685882568, 1.244178295135498, 1.3853390216827393, 1.5264997482299805, 1.6676604747772217, 1.808821201324463, 1.949981927871704, 2.0911426544189453, 2.2323033809661865, 2.3734641075134277]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 18.0, 8.0, 17.0, 19.0, 33.0, 47.0, 35.0, 31.0, 40.0, 52.0, 58.0, 54.0, 58.0, 64.0, 55.0, 48.0, 51.0, 42.0, 32.0, 30.0, 30.0, 29.0, 18.0, 18.0, 25.0, 10.0, 9.0, 4.0, 5.0, 4.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7773356437683105, -2.6994147300720215, -2.6214938163757324, -2.5435729026794434, -2.4656519889831543, -2.3877310752868652, -2.309810161590576, -2.231889247894287, -2.153968334197998, -2.076047420501709, -1.99812650680542, -1.9202055931091309, -1.8422846794128418, -1.7643637657165527, -1.6864429712295532, -1.6085220575332642, -1.5306012630462646, -1.4526803493499756, -1.3747594356536865, -1.2968385219573975, -1.2189176082611084, -1.1409966945648193, -1.0630759000778198, -0.9851549863815308, -0.9072340726852417, -0.8293131589889526, -0.7513922452926636, -0.6734713912010193, -0.5955504775047302, -0.5176295638084412, -0.4397086799144745, -0.3617877960205078, -0.28386712074279785, -0.20594622194766998, -0.12802532315254211, -0.050104424357414246, 0.027816474437713623, 0.10573738813400269, 0.18365827202796936, 0.26157915592193604, 0.3395000696182251, 0.41742098331451416, 0.49534186720848083, 0.5732627511024475, 0.6511836647987366, 0.7291045784950256, 0.8070254325866699, 0.884946346282959, 0.962867259979248, 1.040788173675537, 1.1187090873718262, 1.1966300010681152, 1.2745509147644043, 1.3524718284606934, 1.4303926229476929, 1.508313536643982, 1.586234450340271, 1.66415536403656, 1.7420762777328491, 1.8199971914291382, 1.8979179859161377, 1.9758388996124268, 2.053759813308716, 2.131680727005005, 2.209601640701294]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 4.0, 12.0, 14.0, 27.0, 30.0, 39.0, 51.0, 85.0, 146.0, 232.0, 564.0, 1616.0, 7209.0, 156395.0, 4014860.0, 9607.0, 2000.0, 636.0, 274.0, 157.0, 101.0, 47.0, 40.0, 36.0, 25.0, 13.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7444839477539062, -0.7179718017578125, -0.6914596557617188, -0.664947509765625, -0.6384353637695312, -0.6119232177734375, -0.5854110717773438, -0.55889892578125, -0.5323867797851562, -0.5058746337890625, -0.47936248779296875, -0.452850341796875, -0.42633819580078125, -0.3998260498046875, -0.37331390380859375, -0.3468017578125, -0.32028961181640625, -0.2937774658203125, -0.26726531982421875, -0.240753173828125, -0.21424102783203125, -0.1877288818359375, -0.16121673583984375, -0.13470458984375, -0.10819244384765625, -0.0816802978515625, -0.05516815185546875, -0.028656005859375, -0.00214385986328125, 0.0243682861328125, 0.05088043212890625, 0.077392578125, 0.10390472412109375, 0.1304168701171875, 0.15692901611328125, 0.183441162109375, 0.20995330810546875, 0.2364654541015625, 0.26297760009765625, 0.28948974609375, 0.31600189208984375, 0.3425140380859375, 0.36902618408203125, 0.395538330078125, 0.42205047607421875, 0.4485626220703125, 0.47507476806640625, 0.5015869140625, 0.5280990600585938, 0.5546112060546875, 0.5811233520507812, 0.607635498046875, 0.6341476440429688, 0.6606597900390625, 0.6871719360351562, 0.71368408203125, 0.7401962280273438, 0.7667083740234375, 0.7932205200195312, 0.819732666015625, 0.8462448120117188, 0.8727569580078125, 0.8992691040039062, 0.92578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 0.0, 10.0, 14.0, 10.0, 31.0, 31.0, 57.0, 61.0, 56.0, 77.0, 77.0, 88.0, 68.0, 76.0, 72.0, 56.0, 47.0, 53.0, 33.0, 25.0, 15.0, 8.0, 7.0, 9.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.10405254364013672, -0.10001182556152344, -0.09597110748291016, -0.09193038940429688, -0.0878896713256836, -0.08384895324707031, -0.07980823516845703, -0.07576751708984375, -0.07172679901123047, -0.06768608093261719, -0.0636453628540039, -0.059604644775390625, -0.055563926696777344, -0.05152320861816406, -0.04748249053955078, -0.0434417724609375, -0.03940105438232422, -0.03536033630371094, -0.031319618225097656, -0.027278900146484375, -0.023238182067871094, -0.019197463989257812, -0.015156745910644531, -0.01111602783203125, -0.007075309753417969, -0.0030345916748046875, 0.0010061264038085938, 0.005046844482421875, 0.009087562561035156, 0.013128280639648438, 0.01716899871826172, 0.021209716796875, 0.02525043487548828, 0.029291152954101562, 0.033331871032714844, 0.037372589111328125, 0.041413307189941406, 0.04545402526855469, 0.04949474334716797, 0.05353546142578125, 0.05757617950439453, 0.06161689758300781, 0.0656576156616211, 0.06969833374023438, 0.07373905181884766, 0.07777976989746094, 0.08182048797607422, 0.0858612060546875, 0.08990192413330078, 0.09394264221191406, 0.09798336029052734, 0.10202407836914062, 0.1060647964477539, 0.11010551452636719, 0.11414623260498047, 0.11818695068359375, 0.12222766876220703, 0.1262683868408203, 0.1303091049194336, 0.13434982299804688, 0.13839054107666016, 0.14243125915527344, 0.14647197723388672, 0.1505126953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 10.0, 5.0, 12.0, 9.0, 18.0, 17.0, 21.0, 33.0, 41.0, 49.0, 57.0, 69.0, 109.0, 222.0, 658.0, 3168.0, 57981.0, 4121619.0, 8057.0, 1211.0, 366.0, 149.0, 96.0, 57.0, 40.0, 35.0, 33.0, 22.0, 23.0, 18.0, 14.0, 13.0, 5.0, 8.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.811676025390625, -1.75714111328125, -1.702606201171875, -1.6480712890625, -1.593536376953125, -1.53900146484375, -1.484466552734375, -1.429931640625, -1.375396728515625, -1.32086181640625, -1.266326904296875, -1.2117919921875, -1.157257080078125, -1.10272216796875, -1.048187255859375, -0.99365234375, -0.939117431640625, -0.88458251953125, -0.830047607421875, -0.7755126953125, -0.720977783203125, -0.66644287109375, -0.611907958984375, -0.557373046875, -0.502838134765625, -0.44830322265625, -0.393768310546875, -0.3392333984375, -0.284698486328125, -0.23016357421875, -0.175628662109375, -0.12109375, -0.066558837890625, -0.01202392578125, 0.042510986328125, 0.0970458984375, 0.151580810546875, 0.20611572265625, 0.260650634765625, 0.315185546875, 0.369720458984375, 0.42425537109375, 0.478790283203125, 0.5333251953125, 0.587860107421875, 0.64239501953125, 0.696929931640625, 0.75146484375, 0.805999755859375, 0.86053466796875, 0.915069580078125, 0.9696044921875, 1.024139404296875, 1.07867431640625, 1.133209228515625, 1.187744140625, 1.242279052734375, 1.29681396484375, 1.351348876953125, 1.4058837890625, 1.460418701171875, 1.51495361328125, 1.569488525390625, 1.6240234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 14.0, 29.0, 119.0, 3786.0, 94.0, 20.0, 9.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.17484474182128906, -0.16279983520507812, -0.1507549285888672, -0.13871002197265625, -0.1266651153564453, -0.11462020874023438, -0.10257530212402344, -0.0905303955078125, -0.07848548889160156, -0.06644058227539062, -0.05439567565917969, -0.04235076904296875, -0.030305862426757812, -0.018260955810546875, -0.0062160491943359375, 0.005828857421875, 0.017873764038085938, 0.029918670654296875, 0.04196357727050781, 0.05400848388671875, 0.06605339050292969, 0.07809829711914062, 0.09014320373535156, 0.1021881103515625, 0.11423301696777344, 0.12627792358398438, 0.1383228302001953, 0.15036773681640625, 0.1624126434326172, 0.17445755004882812, 0.18650245666503906, 0.19854736328125, 0.21059226989746094, 0.22263717651367188, 0.2346820831298828, 0.24672698974609375, 0.2587718963623047, 0.2708168029785156, 0.28286170959472656, 0.2949066162109375, 0.30695152282714844, 0.3189964294433594, 0.3310413360595703, 0.34308624267578125, 0.3551311492919922, 0.3671760559082031, 0.37922096252441406, 0.391265869140625, 0.40331077575683594, 0.4153556823730469, 0.4274005889892578, 0.43944549560546875, 0.4514904022216797, 0.4635353088378906, 0.47558021545410156, 0.4876251220703125, 0.49967002868652344, 0.5117149353027344, 0.5237598419189453, 0.5358047485351562, 0.5478496551513672, 0.5598945617675781, 0.5719394683837891, 0.583984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 11.0, 11.0, 8.0, 11.0, 11.0, 17.0, 40.0, 43.0, 65.0, 98.0, 98.0, 124.0, 108.0, 105.0, 58.0, 51.0, 48.0, 20.0, 27.0, 13.0, 10.0, 2.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6872037649154663, -0.6650705933570862, -0.6429374814033508, -0.6208043098449707, -0.5986711978912354, -0.5765380263328552, -0.5544048547744751, -0.5322717428207397, -0.5101385712623596, -0.4880054295063019, -0.46587228775024414, -0.443739116191864, -0.4216059744358063, -0.39947283267974854, -0.3773396909236908, -0.35520654916763306, -0.3330734074115753, -0.3109402656555176, -0.28880712389945984, -0.2666739821434021, -0.24454081058502197, -0.22240766882896423, -0.2002745270729065, -0.17814137041568756, -0.15600822865962982, -0.13387508690357208, -0.11174193024635315, -0.08960878849029541, -0.06747563928365707, -0.04534249007701874, -0.023209348320961, -0.0010761916637420654, 0.021056950092315674, 0.04319009929895401, 0.06532324850559235, 0.08745639026165009, 0.10958953946828842, 0.13172268867492676, 0.1538558304309845, 0.17598898708820343, 0.19812212884426117, 0.2202552706003189, 0.24238842725753784, 0.2645215690135956, 0.2866547107696533, 0.30878788232803345, 0.3309209942817688, 0.3530541658401489, 0.37518730759620667, 0.3973204493522644, 0.41945359110832214, 0.4415867328643799, 0.46371990442276, 0.48585304617881775, 0.5079861879348755, 0.5301193594932556, 0.552252471446991, 0.5743856430053711, 0.5965187549591064, 0.6186519265174866, 0.6407850384712219, 0.662918210029602, 0.6850513219833374, 0.7071844935417175, 0.7293176651000977]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 7.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 22.0, 26.0, 31.0, 30.0, 24.0, 33.0, 40.0, 30.0, 35.0, 42.0, 41.0, 48.0, 31.0, 34.0, 42.0, 37.0, 39.0, 33.0, 22.0, 32.0, 30.0, 23.0, 26.0, 17.0, 16.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 9.0, 3.0, 7.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3262641429901123, -0.3152258098125458, -0.30418750643730164, -0.2931491732597351, -0.28211086988449097, -0.27107253670692444, -0.2600342035293579, -0.24899590015411377, -0.23795756697654724, -0.2269192487001419, -0.21588093042373657, -0.20484259724617004, -0.1938042789697647, -0.18276596069335938, -0.17172764241695404, -0.1606893241405487, -0.14965100586414337, -0.13861268758773804, -0.1275743693113327, -0.11653604358434677, -0.10549771785736084, -0.0944593995809555, -0.08342108130455017, -0.07238275557756424, -0.061344437301158905, -0.05030611529946327, -0.03926779329776764, -0.028229475021362305, -0.017191153019666672, -0.006152831017971039, 0.004885487258434296, 0.015923812985420227, 0.02696213126182556, 0.038000453263521194, 0.04903877526521683, 0.06007709354162216, 0.0711154192686081, 0.08215373754501343, 0.09319205582141876, 0.1042303815484047, 0.11526869982481003, 0.12630702555179596, 0.1373453438282013, 0.14838366210460663, 0.15942198038101196, 0.1704603135585785, 0.18149861693382263, 0.19253695011138916, 0.2035752683877945, 0.21461358666419983, 0.22565190494060516, 0.2366902232170105, 0.24772855639457703, 0.25876688957214355, 0.2698051929473877, 0.2808435261249542, 0.29188182950019836, 0.3029201626777649, 0.31395846605300903, 0.32499679923057556, 0.3360351026058197, 0.34707343578338623, 0.35811173915863037, 0.3691500723361969, 0.3801884055137634]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 17.0, 24.0, 37.0, 49.0, 99.0, 152.0, 220.0, 387.0, 619.0, 1067.0, 1700.0, 2976.0, 5454.0, 10506.0, 22134.0, 49002.0, 117040.0, 264234.0, 306284.0, 149049.0, 62241.0, 27102.0, 12999.0, 6513.0, 3542.0, 1986.0, 1156.0, 741.0, 423.0, 297.0, 172.0, 105.0, 88.0, 29.0, 28.0, 16.0, 16.0, 6.0, 0.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.224365234375, -0.2181568145751953, -0.21194839477539062, -0.20573997497558594, -0.19953155517578125, -0.19332313537597656, -0.18711471557617188, -0.1809062957763672, -0.1746978759765625, -0.1684894561767578, -0.16228103637695312, -0.15607261657714844, -0.14986419677734375, -0.14365577697753906, -0.13744735717773438, -0.1312389373779297, -0.125030517578125, -0.11882209777832031, -0.11261367797851562, -0.10640525817871094, -0.10019683837890625, -0.09398841857910156, -0.08777999877929688, -0.08157157897949219, -0.0753631591796875, -0.06915473937988281, -0.06294631958007812, -0.05673789978027344, -0.05052947998046875, -0.04432106018066406, -0.038112640380859375, -0.03190422058105469, -0.02569580078125, -0.019487380981445312, -0.013278961181640625, -0.0070705413818359375, -0.00086212158203125, 0.0053462982177734375, 0.011554718017578125, 0.017763137817382812, 0.0239715576171875, 0.030179977416992188, 0.036388397216796875, 0.04259681701660156, 0.04880523681640625, 0.05501365661621094, 0.061222076416015625, 0.06743049621582031, 0.073638916015625, 0.07984733581542969, 0.08605575561523438, 0.09226417541503906, 0.09847259521484375, 0.10468101501464844, 0.11088943481445312, 0.11709785461425781, 0.1233062744140625, 0.1295146942138672, 0.13572311401367188, 0.14193153381347656, 0.14813995361328125, 0.15434837341308594, 0.16055679321289062, 0.1667652130126953, 0.1729736328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 18.0, 24.0, 20.0, 28.0, 38.0, 32.0, 49.0, 43.0, 48.0, 61.0, 48.0, 57.0, 73.0, 73.0, 63.0, 48.0, 52.0, 25.0, 36.0, 26.0, 25.0, 14.0, 14.0, 12.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1474609375, -0.14361858367919922, -0.13977622985839844, -0.13593387603759766, -0.13209152221679688, -0.1282491683959961, -0.12440681457519531, -0.12056446075439453, -0.11672210693359375, -0.11287975311279297, -0.10903739929199219, -0.1051950454711914, -0.10135269165039062, -0.09751033782958984, -0.09366798400878906, -0.08982563018798828, -0.0859832763671875, -0.08214092254638672, -0.07829856872558594, -0.07445621490478516, -0.07061386108398438, -0.0667715072631836, -0.06292915344238281, -0.05908679962158203, -0.05524444580078125, -0.05140209197998047, -0.04755973815917969, -0.043717384338378906, -0.039875030517578125, -0.036032676696777344, -0.03219032287597656, -0.02834796905517578, -0.024505615234375, -0.02066326141357422, -0.016820907592773438, -0.012978553771972656, -0.009136199951171875, -0.005293846130371094, -0.0014514923095703125, 0.0023908615112304688, 0.00623321533203125, 0.010075569152832031, 0.013917922973632812, 0.017760276794433594, 0.021602630615234375, 0.025444984436035156, 0.029287338256835938, 0.03312969207763672, 0.0369720458984375, 0.04081439971923828, 0.04465675354003906, 0.048499107360839844, 0.052341461181640625, 0.056183815002441406, 0.06002616882324219, 0.06386852264404297, 0.06771087646484375, 0.07155323028564453, 0.07539558410644531, 0.0792379379272461, 0.08308029174804688, 0.08692264556884766, 0.09076499938964844, 0.09460735321044922, 0.09844970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 14.0, 22.0, 36.0, 48.0, 81.0, 147.0, 185.0, 294.0, 541.0, 1037.0, 2499.0, 7853.0, 40465.0, 405540.0, 524198.0, 50763.0, 9367.0, 2862.0, 1103.0, 564.0, 320.0, 184.0, 126.0, 76.0, 61.0, 36.0, 31.0, 22.0, 15.0, 7.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.568359375, -0.5525970458984375, -0.536834716796875, -0.5210723876953125, -0.50531005859375, -0.4895477294921875, -0.473785400390625, -0.4580230712890625, -0.4422607421875, -0.4264984130859375, -0.410736083984375, -0.3949737548828125, -0.37921142578125, -0.3634490966796875, -0.347686767578125, -0.3319244384765625, -0.316162109375, -0.3003997802734375, -0.284637451171875, -0.2688751220703125, -0.25311279296875, -0.2373504638671875, -0.221588134765625, -0.2058258056640625, -0.1900634765625, -0.1743011474609375, -0.158538818359375, -0.1427764892578125, -0.12701416015625, -0.1112518310546875, -0.095489501953125, -0.0797271728515625, -0.06396484375, -0.0482025146484375, -0.032440185546875, -0.0166778564453125, -0.00091552734375, 0.0148468017578125, 0.030609130859375, 0.0463714599609375, 0.0621337890625, 0.0778961181640625, 0.093658447265625, 0.1094207763671875, 0.12518310546875, 0.1409454345703125, 0.156707763671875, 0.1724700927734375, 0.188232421875, 0.2039947509765625, 0.219757080078125, 0.2355194091796875, 0.25128173828125, 0.2670440673828125, 0.282806396484375, 0.2985687255859375, 0.3143310546875, 0.3300933837890625, 0.345855712890625, 0.3616180419921875, 0.37738037109375, 0.3931427001953125, 0.408905029296875, 0.4246673583984375, 0.4404296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 18.0, 8.0, 15.0, 25.0, 27.0, 33.0, 27.0, 32.0, 44.0, 34.0, 38.0, 45.0, 46.0, 53.0, 45.0, 54.0, 47.0, 38.0, 44.0, 38.0, 36.0, 38.0, 32.0, 21.0, 22.0, 20.0, 14.0, 18.0, 18.0, 7.0, 15.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5185546875, -0.5017929077148438, -0.4850311279296875, -0.46826934814453125, -0.451507568359375, -0.43474578857421875, -0.4179840087890625, -0.40122222900390625, -0.38446044921875, -0.36769866943359375, -0.3509368896484375, -0.33417510986328125, -0.317413330078125, -0.30065155029296875, -0.2838897705078125, -0.26712799072265625, -0.2503662109375, -0.23360443115234375, -0.2168426513671875, -0.20008087158203125, -0.183319091796875, -0.16655731201171875, -0.1497955322265625, -0.13303375244140625, -0.11627197265625, -0.09951019287109375, -0.0827484130859375, -0.06598663330078125, -0.049224853515625, -0.03246307373046875, -0.0157012939453125, 0.00106048583984375, 0.017822265625, 0.03458404541015625, 0.0513458251953125, 0.06810760498046875, 0.084869384765625, 0.10163116455078125, 0.1183929443359375, 0.13515472412109375, 0.15191650390625, 0.16867828369140625, 0.1854400634765625, 0.20220184326171875, 0.218963623046875, 0.23572540283203125, 0.2524871826171875, 0.26924896240234375, 0.2860107421875, 0.30277252197265625, 0.3195343017578125, 0.33629608154296875, 0.353057861328125, 0.36981964111328125, 0.3865814208984375, 0.40334320068359375, 0.42010498046875, 0.43686676025390625, 0.4536285400390625, 0.47039031982421875, 0.487152099609375, 0.5039138793945312, 0.5206756591796875, 0.5374374389648438, 0.55419921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 10.0, 14.0, 17.0, 43.0, 55.0, 98.0, 195.0, 330.0, 808.0, 2241.0, 9113.0, 65845.0, 767635.0, 179653.0, 16793.0, 3499.0, 1171.0, 471.0, 231.0, 131.0, 85.0, 40.0, 17.0, 23.0, 10.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345458984375, -0.3348884582519531, -0.32431793212890625, -0.3137474060058594, -0.3031768798828125, -0.2926063537597656, -0.28203582763671875, -0.2714653015136719, -0.260894775390625, -0.2503242492675781, -0.23975372314453125, -0.22918319702148438, -0.2186126708984375, -0.20804214477539062, -0.19747161865234375, -0.18690109252929688, -0.17633056640625, -0.16576004028320312, -0.15518951416015625, -0.14461898803710938, -0.1340484619140625, -0.12347793579101562, -0.11290740966796875, -0.10233688354492188, -0.091766357421875, -0.08119583129882812, -0.07062530517578125, -0.060054779052734375, -0.0494842529296875, -0.038913726806640625, -0.02834320068359375, -0.017772674560546875, -0.0072021484375, 0.003368377685546875, 0.01393890380859375, 0.024509429931640625, 0.0350799560546875, 0.045650482177734375, 0.05622100830078125, 0.06679153442382812, 0.077362060546875, 0.08793258666992188, 0.09850311279296875, 0.10907363891601562, 0.1196441650390625, 0.13021469116210938, 0.14078521728515625, 0.15135574340820312, 0.16192626953125, 0.17249679565429688, 0.18306732177734375, 0.19363784790039062, 0.2042083740234375, 0.21477890014648438, 0.22534942626953125, 0.23591995239257812, 0.246490478515625, 0.2570610046386719, 0.26763153076171875, 0.2782020568847656, 0.2887725830078125, 0.2993431091308594, 0.30991363525390625, 0.3204841613769531, 0.3310546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 6.0, 6.0, 12.0, 9.0, 13.0, 28.0, 34.0, 40.0, 77.0, 66.0, 98.0, 92.0, 84.0, 100.0, 62.0, 66.0, 46.0, 39.0, 30.0, 11.0, 11.0, 18.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.327615559101105e-05, -3.192201256752014e-05, -3.0567869544029236e-05, -2.921372652053833e-05, -2.7859583497047424e-05, -2.650544047355652e-05, -2.5151297450065613e-05, -2.3797154426574707e-05, -2.24430114030838e-05, -2.1088868379592896e-05, -1.973472535610199e-05, -1.8380582332611084e-05, -1.7026439309120178e-05, -1.5672296285629272e-05, -1.4318153262138367e-05, -1.2964010238647461e-05, -1.1609867215156555e-05, -1.025572419166565e-05, -8.901581168174744e-06, -7.547438144683838e-06, -6.193295121192932e-06, -4.839152097702026e-06, -3.4850090742111206e-06, -2.130866050720215e-06, -7.767230272293091e-07, 5.774199962615967e-07, 1.9315630197525024e-06, 3.285706043243408e-06, 4.639849066734314e-06, 5.99399209022522e-06, 7.3481351137161255e-06, 8.702278137207031e-06, 1.0056421160697937e-05, 1.1410564184188843e-05, 1.2764707207679749e-05, 1.4118850231170654e-05, 1.547299325466156e-05, 1.6827136278152466e-05, 1.818127930164337e-05, 1.9535422325134277e-05, 2.0889565348625183e-05, 2.224370837211609e-05, 2.3597851395606995e-05, 2.49519944190979e-05, 2.6306137442588806e-05, 2.7660280466079712e-05, 2.9014423489570618e-05, 3.0368566513061523e-05, 3.172270953655243e-05, 3.3076852560043335e-05, 3.443099558353424e-05, 3.5785138607025146e-05, 3.713928163051605e-05, 3.849342465400696e-05, 3.9847567677497864e-05, 4.120171070098877e-05, 4.2555853724479675e-05, 4.390999674797058e-05, 4.526413977146149e-05, 4.661828279495239e-05, 4.79724258184433e-05, 4.9326568841934204e-05, 5.068071186542511e-05, 5.2034854888916016e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 0.0, 6.0, 10.0, 7.0, 15.0, 22.0, 29.0, 60.0, 102.0, 176.0, 336.0, 736.0, 1810.0, 5548.0, 25670.0, 274539.0, 664772.0, 60126.0, 9707.0, 2792.0, 1018.0, 483.0, 230.0, 127.0, 74.0, 50.0, 36.0, 28.0, 10.0, 12.0, 9.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23136329650878906, -0.22139358520507812, -0.2114238739013672, -0.20145416259765625, -0.1914844512939453, -0.18151473999023438, -0.17154502868652344, -0.1615753173828125, -0.15160560607910156, -0.14163589477539062, -0.1316661834716797, -0.12169647216796875, -0.11172676086425781, -0.10175704956054688, -0.09178733825683594, -0.081817626953125, -0.07184791564941406, -0.061878204345703125, -0.05190849304199219, -0.04193878173828125, -0.03196907043457031, -0.021999359130859375, -0.012029647827148438, -0.0020599365234375, 0.007909774780273438, 0.017879486083984375, 0.027849197387695312, 0.03781890869140625, 0.04778861999511719, 0.057758331298828125, 0.06772804260253906, 0.07769775390625, 0.08766746520996094, 0.09763717651367188, 0.10760688781738281, 0.11757659912109375, 0.1275463104248047, 0.13751602172851562, 0.14748573303222656, 0.1574554443359375, 0.16742515563964844, 0.17739486694335938, 0.1873645782470703, 0.19733428955078125, 0.2073040008544922, 0.21727371215820312, 0.22724342346191406, 0.237213134765625, 0.24718284606933594, 0.2571525573730469, 0.2671222686767578, 0.27709197998046875, 0.2870616912841797, 0.2970314025878906, 0.30700111389160156, 0.3169708251953125, 0.32694053649902344, 0.3369102478027344, 0.3468799591064453, 0.35684967041015625, 0.3668193817138672, 0.3767890930175781, 0.38675880432128906, 0.396728515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 14.0, 22.0, 33.0, 42.0, 65.0, 83.0, 113.0, 112.0, 97.0, 94.0, 91.0, 63.0, 32.0, 28.0, 26.0, 17.0, 14.0, 11.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22362518310546875, -0.2153167724609375, -0.20700836181640625, -0.198699951171875, -0.19039154052734375, -0.1820831298828125, -0.17377471923828125, -0.16546630859375, -0.15715789794921875, -0.1488494873046875, -0.14054107666015625, -0.132232666015625, -0.12392425537109375, -0.1156158447265625, -0.10730743408203125, -0.0989990234375, -0.09069061279296875, -0.0823822021484375, -0.07407379150390625, -0.065765380859375, -0.05745697021484375, -0.0491485595703125, -0.04084014892578125, -0.03253173828125, -0.02422332763671875, -0.0159149169921875, -0.00760650634765625, 0.000701904296875, 0.00901031494140625, 0.0173187255859375, 0.02562713623046875, 0.033935546875, 0.04224395751953125, 0.0505523681640625, 0.05886077880859375, 0.067169189453125, 0.07547760009765625, 0.0837860107421875, 0.09209442138671875, 0.10040283203125, 0.10871124267578125, 0.1170196533203125, 0.12532806396484375, 0.133636474609375, 0.14194488525390625, 0.1502532958984375, 0.15856170654296875, 0.1668701171875, 0.17517852783203125, 0.1834869384765625, 0.19179534912109375, 0.200103759765625, 0.20841217041015625, 0.2167205810546875, 0.22502899169921875, 0.23333740234375, 0.24164581298828125, 0.2499542236328125, 0.25826263427734375, 0.266571044921875, 0.27487945556640625, 0.2831878662109375, 0.29149627685546875, 0.2998046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 18.0, 25.0, 70.0, 96.0, 146.0, 183.0, 171.0, 124.0, 81.0, 38.0, 18.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.785530090332031, -4.6339921951293945, -4.482454776763916, -4.330916881561279, -4.179378986358643, -4.027841567993164, -3.8763036727905273, -3.7247657775878906, -3.573228120803833, -3.4216904640197754, -3.2701525688171387, -3.118614912033081, -2.9670772552490234, -2.8155393600463867, -2.664001703262329, -2.5124640464782715, -2.3609261512756348, -2.209388494491577, -2.0578505992889404, -1.9063129425048828, -1.7547751665115356, -1.6032373905181885, -1.4516997337341309, -1.3001619577407837, -1.1486241817474365, -0.9970864057540894, -0.845548689365387, -0.6940109729766846, -0.5424731969833374, -0.39093542098999023, -0.23939770460128784, -0.08785998821258545, 0.06367778778076172, 0.2152155339717865, 0.3667532801628113, 0.5182909965515137, 0.6698287725448608, 0.821366548538208, 0.9729042649269104, 1.1244419813156128, 1.27597975730896, 1.4275175333023071, 1.5790553092956543, 1.730592966079712, 1.882130742073059, 2.0336685180664062, 2.185206174850464, 2.3367438316345215, 2.488281726837158, 2.639819383621216, 2.7913572788238525, 2.94289493560791, 3.094432830810547, 3.2459704875946045, 3.397508144378662, 3.549046039581299, 3.7005836963653564, 3.852121353149414, 4.003659248352051, 4.1551971435546875, 4.306734561920166, 4.458272457122803, 4.6098103523254395, 4.761347770690918, 4.912885665893555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 9.0, 8.0, 13.0, 13.0, 13.0, 18.0, 15.0, 20.0, 23.0, 25.0, 21.0, 35.0, 53.0, 44.0, 53.0, 54.0, 51.0, 51.0, 51.0, 43.0, 42.0, 42.0, 33.0, 36.0, 37.0, 24.0, 18.0, 23.0, 15.0, 17.0, 11.0, 16.0, 9.0, 11.0, 8.0, 6.0, 4.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.340937376022339, -2.2659387588500977, -2.1909403800964355, -2.1159417629241943, -2.0409433841705322, -1.965944766998291, -1.8909462690353394, -1.8159477710723877, -1.740949273109436, -1.6659507751464844, -1.5909522771835327, -1.515953779220581, -1.4409551620483398, -1.3659567832946777, -1.2909581661224365, -1.2159596681594849, -1.1409611701965332, -1.0659626722335815, -0.9909641742706299, -0.9159656167030334, -0.8409671187400818, -0.7659686207771301, -0.6909700632095337, -0.615971565246582, -0.5409730672836304, -0.4659745693206787, -0.39097604155540466, -0.3159775137901306, -0.24097901582717896, -0.1659805178642273, -0.09098199009895325, -0.0159834623336792, 0.05901527404785156, 0.13401378691196442, 0.20901229977607727, 0.2840108275413513, 0.359009325504303, 0.43400782346725464, 0.5090063810348511, 0.5840048789978027, 0.6590033769607544, 0.734001874923706, 0.8090003728866577, 0.8839989304542542, 0.9589974284172058, 1.0339958667755127, 1.108994483947754, 1.1839929819107056, 1.2589914798736572, 1.3339899778366089, 1.4089884757995605, 1.4839869737625122, 1.5589854717254639, 1.633984088897705, 1.7089825868606567, 1.7839810848236084, 1.85897958278656, 1.9339780807495117, 2.008976697921753, 2.083975076675415, 2.1589736938476562, 2.2339720726013184, 2.3089706897735596, 2.383969306945801, 2.458967685699463]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 20.0, 25.0, 34.0, 30.0, 57.0, 63.0, 89.0, 142.0, 222.0, 280.0, 407.0, 707.0, 1224.0, 2449.0, 6496.0, 33467.0, 4114581.0, 23304.0, 5353.0, 2220.0, 1155.0, 606.0, 419.0, 256.0, 168.0, 132.0, 85.0, 81.0, 58.0, 44.0, 23.0, 26.0, 19.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5263671875, -0.5101318359375, -0.493896484375, -0.4776611328125, -0.46142578125, -0.4451904296875, -0.428955078125, -0.4127197265625, -0.396484375, -0.3802490234375, -0.364013671875, -0.3477783203125, -0.33154296875, -0.3153076171875, -0.299072265625, -0.2828369140625, -0.2666015625, -0.2503662109375, -0.234130859375, -0.2178955078125, -0.20166015625, -0.1854248046875, -0.169189453125, -0.1529541015625, -0.13671875, -0.1204833984375, -0.104248046875, -0.0880126953125, -0.07177734375, -0.0555419921875, -0.039306640625, -0.0230712890625, -0.0068359375, 0.0093994140625, 0.025634765625, 0.0418701171875, 0.05810546875, 0.0743408203125, 0.090576171875, 0.1068115234375, 0.123046875, 0.1392822265625, 0.155517578125, 0.1717529296875, 0.18798828125, 0.2042236328125, 0.220458984375, 0.2366943359375, 0.2529296875, 0.2691650390625, 0.285400390625, 0.3016357421875, 0.31787109375, 0.3341064453125, 0.350341796875, 0.3665771484375, 0.3828125, 0.3990478515625, 0.415283203125, 0.4315185546875, 0.44775390625, 0.4639892578125, 0.480224609375, 0.4964599609375, 0.5126953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 12.0, 13.0, 15.0, 14.0, 29.0, 21.0, 28.0, 31.0, 29.0, 43.0, 69.0, 59.0, 68.0, 64.0, 70.0, 62.0, 61.0, 52.0, 42.0, 44.0, 43.0, 30.0, 35.0, 7.0, 16.0, 4.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.1479644775390625, -0.143707275390625, -0.1394500732421875, -0.13519287109375, -0.1309356689453125, -0.126678466796875, -0.1224212646484375, -0.1181640625, -0.1139068603515625, -0.109649658203125, -0.1053924560546875, -0.10113525390625, -0.0968780517578125, -0.092620849609375, -0.0883636474609375, -0.0841064453125, -0.0798492431640625, -0.075592041015625, -0.0713348388671875, -0.06707763671875, -0.0628204345703125, -0.058563232421875, -0.0543060302734375, -0.050048828125, -0.0457916259765625, -0.041534423828125, -0.0372772216796875, -0.03302001953125, -0.0287628173828125, -0.024505615234375, -0.0202484130859375, -0.0159912109375, -0.0117340087890625, -0.007476806640625, -0.0032196044921875, 0.00103759765625, 0.0052947998046875, 0.009552001953125, 0.0138092041015625, 0.01806640625, 0.0223236083984375, 0.026580810546875, 0.0308380126953125, 0.03509521484375, 0.0393524169921875, 0.043609619140625, 0.0478668212890625, 0.0521240234375, 0.0563812255859375, 0.060638427734375, 0.0648956298828125, 0.06915283203125, 0.0734100341796875, 0.077667236328125, 0.0819244384765625, 0.086181640625, 0.0904388427734375, 0.094696044921875, 0.0989532470703125, 0.10321044921875, 0.1074676513671875, 0.111724853515625, 0.1159820556640625, 0.1202392578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 7.0, 12.0, 10.0, 29.0, 34.0, 49.0, 64.0, 67.0, 98.0, 158.0, 244.0, 376.0, 667.0, 1408.0, 3572.0, 12472.0, 289997.0, 3864122.0, 13750.0, 3830.0, 1461.0, 695.0, 389.0, 220.0, 161.0, 102.0, 78.0, 59.0, 37.0, 23.0, 28.0, 17.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8232421875, -0.7975387573242188, -0.7718353271484375, -0.7461318969726562, -0.720428466796875, -0.6947250366210938, -0.6690216064453125, -0.6433181762695312, -0.61761474609375, -0.5919113159179688, -0.5662078857421875, -0.5405044555664062, -0.514801025390625, -0.48909759521484375, -0.4633941650390625, -0.43769073486328125, -0.4119873046875, -0.38628387451171875, -0.3605804443359375, -0.33487701416015625, -0.309173583984375, -0.28347015380859375, -0.2577667236328125, -0.23206329345703125, -0.20635986328125, -0.18065643310546875, -0.1549530029296875, -0.12924957275390625, -0.103546142578125, -0.07784271240234375, -0.0521392822265625, -0.02643585205078125, -0.000732421875, 0.02497100830078125, 0.0506744384765625, 0.07637786865234375, 0.102081298828125, 0.12778472900390625, 0.1534881591796875, 0.17919158935546875, 0.20489501953125, 0.23059844970703125, 0.2563018798828125, 0.28200531005859375, 0.307708740234375, 0.33341217041015625, 0.3591156005859375, 0.38481903076171875, 0.4105224609375, 0.43622589111328125, 0.4619293212890625, 0.48763275146484375, 0.513336181640625, 0.5390396118164062, 0.5647430419921875, 0.5904464721679688, 0.61614990234375, 0.6418533325195312, 0.6675567626953125, 0.6932601928710938, 0.718963623046875, 0.7446670532226562, 0.7703704833984375, 0.7960739135742188, 0.82177734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 4.0, 6.0, 3.0, 8.0, 23.0, 41.0, 423.0, 3468.0, 49.0, 22.0, 13.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23950576782226562, -0.23303985595703125, -0.22657394409179688, -0.2201080322265625, -0.21364212036132812, -0.20717620849609375, -0.20071029663085938, -0.194244384765625, -0.18777847290039062, -0.18131256103515625, -0.17484664916992188, -0.1683807373046875, -0.16191482543945312, -0.15544891357421875, -0.14898300170898438, -0.14251708984375, -0.13605117797851562, -0.12958526611328125, -0.12311935424804688, -0.1166534423828125, -0.11018753051757812, -0.10372161865234375, -0.09725570678710938, -0.090789794921875, -0.08432388305664062, -0.07785797119140625, -0.07139205932617188, -0.0649261474609375, -0.058460235595703125, -0.05199432373046875, -0.045528411865234375, -0.0390625, -0.032596588134765625, -0.02613067626953125, -0.019664764404296875, -0.0131988525390625, -0.006732940673828125, -0.00026702880859375, 0.006198883056640625, 0.012664794921875, 0.019130706787109375, 0.02559661865234375, 0.032062530517578125, 0.0385284423828125, 0.044994354248046875, 0.05146026611328125, 0.057926177978515625, 0.06439208984375, 0.07085800170898438, 0.07732391357421875, 0.08378982543945312, 0.0902557373046875, 0.09672164916992188, 0.10318756103515625, 0.10965347290039062, 0.116119384765625, 0.12258529663085938, 0.12905120849609375, 0.13551712036132812, 0.1419830322265625, 0.14844894409179688, 0.15491485595703125, 0.16138076782226562, 0.1678466796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 5.0, 9.0, 16.0, 27.0, 40.0, 55.0, 96.0, 109.0, 114.0, 131.0, 121.0, 92.0, 63.0, 28.0, 26.0, 20.0, 16.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5904878377914429, -0.574653148651123, -0.5588184595108032, -0.5429837107658386, -0.5271490216255188, -0.511314332485199, -0.49547961354255676, -0.47964489459991455, -0.4638102054595947, -0.4479755163192749, -0.4321407973766327, -0.4163060784339905, -0.40047138929367065, -0.38463670015335083, -0.3688019812107086, -0.3529672622680664, -0.3371325731277466, -0.32129788398742676, -0.30546316504478455, -0.28962844610214233, -0.2737937569618225, -0.2579590678215027, -0.24212434887886047, -0.22628964483737946, -0.21045494079589844, -0.19462023675441742, -0.1787855327129364, -0.16295082867145538, -0.14711612462997437, -0.13128142058849335, -0.11544671654701233, -0.09961201250553131, -0.08377724885940552, -0.0679425448179245, -0.05210784077644348, -0.03627313673496246, -0.020438432693481445, -0.004603728652000427, 0.01123097538948059, 0.02706567943096161, 0.04290038347244263, 0.058735087513923645, 0.07456979155540466, 0.09040449559688568, 0.1062391996383667, 0.12207390367984772, 0.13790860772132874, 0.15374331176280975, 0.16957801580429077, 0.1854127198457718, 0.2012474238872528, 0.21708212792873383, 0.23291683197021484, 0.24875153601169586, 0.2645862400531769, 0.2804209589958191, 0.2962556481361389, 0.31209033727645874, 0.32792505621910095, 0.34375977516174316, 0.359594464302063, 0.3754291534423828, 0.391263872385025, 0.40709859132766724, 0.42293328046798706]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 13.0, 19.0, 19.0, 16.0, 23.0, 22.0, 32.0, 20.0, 33.0, 33.0, 40.0, 33.0, 48.0, 29.0, 44.0, 41.0, 43.0, 36.0, 28.0, 37.0, 31.0, 45.0, 36.0, 33.0, 15.0, 20.0, 22.0, 17.0, 18.0, 18.0, 13.0, 18.0, 18.0, 8.0, 8.0, 12.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22275447845458984, -0.21590979397296906, -0.20906510949134827, -0.20222041010856628, -0.1953757256269455, -0.1885310411453247, -0.18168634176254272, -0.17484165728092194, -0.16799697279930115, -0.16115228831768036, -0.15430760383605957, -0.1474629044532776, -0.1406182199716568, -0.133773535490036, -0.12692883610725403, -0.12008415162563324, -0.11323946714401245, -0.10639478266239166, -0.09955009073019028, -0.09270539879798889, -0.0858607143163681, -0.07901602983474731, -0.07217133790254593, -0.06532664597034454, -0.058481961488723755, -0.05163727328181267, -0.04479258507490158, -0.037947896867990494, -0.031103208661079407, -0.02425852045416832, -0.017413832247257233, -0.010569144040346146, -0.0037244558334350586, 0.0031202323734760284, 0.009964920580387115, 0.016809608787298203, 0.02365429699420929, 0.030498985201120377, 0.037343673408031464, 0.04418836161494255, 0.05103304982185364, 0.057877738028764725, 0.06472242623567581, 0.0715671181678772, 0.07841180264949799, 0.08525648713111877, 0.09210117906332016, 0.09894587099552155, 0.10579055547714233, 0.11263523995876312, 0.11947993189096451, 0.1263246238231659, 0.13316930830478668, 0.14001399278640747, 0.14685869216918945, 0.15370337665081024, 0.16054806113243103, 0.16739274561405182, 0.1742374300956726, 0.1810821294784546, 0.18792681396007538, 0.19477149844169617, 0.20161619782447815, 0.20846088230609894, 0.21530556678771973]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 14.0, 37.0, 38.0, 61.0, 129.0, 171.0, 272.0, 444.0, 669.0, 1182.0, 1931.0, 3572.0, 6511.0, 12468.0, 24290.0, 49406.0, 100855.0, 199051.0, 279832.0, 183705.0, 91317.0, 44958.0, 22230.0, 11420.0, 5958.0, 3249.0, 1872.0, 1094.0, 639.0, 401.0, 240.0, 172.0, 96.0, 73.0, 53.0, 31.0, 26.0, 20.0, 14.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15048599243164062, -0.14569854736328125, -0.14091110229492188, -0.1361236572265625, -0.13133621215820312, -0.12654876708984375, -0.12176132202148438, -0.116973876953125, -0.11218643188476562, -0.10739898681640625, -0.10261154174804688, -0.0978240966796875, -0.09303665161132812, -0.08824920654296875, -0.08346176147460938, -0.07867431640625, -0.07388687133789062, -0.06909942626953125, -0.06431198120117188, -0.0595245361328125, -0.054737091064453125, -0.04994964599609375, -0.045162200927734375, -0.040374755859375, -0.035587310791015625, -0.03079986572265625, -0.026012420654296875, -0.0212249755859375, -0.016437530517578125, -0.01165008544921875, -0.006862640380859375, -0.0020751953125, 0.002712249755859375, 0.00749969482421875, 0.012287139892578125, 0.0170745849609375, 0.021862030029296875, 0.02664947509765625, 0.031436920166015625, 0.036224365234375, 0.041011810302734375, 0.04579925537109375, 0.050586700439453125, 0.0553741455078125, 0.060161590576171875, 0.06494903564453125, 0.06973648071289062, 0.07452392578125, 0.07931137084960938, 0.08409881591796875, 0.08888626098632812, 0.0936737060546875, 0.09846115112304688, 0.10324859619140625, 0.10803604125976562, 0.112823486328125, 0.11761093139648438, 0.12239837646484375, 0.12718582153320312, 0.1319732666015625, 0.13676071166992188, 0.14154815673828125, 0.14633560180664062, 0.151123046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 13.0, 10.0, 18.0, 16.0, 24.0, 26.0, 35.0, 42.0, 41.0, 38.0, 63.0, 73.0, 72.0, 63.0, 60.0, 67.0, 67.0, 47.0, 48.0, 39.0, 31.0, 22.0, 22.0, 17.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15725326538085938, -0.15251922607421875, -0.14778518676757812, -0.1430511474609375, -0.13831710815429688, -0.13358306884765625, -0.12884902954101562, -0.124114990234375, -0.11938095092773438, -0.11464691162109375, -0.10991287231445312, -0.1051788330078125, -0.10044479370117188, -0.09571075439453125, -0.09097671508789062, -0.08624267578125, -0.08150863647460938, -0.07677459716796875, -0.07204055786132812, -0.0673065185546875, -0.06257247924804688, -0.05783843994140625, -0.053104400634765625, -0.048370361328125, -0.043636322021484375, -0.03890228271484375, -0.034168243408203125, -0.0294342041015625, -0.024700164794921875, -0.01996612548828125, -0.015232086181640625, -0.010498046875, -0.005764007568359375, -0.00102996826171875, 0.003704071044921875, 0.0084381103515625, 0.013172149658203125, 0.01790618896484375, 0.022640228271484375, 0.027374267578125, 0.032108306884765625, 0.03684234619140625, 0.041576385498046875, 0.0463104248046875, 0.051044464111328125, 0.05577850341796875, 0.060512542724609375, 0.06524658203125, 0.06998062133789062, 0.07471466064453125, 0.07944869995117188, 0.0841827392578125, 0.08891677856445312, 0.09365081787109375, 0.09838485717773438, 0.103118896484375, 0.10785293579101562, 0.11258697509765625, 0.11732101440429688, 0.1220550537109375, 0.12678909301757812, 0.13152313232421875, 0.13625717163085938, 0.1409912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 21.0, 9.0, 31.0, 30.0, 43.0, 60.0, 81.0, 75.0, 124.0, 175.0, 249.0, 333.0, 472.0, 740.0, 1428.0, 3172.0, 9614.0, 40706.0, 249322.0, 597281.0, 112280.0, 21213.0, 5680.0, 2170.0, 1099.0, 630.0, 419.0, 255.0, 179.0, 141.0, 114.0, 92.0, 66.0, 55.0, 33.0, 31.0, 20.0, 16.0, 6.0, 11.0, 13.0, 9.0, 2.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.283203125, -0.2738533020019531, -0.26450347900390625, -0.2551536560058594, -0.2458038330078125, -0.23645401000976562, -0.22710418701171875, -0.21775436401367188, -0.208404541015625, -0.19905471801757812, -0.18970489501953125, -0.18035507202148438, -0.1710052490234375, -0.16165542602539062, -0.15230560302734375, -0.14295578002929688, -0.13360595703125, -0.12425613403320312, -0.11490631103515625, -0.10555648803710938, -0.0962066650390625, -0.08685684204101562, -0.07750701904296875, -0.06815719604492188, -0.058807373046875, -0.049457550048828125, -0.04010772705078125, -0.030757904052734375, -0.0214080810546875, -0.012058258056640625, -0.00270843505859375, 0.006641387939453125, 0.0159912109375, 0.025341033935546875, 0.03469085693359375, 0.044040679931640625, 0.0533905029296875, 0.06274032592773438, 0.07209014892578125, 0.08143997192382812, 0.090789794921875, 0.10013961791992188, 0.10948944091796875, 0.11883926391601562, 0.1281890869140625, 0.13753890991210938, 0.14688873291015625, 0.15623855590820312, 0.16558837890625, 0.17493820190429688, 0.18428802490234375, 0.19363784790039062, 0.2029876708984375, 0.21233749389648438, 0.22168731689453125, 0.23103713989257812, 0.240386962890625, 0.24973678588867188, 0.25908660888671875, 0.2684364318847656, 0.2777862548828125, 0.2871360778808594, 0.29648590087890625, 0.3058357238769531, 0.315185546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 15.0, 10.0, 5.0, 9.0, 17.0, 21.0, 24.0, 24.0, 28.0, 23.0, 30.0, 24.0, 34.0, 39.0, 41.0, 54.0, 39.0, 60.0, 39.0, 39.0, 38.0, 38.0, 28.0, 29.0, 30.0, 38.0, 36.0, 24.0, 10.0, 24.0, 32.0, 15.0, 15.0, 12.0, 11.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3796272277832031, -0.36545562744140625, -0.3512840270996094, -0.3371124267578125, -0.3229408264160156, -0.30876922607421875, -0.2945976257324219, -0.280426025390625, -0.2662544250488281, -0.25208282470703125, -0.23791122436523438, -0.2237396240234375, -0.20956802368164062, -0.19539642333984375, -0.18122482299804688, -0.16705322265625, -0.15288162231445312, -0.13871002197265625, -0.12453842163085938, -0.1103668212890625, -0.09619522094726562, -0.08202362060546875, -0.06785202026367188, -0.053680419921875, -0.039508819580078125, -0.02533721923828125, -0.011165618896484375, 0.0030059814453125, 0.017177581787109375, 0.03134918212890625, 0.045520782470703125, 0.0596923828125, 0.07386398315429688, 0.08803558349609375, 0.10220718383789062, 0.1163787841796875, 0.13055038452148438, 0.14472198486328125, 0.15889358520507812, 0.173065185546875, 0.18723678588867188, 0.20140838623046875, 0.21557998657226562, 0.2297515869140625, 0.24392318725585938, 0.25809478759765625, 0.2722663879394531, 0.28643798828125, 0.3006095886230469, 0.31478118896484375, 0.3289527893066406, 0.3431243896484375, 0.3572959899902344, 0.37146759033203125, 0.3856391906738281, 0.399810791015625, 0.4139823913574219, 0.42815399169921875, 0.4423255920410156, 0.4564971923828125, 0.4706687927246094, 0.48484039306640625, 0.4990119934082031, 0.51318359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 16.0, 22.0, 13.0, 37.0, 38.0, 91.0, 144.0, 261.0, 592.0, 1465.0, 4899.0, 28057.0, 422791.0, 548192.0, 33543.0, 5479.0, 1610.0, 626.0, 281.0, 134.0, 87.0, 44.0, 38.0, 19.0, 19.0, 6.0, 9.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.288330078125, -0.2803306579589844, -0.27233123779296875, -0.2643318176269531, -0.2563323974609375, -0.24833297729492188, -0.24033355712890625, -0.23233413696289062, -0.224334716796875, -0.21633529663085938, -0.20833587646484375, -0.20033645629882812, -0.1923370361328125, -0.18433761596679688, -0.17633819580078125, -0.16833877563476562, -0.16033935546875, -0.15233993530273438, -0.14434051513671875, -0.13634109497070312, -0.1283416748046875, -0.12034225463867188, -0.11234283447265625, -0.10434341430664062, -0.096343994140625, -0.08834457397460938, -0.08034515380859375, -0.07234573364257812, -0.0643463134765625, -0.056346893310546875, -0.04834747314453125, -0.040348052978515625, -0.0323486328125, -0.024349212646484375, -0.01634979248046875, -0.008350372314453125, -0.0003509521484375, 0.007648468017578125, 0.01564788818359375, 0.023647308349609375, 0.031646728515625, 0.039646148681640625, 0.04764556884765625, 0.055644989013671875, 0.0636444091796875, 0.07164382934570312, 0.07964324951171875, 0.08764266967773438, 0.09564208984375, 0.10364151000976562, 0.11164093017578125, 0.11964035034179688, 0.1276397705078125, 0.13563919067382812, 0.14363861083984375, 0.15163803100585938, 0.159637451171875, 0.16763687133789062, 0.17563629150390625, 0.18363571166992188, 0.1916351318359375, 0.19963455200195312, 0.20763397216796875, 0.21563339233398438, 0.2236328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 13.0, 17.0, 34.0, 34.0, 49.0, 75.0, 124.0, 157.0, 133.0, 103.0, 74.0, 57.0, 29.0, 26.0, 15.0, 17.0, 10.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.667043685913086e-05, -4.479195922613144e-05, -4.291348159313202e-05, -4.10350039601326e-05, -3.915652632713318e-05, -3.727804869413376e-05, -3.539957106113434e-05, -3.352109342813492e-05, -3.16426157951355e-05, -2.9764138162136078e-05, -2.7885660529136658e-05, -2.6007182896137238e-05, -2.4128705263137817e-05, -2.2250227630138397e-05, -2.0371749997138977e-05, -1.8493272364139557e-05, -1.6614794731140137e-05, -1.4736317098140717e-05, -1.2857839465141296e-05, -1.0979361832141876e-05, -9.100884199142456e-06, -7.222406566143036e-06, -5.343928933143616e-06, -3.4654513001441956e-06, -1.5869736671447754e-06, 2.915039658546448e-07, 2.169981598854065e-06, 4.048459231853485e-06, 5.926936864852905e-06, 7.805414497852325e-06, 9.683892130851746e-06, 1.1562369763851166e-05, 1.3440847396850586e-05, 1.5319325029850006e-05, 1.7197802662849426e-05, 1.9076280295848846e-05, 2.0954757928848267e-05, 2.2833235561847687e-05, 2.4711713194847107e-05, 2.6590190827846527e-05, 2.8468668460845947e-05, 3.0347146093845367e-05, 3.222562372684479e-05, 3.410410135984421e-05, 3.598257899284363e-05, 3.786105662584305e-05, 3.973953425884247e-05, 4.161801189184189e-05, 4.349648952484131e-05, 4.537496715784073e-05, 4.725344479084015e-05, 4.913192242383957e-05, 5.101040005683899e-05, 5.288887768983841e-05, 5.476735532283783e-05, 5.664583295583725e-05, 5.852431058883667e-05, 6.040278822183609e-05, 6.228126585483551e-05, 6.415974348783493e-05, 6.603822112083435e-05, 6.791669875383377e-05, 6.979517638683319e-05, 7.167365401983261e-05, 7.355213165283203e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 26.0, 32.0, 61.0, 108.0, 172.0, 332.0, 820.0, 2184.0, 10323.0, 106401.0, 816587.0, 97932.0, 9754.0, 2267.0, 800.0, 326.0, 168.0, 86.0, 52.0, 31.0, 22.0, 13.0, 7.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3324413299560547, -0.3233299255371094, -0.31421852111816406, -0.30510711669921875, -0.29599571228027344, -0.2868843078613281, -0.2777729034423828, -0.2686614990234375, -0.2595500946044922, -0.2504386901855469, -0.24132728576660156, -0.23221588134765625, -0.22310447692871094, -0.21399307250976562, -0.2048816680908203, -0.195770263671875, -0.1866588592529297, -0.17754745483398438, -0.16843605041503906, -0.15932464599609375, -0.15021324157714844, -0.14110183715820312, -0.1319904327392578, -0.1228790283203125, -0.11376762390136719, -0.10465621948242188, -0.09554481506347656, -0.08643341064453125, -0.07732200622558594, -0.06821060180664062, -0.05909919738769531, -0.04998779296875, -0.04087638854980469, -0.031764984130859375, -0.022653579711914062, -0.01354217529296875, -0.0044307708740234375, 0.004680633544921875, 0.013792037963867188, 0.0229034423828125, 0.03201484680175781, 0.041126251220703125, 0.05023765563964844, 0.05934906005859375, 0.06846046447753906, 0.07757186889648438, 0.08668327331542969, 0.095794677734375, 0.10490608215332031, 0.11401748657226562, 0.12312889099121094, 0.13224029541015625, 0.14135169982910156, 0.15046310424804688, 0.1595745086669922, 0.1686859130859375, 0.1777973175048828, 0.18690872192382812, 0.19602012634277344, 0.20513153076171875, 0.21424293518066406, 0.22335433959960938, 0.2324657440185547, 0.2415771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 15.0, 23.0, 33.0, 48.0, 73.0, 70.0, 119.0, 97.0, 136.0, 91.0, 94.0, 63.0, 41.0, 23.0, 18.0, 14.0, 9.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2871742248535156, -0.28015899658203125, -0.2731437683105469, -0.2661285400390625, -0.2591133117675781, -0.25209808349609375, -0.24508285522460938, -0.238067626953125, -0.23105239868164062, -0.22403717041015625, -0.21702194213867188, -0.2100067138671875, -0.20299148559570312, -0.19597625732421875, -0.18896102905273438, -0.18194580078125, -0.17493057250976562, -0.16791534423828125, -0.16090011596679688, -0.1538848876953125, -0.14686965942382812, -0.13985443115234375, -0.13283920288085938, -0.125823974609375, -0.11880874633789062, -0.11179351806640625, -0.10477828979492188, -0.0977630615234375, -0.09074783325195312, -0.08373260498046875, -0.07671737670898438, -0.0697021484375, -0.06268692016601562, -0.05567169189453125, -0.048656463623046875, -0.0416412353515625, -0.034626007080078125, -0.02761077880859375, -0.020595550537109375, -0.013580322265625, -0.006565093994140625, 0.00045013427734375, 0.007465362548828125, 0.0144805908203125, 0.021495819091796875, 0.02851104736328125, 0.035526275634765625, 0.04254150390625, 0.049556732177734375, 0.05657196044921875, 0.06358718872070312, 0.0706024169921875, 0.07761764526367188, 0.08463287353515625, 0.09164810180664062, 0.098663330078125, 0.10567855834960938, 0.11269378662109375, 0.11970901489257812, 0.1267242431640625, 0.13373947143554688, 0.14075469970703125, 0.14776992797851562, 0.15478515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 15.0, 37.0, 75.0, 106.0, 142.0, 178.0, 167.0, 114.0, 66.0, 43.0, 20.0, 8.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.119657516479492, -4.010087490081787, -3.900517702102661, -3.790947914123535, -3.681378126144409, -3.571808338165283, -3.462238311767578, -3.352668523788452, -3.243098735809326, -3.1335289478302, -3.023958921432495, -2.914389133453369, -2.804819345474243, -2.695249557495117, -2.585679531097412, -2.476109743118286, -2.366539716720581, -2.256969928741455, -2.14739990234375, -2.037830114364624, -1.928260326385498, -1.8186904191970825, -1.709120512008667, -1.599550724029541, -1.4899808168411255, -1.38041090965271, -1.270841121673584, -1.1612712144851685, -1.051701307296753, -0.942131519317627, -0.8325616121292114, -0.7229917645454407, -0.6134216785430908, -0.5038518309593201, -0.39428195357322693, -0.2847120761871338, -0.17514222860336304, -0.06557238101959229, 0.04399752616882324, 0.153567373752594, 0.26313722133636475, 0.3727070689201355, 0.48227694630622864, 0.5918468236923218, 0.7014166712760925, 0.8109865188598633, 0.9205564260482788, 1.0301263332366943, 1.1396961212158203, 1.2492660284042358, 1.3588358163833618, 1.4684057235717773, 1.5779755115509033, 1.6875454187393188, 1.7971153259277344, 1.9066851139068604, 2.0162549018859863, 2.1258246898651123, 2.2353947162628174, 2.3449645042419434, 2.4545342922210693, 2.5641040802001953, 2.6736741065979004, 2.7832438945770264, 2.8928139209747314]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 9.0, 9.0, 7.0, 5.0, 16.0, 15.0, 20.0, 22.0, 26.0, 32.0, 40.0, 33.0, 54.0, 43.0, 52.0, 69.0, 74.0, 61.0, 60.0, 46.0, 52.0, 43.0, 31.0, 33.0, 26.0, 21.0, 19.0, 19.0, 13.0, 13.0, 10.0, 3.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-3.3458478450775146, -3.259589195251465, -3.173330307006836, -3.087071657180786, -3.0008130073547363, -2.9145543575286865, -2.8282957077026367, -2.742036819458008, -2.655778169631958, -2.569519519805908, -2.4832606315612793, -2.3970019817352295, -2.3107433319091797, -2.22448468208313, -2.13822603225708, -2.051967144012451, -1.9657084941864014, -1.8794498443603516, -1.7931910753250122, -1.7069323062896729, -1.620673656463623, -1.5344150066375732, -1.4481562376022339, -1.3618974685668945, -1.2756388187408447, -1.189380168914795, -1.1031213998794556, -1.0168626308441162, -0.9306039810180664, -0.8443452715873718, -0.7580865621566772, -0.6718278527259827, -0.5855693817138672, -0.4993106722831726, -0.413051962852478, -0.32679325342178345, -0.24053454399108887, -0.1542758345603943, -0.06801712512969971, 0.018241584300994873, 0.10450029373168945, 0.19075900316238403, 0.2770177125930786, 0.3632764220237732, 0.4495351314544678, 0.5357938408851624, 0.6220525503158569, 0.7083112597465515, 0.7945699691772461, 0.8808286786079407, 0.9670873880386353, 1.0533461570739746, 1.1396048069000244, 1.2258634567260742, 1.3121222257614136, 1.398380994796753, 1.4846396446228027, 1.5708982944488525, 1.657157063484192, 1.7434158325195312, 1.829674482345581, 1.9159331321716309, 2.0021920204162598, 2.0884506702423096, 2.1747093200683594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 3.0, 8.0, 6.0, 15.0, 19.0, 35.0, 53.0, 59.0, 100.0, 130.0, 188.0, 325.0, 424.0, 655.0, 1057.0, 1864.0, 3379.0, 7028.0, 18008.0, 94084.0, 3977468.0, 61372.0, 14475.0, 6002.0, 2989.0, 1683.0, 1003.0, 597.0, 406.0, 258.0, 179.0, 119.0, 76.0, 51.0, 46.0, 27.0, 23.0, 15.0, 15.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2844200134277344, -0.27440643310546875, -0.2643928527832031, -0.2543792724609375, -0.24436569213867188, -0.23435211181640625, -0.22433853149414062, -0.214324951171875, -0.20431137084960938, -0.19429779052734375, -0.18428421020507812, -0.1742706298828125, -0.16425704956054688, -0.15424346923828125, -0.14422988891601562, -0.13421630859375, -0.12420272827148438, -0.11418914794921875, -0.10417556762695312, -0.0941619873046875, -0.08414840698242188, -0.07413482666015625, -0.06412124633789062, -0.054107666015625, -0.044094085693359375, -0.03408050537109375, -0.024066925048828125, -0.0140533447265625, -0.004039764404296875, 0.00597381591796875, 0.015987396240234375, 0.0260009765625, 0.036014556884765625, 0.04602813720703125, 0.056041717529296875, 0.0660552978515625, 0.07606887817382812, 0.08608245849609375, 0.09609603881835938, 0.106109619140625, 0.11612319946289062, 0.12613677978515625, 0.13615036010742188, 0.1461639404296875, 0.15617752075195312, 0.16619110107421875, 0.17620468139648438, 0.18621826171875, 0.19623184204101562, 0.20624542236328125, 0.21625900268554688, 0.2262725830078125, 0.23628616333007812, 0.24629974365234375, 0.2563133239746094, 0.266326904296875, 0.2763404846191406, 0.28635406494140625, 0.2963676452636719, 0.3063812255859375, 0.3163948059082031, 0.32640838623046875, 0.3364219665527344, 0.346435546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 28.0, 29.0, 34.0, 38.0, 46.0, 50.0, 60.0, 61.0, 65.0, 70.0, 58.0, 57.0, 62.0, 44.0, 38.0, 28.0, 35.0, 23.0, 20.0, 19.0, 15.0, 9.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1629638671875, -0.1585378646850586, -0.1541118621826172, -0.14968585968017578, -0.14525985717773438, -0.14083385467529297, -0.13640785217285156, -0.13198184967041016, -0.12755584716796875, -0.12312984466552734, -0.11870384216308594, -0.11427783966064453, -0.10985183715820312, -0.10542583465576172, -0.10099983215332031, -0.0965738296508789, -0.0921478271484375, -0.0877218246459961, -0.08329582214355469, -0.07886981964111328, -0.07444381713867188, -0.07001781463623047, -0.06559181213378906, -0.061165809631347656, -0.05673980712890625, -0.052313804626464844, -0.04788780212402344, -0.04346179962158203, -0.039035797119140625, -0.03460979461669922, -0.030183792114257812, -0.025757789611816406, -0.021331787109375, -0.016905784606933594, -0.012479782104492188, -0.008053779602050781, -0.003627777099609375, 0.0007982254028320312, 0.0052242279052734375, 0.009650230407714844, 0.01407623291015625, 0.018502235412597656, 0.022928237915039062, 0.02735424041748047, 0.031780242919921875, 0.03620624542236328, 0.04063224792480469, 0.045058250427246094, 0.0494842529296875, 0.053910255432128906, 0.05833625793457031, 0.06276226043701172, 0.06718826293945312, 0.07161426544189453, 0.07604026794433594, 0.08046627044677734, 0.08489227294921875, 0.08931827545166016, 0.09374427795410156, 0.09817028045654297, 0.10259628295898438, 0.10702228546142578, 0.11144828796386719, 0.1158742904663086, 0.12030029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 9.0, 10.0, 10.0, 21.0, 20.0, 32.0, 51.0, 78.0, 128.0, 229.0, 444.0, 970.0, 2551.0, 9695.0, 81384.0, 4053118.0, 35802.0, 6255.0, 1817.0, 736.0, 367.0, 198.0, 109.0, 80.0, 32.0, 25.0, 25.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8662109375, -0.840240478515625, -0.81427001953125, -0.788299560546875, -0.7623291015625, -0.736358642578125, -0.71038818359375, -0.684417724609375, -0.658447265625, -0.632476806640625, -0.60650634765625, -0.580535888671875, -0.5545654296875, -0.528594970703125, -0.50262451171875, -0.476654052734375, -0.45068359375, -0.424713134765625, -0.39874267578125, -0.372772216796875, -0.3468017578125, -0.320831298828125, -0.29486083984375, -0.268890380859375, -0.242919921875, -0.216949462890625, -0.19097900390625, -0.165008544921875, -0.1390380859375, -0.113067626953125, -0.08709716796875, -0.061126708984375, -0.03515625, -0.009185791015625, 0.01678466796875, 0.042755126953125, 0.0687255859375, 0.094696044921875, 0.12066650390625, 0.146636962890625, 0.172607421875, 0.198577880859375, 0.22454833984375, 0.250518798828125, 0.2764892578125, 0.302459716796875, 0.32843017578125, 0.354400634765625, 0.38037109375, 0.406341552734375, 0.43231201171875, 0.458282470703125, 0.4842529296875, 0.510223388671875, 0.53619384765625, 0.562164306640625, 0.588134765625, 0.614105224609375, 0.64007568359375, 0.666046142578125, 0.6920166015625, 0.717987060546875, 0.74395751953125, 0.769927978515625, 0.7958984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 15.0, 24.0, 39.0, 73.0, 235.0, 3345.0, 188.0, 61.0, 22.0, 17.0, 10.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18571853637695312, -0.17661285400390625, -0.16750717163085938, -0.1584014892578125, -0.14929580688476562, -0.14019012451171875, -0.13108444213867188, -0.121978759765625, -0.11287307739257812, -0.10376739501953125, -0.09466171264648438, -0.0855560302734375, -0.07645034790039062, -0.06734466552734375, -0.058238983154296875, -0.04913330078125, -0.040027618408203125, -0.03092193603515625, -0.021816253662109375, -0.0127105712890625, -0.003604888916015625, 0.00550079345703125, 0.014606475830078125, 0.023712158203125, 0.032817840576171875, 0.04192352294921875, 0.051029205322265625, 0.0601348876953125, 0.06924057006835938, 0.07834625244140625, 0.08745193481445312, 0.0965576171875, 0.10566329956054688, 0.11476898193359375, 0.12387466430664062, 0.1329803466796875, 0.14208602905273438, 0.15119171142578125, 0.16029739379882812, 0.169403076171875, 0.17850875854492188, 0.18761444091796875, 0.19672012329101562, 0.2058258056640625, 0.21493148803710938, 0.22403717041015625, 0.23314285278320312, 0.24224853515625, 0.2513542175292969, 0.26045989990234375, 0.2695655822753906, 0.2786712646484375, 0.2877769470214844, 0.29688262939453125, 0.3059883117675781, 0.315093994140625, 0.3241996765136719, 0.33330535888671875, 0.3424110412597656, 0.3515167236328125, 0.3606224060058594, 0.36972808837890625, 0.3788337707519531, 0.387939453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 4.0, 9.0, 15.0, 16.0, 19.0, 27.0, 39.0, 38.0, 48.0, 59.0, 65.0, 79.0, 82.0, 70.0, 68.0, 62.0, 59.0, 43.0, 27.0, 36.0, 33.0, 19.0, 9.0, 5.0, 9.0, 12.0, 3.0, 8.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.7346688508987427, -0.7159498929977417, -0.6972309947013855, -0.6785120368003845, -0.6597931385040283, -0.6410741806030273, -0.6223552823066711, -0.6036363244056702, -0.584917426109314, -0.566198468208313, -0.5474795699119568, -0.5287606120109558, -0.5100417137145996, -0.49132275581359863, -0.47260382771492004, -0.45388489961624146, -0.4351659417152405, -0.4164470136165619, -0.3977280855178833, -0.3790091574192047, -0.3602902293205261, -0.34157127141952515, -0.32285234332084656, -0.30413341522216797, -0.2854144871234894, -0.2666955590248108, -0.2479766309261322, -0.22925768792629242, -0.21053875982761383, -0.19181983172893524, -0.17310088872909546, -0.15438196063041687, -0.13566303253173828, -0.11694410443305969, -0.0982251688838005, -0.07950623333454132, -0.06078730523586273, -0.04206837713718414, -0.023349441587924957, -0.0046305060386657715, 0.014088422060012817, 0.032807353883981705, 0.05152628570795059, 0.07024522125720978, 0.08896414935588837, 0.10768307745456696, 0.12640202045440674, 0.14512094855308533, 0.16383987665176392, 0.1825588047504425, 0.2012777328491211, 0.21999667584896088, 0.23871560394763947, 0.25743454694747925, 0.27615347504615784, 0.2948724031448364, 0.313591331243515, 0.3323102593421936, 0.3510291874408722, 0.3697481155395508, 0.38846707344055176, 0.40718597173690796, 0.42590492963790894, 0.4446238577365875, 0.4633427858352661]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 8.0, 14.0, 14.0, 15.0, 18.0, 23.0, 19.0, 21.0, 23.0, 21.0, 25.0, 43.0, 36.0, 30.0, 42.0, 41.0, 56.0, 32.0, 39.0, 51.0, 42.0, 37.0, 37.0, 35.0, 29.0, 39.0, 14.0, 30.0, 27.0, 17.0, 13.0, 10.0, 16.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.5365151166915894, -0.5212335586547852, -0.505952000617981, -0.49067047238349915, -0.47538894414901733, -0.46010738611221313, -0.44482582807540894, -0.4295442998409271, -0.4142627716064453, -0.3989812135696411, -0.3836996853351593, -0.3684181272983551, -0.3531365990638733, -0.3378550410270691, -0.3225734829902649, -0.3072919547557831, -0.2920103967189789, -0.2767288386821747, -0.26144731044769287, -0.24616575241088867, -0.23088422417640686, -0.21560266613960266, -0.20032112300395966, -0.18503957986831665, -0.16975803673267365, -0.15447649359703064, -0.13919495046138763, -0.12391339987516403, -0.10863185673952103, -0.09335031360387802, -0.07806876301765442, -0.06278721988201141, -0.04750567674636841, -0.0322241336107254, -0.0169425867497921, -0.0016610398888587952, 0.01362050324678421, 0.028902046382427216, 0.04418359696865082, 0.05946514010429382, 0.07474668323993683, 0.09002822637557983, 0.10530976951122284, 0.12059132009744644, 0.13587287068367004, 0.15115439891815186, 0.16643595695495605, 0.18171750009059906, 0.19699904322624207, 0.21228058636188507, 0.22756212949752808, 0.24284368753433228, 0.2581252157688141, 0.2734067738056183, 0.2886883020401001, 0.3039698600769043, 0.3192514181137085, 0.3345329761505127, 0.3498145043849945, 0.3650960624217987, 0.3803775906562805, 0.3956591486930847, 0.4109407067298889, 0.4262222349643707, 0.44150376319885254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 27.0, 25.0, 47.0, 72.0, 136.0, 201.0, 322.0, 528.0, 950.0, 1597.0, 2941.0, 5454.0, 10732.0, 21836.0, 47791.0, 114419.0, 296047.0, 321363.0, 124025.0, 51936.0, 23394.0, 11521.0, 5825.0, 3258.0, 1681.0, 985.0, 562.0, 322.0, 227.0, 115.0, 63.0, 39.0, 41.0, 22.0, 7.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.231964111328125, -0.22369384765625, -0.215423583984375, -0.2071533203125, -0.198883056640625, -0.19061279296875, -0.182342529296875, -0.174072265625, -0.165802001953125, -0.15753173828125, -0.149261474609375, -0.1409912109375, -0.132720947265625, -0.12445068359375, -0.116180419921875, -0.10791015625, -0.099639892578125, -0.09136962890625, -0.083099365234375, -0.0748291015625, -0.066558837890625, -0.05828857421875, -0.050018310546875, -0.041748046875, -0.033477783203125, -0.02520751953125, -0.016937255859375, -0.0086669921875, -0.000396728515625, 0.00787353515625, 0.016143798828125, 0.0244140625, 0.032684326171875, 0.04095458984375, 0.049224853515625, 0.0574951171875, 0.065765380859375, 0.07403564453125, 0.082305908203125, 0.090576171875, 0.098846435546875, 0.10711669921875, 0.115386962890625, 0.1236572265625, 0.131927490234375, 0.14019775390625, 0.148468017578125, 0.15673828125, 0.165008544921875, 0.17327880859375, 0.181549072265625, 0.1898193359375, 0.198089599609375, 0.20635986328125, 0.214630126953125, 0.222900390625, 0.231170654296875, 0.23944091796875, 0.247711181640625, 0.2559814453125, 0.264251708984375, 0.27252197265625, 0.280792236328125, 0.2890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 4.0, 12.0, 9.0, 12.0, 24.0, 13.0, 21.0, 29.0, 37.0, 36.0, 38.0, 44.0, 59.0, 57.0, 58.0, 55.0, 54.0, 60.0, 43.0, 45.0, 41.0, 38.0, 43.0, 27.0, 27.0, 26.0, 13.0, 16.0, 12.0, 6.0, 8.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.149688720703125, -0.14532470703125, -0.140960693359375, -0.1365966796875, -0.132232666015625, -0.12786865234375, -0.123504638671875, -0.119140625, -0.114776611328125, -0.11041259765625, -0.106048583984375, -0.1016845703125, -0.097320556640625, -0.09295654296875, -0.088592529296875, -0.084228515625, -0.079864501953125, -0.07550048828125, -0.071136474609375, -0.0667724609375, -0.062408447265625, -0.05804443359375, -0.053680419921875, -0.04931640625, -0.044952392578125, -0.04058837890625, -0.036224365234375, -0.0318603515625, -0.027496337890625, -0.02313232421875, -0.018768310546875, -0.014404296875, -0.010040283203125, -0.00567626953125, -0.001312255859375, 0.0030517578125, 0.007415771484375, 0.01177978515625, 0.016143798828125, 0.0205078125, 0.024871826171875, 0.02923583984375, 0.033599853515625, 0.0379638671875, 0.042327880859375, 0.04669189453125, 0.051055908203125, 0.055419921875, 0.059783935546875, 0.06414794921875, 0.068511962890625, 0.0728759765625, 0.077239990234375, 0.08160400390625, 0.085968017578125, 0.09033203125, 0.094696044921875, 0.09906005859375, 0.103424072265625, 0.1077880859375, 0.112152099609375, 0.11651611328125, 0.120880126953125, 0.125244140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 14.0, 10.0, 17.0, 21.0, 24.0, 30.0, 41.0, 57.0, 78.0, 134.0, 186.0, 302.0, 445.0, 756.0, 1371.0, 2877.0, 7832.0, 29229.0, 185809.0, 679882.0, 108158.0, 19914.0, 5833.0, 2406.0, 1228.0, 654.0, 430.0, 245.0, 153.0, 120.0, 70.0, 54.0, 54.0, 28.0, 27.0, 13.0, 11.0, 12.0, 2.0, 7.0, 0.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.494964599609375, -0.47967529296875, -0.464385986328125, -0.4490966796875, -0.433807373046875, -0.41851806640625, -0.403228759765625, -0.387939453125, -0.372650146484375, -0.35736083984375, -0.342071533203125, -0.3267822265625, -0.311492919921875, -0.29620361328125, -0.280914306640625, -0.265625, -0.250335693359375, -0.23504638671875, -0.219757080078125, -0.2044677734375, -0.189178466796875, -0.17388916015625, -0.158599853515625, -0.143310546875, -0.128021240234375, -0.11273193359375, -0.097442626953125, -0.0821533203125, -0.066864013671875, -0.05157470703125, -0.036285400390625, -0.02099609375, -0.005706787109375, 0.00958251953125, 0.024871826171875, 0.0401611328125, 0.055450439453125, 0.07073974609375, 0.086029052734375, 0.101318359375, 0.116607666015625, 0.13189697265625, 0.147186279296875, 0.1624755859375, 0.177764892578125, 0.19305419921875, 0.208343505859375, 0.2236328125, 0.238922119140625, 0.25421142578125, 0.269500732421875, 0.2847900390625, 0.300079345703125, 0.31536865234375, 0.330657958984375, 0.345947265625, 0.361236572265625, 0.37652587890625, 0.391815185546875, 0.4071044921875, 0.422393798828125, 0.43768310546875, 0.452972412109375, 0.46826171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 18.0, 17.0, 32.0, 24.0, 36.0, 45.0, 45.0, 40.0, 65.0, 51.0, 43.0, 51.0, 51.0, 50.0, 41.0, 48.0, 38.0, 35.0, 37.0, 26.0, 22.0, 18.0, 20.0, 9.0, 13.0, 8.0, 10.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.591796875, -0.5741729736328125, -0.556549072265625, -0.5389251708984375, -0.52130126953125, -0.5036773681640625, -0.486053466796875, -0.4684295654296875, -0.4508056640625, -0.4331817626953125, -0.415557861328125, -0.3979339599609375, -0.38031005859375, -0.3626861572265625, -0.345062255859375, -0.3274383544921875, -0.309814453125, -0.2921905517578125, -0.274566650390625, -0.2569427490234375, -0.23931884765625, -0.2216949462890625, -0.204071044921875, -0.1864471435546875, -0.1688232421875, -0.1511993408203125, -0.133575439453125, -0.1159515380859375, -0.09832763671875, -0.0807037353515625, -0.063079833984375, -0.0454559326171875, -0.02783203125, -0.0102081298828125, 0.007415771484375, 0.0250396728515625, 0.04266357421875, 0.0602874755859375, 0.077911376953125, 0.0955352783203125, 0.1131591796875, 0.1307830810546875, 0.148406982421875, 0.1660308837890625, 0.18365478515625, 0.2012786865234375, 0.218902587890625, 0.2365264892578125, 0.254150390625, 0.2717742919921875, 0.289398193359375, 0.3070220947265625, 0.32464599609375, 0.3422698974609375, 0.359893798828125, 0.3775177001953125, 0.3951416015625, 0.4127655029296875, 0.430389404296875, 0.4480133056640625, 0.46563720703125, 0.4832611083984375, 0.500885009765625, 0.5185089111328125, 0.5361328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 6.0, 11.0, 7.0, 20.0, 32.0, 43.0, 54.0, 79.0, 141.0, 238.0, 419.0, 834.0, 1719.0, 4111.0, 11908.0, 44429.0, 252635.0, 587011.0, 108910.0, 23366.0, 7146.0, 2745.0, 1243.0, 557.0, 326.0, 200.0, 122.0, 62.0, 44.0, 27.0, 27.0, 16.0, 8.0, 13.0, 6.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16725921630859375, -0.1619110107421875, -0.15656280517578125, -0.151214599609375, -0.14586639404296875, -0.1405181884765625, -0.13516998291015625, -0.12982177734375, -0.12447357177734375, -0.1191253662109375, -0.11377716064453125, -0.108428955078125, -0.10308074951171875, -0.0977325439453125, -0.09238433837890625, -0.0870361328125, -0.08168792724609375, -0.0763397216796875, -0.07099151611328125, -0.065643310546875, -0.06029510498046875, -0.0549468994140625, -0.04959869384765625, -0.04425048828125, -0.03890228271484375, -0.0335540771484375, -0.02820587158203125, -0.022857666015625, -0.01750946044921875, -0.0121612548828125, -0.00681304931640625, -0.00146484375, 0.00388336181640625, 0.0092315673828125, 0.01457977294921875, 0.019927978515625, 0.02527618408203125, 0.0306243896484375, 0.03597259521484375, 0.04132080078125, 0.04666900634765625, 0.0520172119140625, 0.05736541748046875, 0.062713623046875, 0.06806182861328125, 0.0734100341796875, 0.07875823974609375, 0.0841064453125, 0.08945465087890625, 0.0948028564453125, 0.10015106201171875, 0.105499267578125, 0.11084747314453125, 0.1161956787109375, 0.12154388427734375, 0.12689208984375, 0.13224029541015625, 0.1375885009765625, 0.14293670654296875, 0.148284912109375, 0.15363311767578125, 0.1589813232421875, 0.16432952880859375, 0.169677734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 10.0, 6.0, 9.0, 16.0, 26.0, 25.0, 21.0, 37.0, 38.0, 47.0, 58.0, 82.0, 111.0, 104.0, 82.0, 70.0, 51.0, 34.0, 34.0, 30.0, 29.0, 14.0, 5.0, 7.0, 10.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.805492401123047e-05, -5.653873085975647e-05, -5.502253770828247e-05, -5.350634455680847e-05, -5.199015140533447e-05, -5.0473958253860474e-05, -4.8957765102386475e-05, -4.7441571950912476e-05, -4.5925378799438477e-05, -4.440918564796448e-05, -4.289299249649048e-05, -4.137679934501648e-05, -3.986060619354248e-05, -3.834441304206848e-05, -3.682821989059448e-05, -3.5312026739120483e-05, -3.3795833587646484e-05, -3.2279640436172485e-05, -3.0763447284698486e-05, -2.9247254133224487e-05, -2.7731060981750488e-05, -2.621486783027649e-05, -2.469867467880249e-05, -2.318248152732849e-05, -2.1666288375854492e-05, -2.0150095224380493e-05, -1.8633902072906494e-05, -1.7117708921432495e-05, -1.5601515769958496e-05, -1.4085322618484497e-05, -1.2569129467010498e-05, -1.1052936315536499e-05, -9.5367431640625e-06, -8.020550012588501e-06, -6.504356861114502e-06, -4.988163709640503e-06, -3.471970558166504e-06, -1.955777406692505e-06, -4.3958425521850586e-07, 1.0766088962554932e-06, 2.592802047729492e-06, 4.108995199203491e-06, 5.62518835067749e-06, 7.141381502151489e-06, 8.657574653625488e-06, 1.0173767805099487e-05, 1.1689960956573486e-05, 1.3206154108047485e-05, 1.4722347259521484e-05, 1.6238540410995483e-05, 1.7754733562469482e-05, 1.927092671394348e-05, 2.078711986541748e-05, 2.230331301689148e-05, 2.381950616836548e-05, 2.5335699319839478e-05, 2.6851892471313477e-05, 2.8368085622787476e-05, 2.9884278774261475e-05, 3.1400471925735474e-05, 3.291666507720947e-05, 3.443285822868347e-05, 3.594905138015747e-05, 3.746524453163147e-05, 3.898143768310547e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 8.0, 7.0, 18.0, 24.0, 26.0, 40.0, 46.0, 83.0, 104.0, 202.0, 290.0, 493.0, 786.0, 1526.0, 3183.0, 7713.0, 24348.0, 112016.0, 566195.0, 261816.0, 47189.0, 12823.0, 4747.0, 2206.0, 1027.0, 587.0, 372.0, 189.0, 137.0, 94.0, 66.0, 51.0, 37.0, 24.0, 22.0, 17.0, 12.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1770038604736328, -0.17175674438476562, -0.16650962829589844, -0.16126251220703125, -0.15601539611816406, -0.15076828002929688, -0.1455211639404297, -0.1402740478515625, -0.1350269317626953, -0.12977981567382812, -0.12453269958496094, -0.11928558349609375, -0.11403846740722656, -0.10879135131835938, -0.10354423522949219, -0.098297119140625, -0.09305000305175781, -0.08780288696289062, -0.08255577087402344, -0.07730865478515625, -0.07206153869628906, -0.06681442260742188, -0.06156730651855469, -0.0563201904296875, -0.05107307434082031, -0.045825958251953125, -0.04057884216308594, -0.03533172607421875, -0.030084609985351562, -0.024837493896484375, -0.019590377807617188, -0.01434326171875, -0.009096145629882812, -0.003849029541015625, 0.0013980865478515625, 0.00664520263671875, 0.011892318725585938, 0.017139434814453125, 0.022386550903320312, 0.0276336669921875, 0.03288078308105469, 0.038127899169921875, 0.04337501525878906, 0.04862213134765625, 0.05386924743652344, 0.059116363525390625, 0.06436347961425781, 0.069610595703125, 0.07485771179199219, 0.08010482788085938, 0.08535194396972656, 0.09059906005859375, 0.09584617614746094, 0.10109329223632812, 0.10634040832519531, 0.1115875244140625, 0.11683464050292969, 0.12208175659179688, 0.12732887268066406, 0.13257598876953125, 0.13782310485839844, 0.14307022094726562, 0.1483173370361328, 0.153564453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 17.0, 40.0, 35.0, 54.0, 52.0, 70.0, 73.0, 68.0, 76.0, 78.0, 80.0, 51.0, 50.0, 39.0, 30.0, 20.0, 16.0, 18.0, 13.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.14231300354003906, -0.13740921020507812, -0.1325054168701172, -0.12760162353515625, -0.12269783020019531, -0.11779403686523438, -0.11289024353027344, -0.1079864501953125, -0.10308265686035156, -0.09817886352539062, -0.09327507019042969, -0.08837127685546875, -0.08346748352050781, -0.07856369018554688, -0.07365989685058594, -0.068756103515625, -0.06385231018066406, -0.058948516845703125, -0.05404472351074219, -0.04914093017578125, -0.04423713684082031, -0.039333343505859375, -0.03442955017089844, -0.0295257568359375, -0.024621963500976562, -0.019718170166015625, -0.014814376831054688, -0.00991058349609375, -0.0050067901611328125, -0.000102996826171875, 0.0048007965087890625, 0.00970458984375, 0.014608383178710938, 0.019512176513671875, 0.024415969848632812, 0.02931976318359375, 0.03422355651855469, 0.039127349853515625, 0.04403114318847656, 0.0489349365234375, 0.05383872985839844, 0.058742523193359375, 0.06364631652832031, 0.06855010986328125, 0.07345390319824219, 0.07835769653320312, 0.08326148986816406, 0.088165283203125, 0.09306907653808594, 0.09797286987304688, 0.10287666320800781, 0.10778045654296875, 0.11268424987792969, 0.11758804321289062, 0.12249183654785156, 0.1273956298828125, 0.13229942321777344, 0.13720321655273438, 0.1421070098876953, 0.14701080322265625, 0.1519145965576172, 0.15681838989257812, 0.16172218322753906, 0.1666259765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 9.0, 8.0, 26.0, 66.0, 94.0, 134.0, 169.0, 170.0, 119.0, 90.0, 51.0, 23.0, 16.0, 12.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.531129837036133, -4.384349346160889, -4.2375688552856445, -4.0907883644104, -3.9440078735351562, -3.797227382659912, -3.650447130203247, -3.503666639328003, -3.356886148452759, -3.2101056575775146, -3.0633251667022705, -2.9165446758270264, -2.7697644233703613, -2.622983932495117, -2.476203441619873, -2.329422950744629, -2.1826424598693848, -2.0358619689941406, -1.8890814781188965, -1.742301106452942, -1.5955206155776978, -1.4487401247024536, -1.301959753036499, -1.1551792621612549, -1.0083987712860107, -0.8616182804107666, -0.7148378491401672, -0.5680574178695679, -0.42127692699432373, -0.2744964361190796, -0.12771600484848022, 0.01906442642211914, 0.16584539413452148, 0.31262585520744324, 0.459406316280365, 0.6061867475509644, 0.7529672384262085, 0.8997477293014526, 1.0465281009674072, 1.1933085918426514, 1.3400890827178955, 1.4868695735931396, 1.6336500644683838, 1.7804304361343384, 1.9272109270095825, 2.073991298675537, 2.2207717895507812, 2.3675522804260254, 2.5143327713012695, 2.6611132621765137, 2.807893753051758, 2.954674243927002, 3.101454734802246, 3.2482352256774902, 3.3950154781341553, 3.5417959690093994, 3.6885764598846436, 3.8353569507598877, 3.982137441635132, 4.128917694091797, 4.275698184967041, 4.422478675842285, 4.569259166717529, 4.716039657592773, 4.862820148468018]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 10.0, 6.0, 6.0, 13.0, 8.0, 6.0, 16.0, 17.0, 27.0, 20.0, 17.0, 21.0, 33.0, 31.0, 40.0, 37.0, 41.0, 48.0, 33.0, 38.0, 37.0, 40.0, 43.0, 49.0, 39.0, 27.0, 40.0, 29.0, 20.0, 35.0, 17.0, 37.0, 20.0, 20.0, 12.0, 10.0, 12.0, 4.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8938207626342773, -1.8231133222579956, -1.7524058818817139, -1.6816984415054321, -1.6109910011291504, -1.540283441543579, -1.4695760011672974, -1.3988685607910156, -1.3281611204147339, -1.2574536800384521, -1.1867462396621704, -1.1160387992858887, -1.0453312397003174, -0.9746238589286804, -0.9039163589477539, -0.8332089185714722, -0.7625014781951904, -0.6917940378189087, -0.621086597442627, -0.5503790974617004, -0.4796716570854187, -0.40896421670913696, -0.33825674653053284, -0.2675492763519287, -0.19684183597564697, -0.12613438069820404, -0.05542692542076111, 0.015280529856681824, 0.08598798513412476, 0.1566954255104065, 0.22740289568901062, 0.29811036586761475, 0.3688175678253174, 0.4395250082015991, 0.5102324485778809, 0.5809399485588074, 0.6516473889350891, 0.7223548293113708, 0.7930623292922974, 0.8637697696685791, 0.9344772100448608, 1.0051846504211426, 1.0758920907974243, 1.146599531173706, 1.2173070907592773, 1.2880144119262695, 1.3587219715118408, 1.4294294118881226, 1.5001368522644043, 1.570844292640686, 1.6415517330169678, 1.7122591733932495, 1.7829666137695312, 1.8536741733551025, 1.9243816137313843, 1.995089054107666, 2.065796375274658, 2.1365039348602295, 2.2072112560272217, 2.277918815612793, 2.348626136779785, 2.4193336963653564, 2.4900410175323486, 2.56074857711792, 2.631456136703491]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 9.0, 13.0, 16.0, 27.0, 58.0, 60.0, 111.0, 177.0, 268.0, 454.0, 746.0, 1246.0, 2270.0, 4047.0, 8332.0, 18925.0, 54286.0, 308442.0, 3278883.0, 413486.0, 62373.0, 20707.0, 9113.0, 4375.0, 2339.0, 1378.0, 802.0, 495.0, 313.0, 205.0, 132.0, 65.0, 60.0, 25.0, 15.0, 13.0, 5.0, 9.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.27710723876953125, -0.2683258056640625, -0.25954437255859375, -0.250762939453125, -0.24198150634765625, -0.2332000732421875, -0.22441864013671875, -0.21563720703125, -0.20685577392578125, -0.1980743408203125, -0.18929290771484375, -0.180511474609375, -0.17173004150390625, -0.1629486083984375, -0.15416717529296875, -0.1453857421875, -0.13660430908203125, -0.1278228759765625, -0.11904144287109375, -0.110260009765625, -0.10147857666015625, -0.0926971435546875, -0.08391571044921875, -0.07513427734375, -0.06635284423828125, -0.0575714111328125, -0.04878997802734375, -0.040008544921875, -0.03122711181640625, -0.0224456787109375, -0.01366424560546875, -0.0048828125, 0.00389862060546875, 0.0126800537109375, 0.02146148681640625, 0.030242919921875, 0.03902435302734375, 0.0478057861328125, 0.05658721923828125, 0.06536865234375, 0.07415008544921875, 0.0829315185546875, 0.09171295166015625, 0.100494384765625, 0.10927581787109375, 0.1180572509765625, 0.12683868408203125, 0.1356201171875, 0.14440155029296875, 0.1531829833984375, 0.16196441650390625, 0.170745849609375, 0.17952728271484375, 0.1883087158203125, 0.19709014892578125, 0.20587158203125, 0.21465301513671875, 0.2234344482421875, 0.23221588134765625, 0.240997314453125, 0.24977874755859375, 0.2585601806640625, 0.26734161376953125, 0.276123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 15.0, 11.0, 22.0, 20.0, 37.0, 27.0, 40.0, 50.0, 68.0, 54.0, 58.0, 56.0, 67.0, 67.0, 66.0, 54.0, 63.0, 33.0, 35.0, 38.0, 23.0, 17.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1602783203125, -0.1556987762451172, -0.15111923217773438, -0.14653968811035156, -0.14196014404296875, -0.13738059997558594, -0.13280105590820312, -0.1282215118408203, -0.1236419677734375, -0.11906242370605469, -0.11448287963867188, -0.10990333557128906, -0.10532379150390625, -0.10074424743652344, -0.09616470336914062, -0.09158515930175781, -0.087005615234375, -0.08242607116699219, -0.07784652709960938, -0.07326698303222656, -0.06868743896484375, -0.06410789489746094, -0.059528350830078125, -0.05494880676269531, -0.0503692626953125, -0.04578971862792969, -0.041210174560546875, -0.03663063049316406, -0.03205108642578125, -0.027471542358398438, -0.022891998291015625, -0.018312454223632812, -0.01373291015625, -0.009153366088867188, -0.004573822021484375, 5.7220458984375e-06, 0.00458526611328125, 0.009164810180664062, 0.013744354248046875, 0.018323898315429688, 0.0229034423828125, 0.027482986450195312, 0.032062530517578125, 0.03664207458496094, 0.04122161865234375, 0.04580116271972656, 0.050380706787109375, 0.05496025085449219, 0.059539794921875, 0.06411933898925781, 0.06869888305664062, 0.07327842712402344, 0.07785797119140625, 0.08243751525878906, 0.08701705932617188, 0.09159660339355469, 0.0961761474609375, 0.10075569152832031, 0.10533523559570312, 0.10991477966308594, 0.11449432373046875, 0.11907386779785156, 0.12365341186523438, 0.1282329559326172, 0.1328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 10.0, 24.0, 39.0, 46.0, 82.0, 127.0, 192.0, 320.0, 609.0, 1083.0, 2192.0, 5052.0, 12743.0, 39775.0, 213291.0, 3403205.0, 429413.0, 57347.0, 16661.0, 6311.0, 2729.0, 1345.0, 683.0, 390.0, 210.0, 119.0, 65.0, 63.0, 39.0, 23.0, 14.0, 12.0, 7.0, 13.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3444671630859375, -0.332000732421875, -0.3195343017578125, -0.30706787109375, -0.2946014404296875, -0.282135009765625, -0.2696685791015625, -0.2572021484375, -0.2447357177734375, -0.232269287109375, -0.2198028564453125, -0.20733642578125, -0.1948699951171875, -0.182403564453125, -0.1699371337890625, -0.157470703125, -0.1450042724609375, -0.132537841796875, -0.1200714111328125, -0.10760498046875, -0.0951385498046875, -0.082672119140625, -0.0702056884765625, -0.0577392578125, -0.0452728271484375, -0.032806396484375, -0.0203399658203125, -0.00787353515625, 0.0045928955078125, 0.017059326171875, 0.0295257568359375, 0.0419921875, 0.0544586181640625, 0.066925048828125, 0.0793914794921875, 0.09185791015625, 0.1043243408203125, 0.116790771484375, 0.1292572021484375, 0.1417236328125, 0.1541900634765625, 0.166656494140625, 0.1791229248046875, 0.19158935546875, 0.2040557861328125, 0.216522216796875, 0.2289886474609375, 0.241455078125, 0.2539215087890625, 0.266387939453125, 0.2788543701171875, 0.29132080078125, 0.3037872314453125, 0.316253662109375, 0.3287200927734375, 0.3411865234375, 0.3536529541015625, 0.366119384765625, 0.3785858154296875, 0.39105224609375, 0.4035186767578125, 0.415985107421875, 0.4284515380859375, 0.44091796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 3.0, 8.0, 6.0, 9.0, 10.0, 16.0, 14.0, 21.0, 36.0, 35.0, 55.0, 90.0, 140.0, 269.0, 540.0, 1058.0, 754.0, 384.0, 190.0, 125.0, 75.0, 60.0, 38.0, 28.0, 23.0, 17.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3099479675292969, -0.29836273193359375, -0.2867774963378906, -0.2751922607421875, -0.2636070251464844, -0.25202178955078125, -0.24043655395507812, -0.228851318359375, -0.21726608276367188, -0.20568084716796875, -0.19409561157226562, -0.1825103759765625, -0.17092514038085938, -0.15933990478515625, -0.14775466918945312, -0.13616943359375, -0.12458419799804688, -0.11299896240234375, -0.10141372680664062, -0.0898284912109375, -0.07824325561523438, -0.06665802001953125, -0.055072784423828125, -0.043487548828125, -0.031902313232421875, -0.02031707763671875, -0.008731842041015625, 0.0028533935546875, 0.014438629150390625, 0.02602386474609375, 0.037609100341796875, 0.0491943359375, 0.060779571533203125, 0.07236480712890625, 0.08395004272460938, 0.0955352783203125, 0.10712051391601562, 0.11870574951171875, 0.13029098510742188, 0.141876220703125, 0.15346145629882812, 0.16504669189453125, 0.17663192749023438, 0.1882171630859375, 0.19980239868164062, 0.21138763427734375, 0.22297286987304688, 0.23455810546875, 0.24614334106445312, 0.25772857666015625, 0.2693138122558594, 0.2808990478515625, 0.2924842834472656, 0.30406951904296875, 0.3156547546386719, 0.327239990234375, 0.3388252258300781, 0.35041046142578125, 0.3619956970214844, 0.3735809326171875, 0.3851661682128906, 0.39675140380859375, 0.4083366394042969, 0.419921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 2.0, 11.0, 12.0, 36.0, 93.0, 167.0, 228.0, 204.0, 137.0, 54.0, 21.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.369821548461914, -6.2051591873168945, -6.040497303009033, -5.875834941864014, -5.711172580718994, -5.546510696411133, -5.381848335266113, -5.217185974121094, -5.052523612976074, -4.887861251831055, -4.723199367523193, -4.558537006378174, -4.393874645233154, -4.229212760925293, -4.064550399780273, -3.899888038635254, -3.7352261543273926, -3.570564031600952, -3.4059016704559326, -3.241239547729492, -3.0765771865844727, -2.9119150638580322, -2.747252941131592, -2.5825905799865723, -2.417928457260132, -2.2532663345336914, -2.088603973388672, -1.9239418506622314, -1.7592796087265015, -1.5946173667907715, -1.429955244064331, -1.265293002128601, -1.100630760192871, -0.9359685182571411, -0.7713063359260559, -0.6066441535949707, -0.4419819116592407, -0.27731966972351074, -0.11265748739242554, 0.05200469493865967, 0.21666693687438965, 0.38132914900779724, 0.5459913611412048, 0.71065354347229, 0.87531578540802, 1.03997802734375, 1.2046401500701904, 1.3693023920059204, 1.5339646339416504, 1.6986268758773804, 1.8632891178131104, 2.027951240539551, 2.1926136016845703, 2.3572757244110107, 2.521937847137451, 2.6866002082824707, 2.851262331008911, 3.0159244537353516, 3.180586814880371, 3.3452489376068115, 3.509911060333252, 3.6745734214782715, 3.839235544204712, 4.003897666931152, 4.168560028076172]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 9.0, 7.0, 12.0, 14.0, 16.0, 21.0, 31.0, 29.0, 31.0, 30.0, 59.0, 43.0, 55.0, 66.0, 65.0, 68.0, 53.0, 45.0, 60.0, 63.0, 37.0, 32.0, 32.0, 32.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9480023384094238, -1.8851134777069092, -1.822224497795105, -1.7593356370925903, -1.6964466571807861, -1.6335577964782715, -1.5706689357757568, -1.5077800750732422, -1.444891095161438, -1.3820022344589233, -1.3191132545471191, -1.2562243938446045, -1.1933355331420898, -1.1304465532302856, -1.067557692527771, -1.0046687126159668, -0.9417798519134521, -0.8788909316062927, -0.8160020112991333, -0.7531131505966187, -0.6902242302894592, -0.6273353099822998, -0.5644464492797852, -0.5015575289726257, -0.4386686086654663, -0.3757796883583069, -0.31289079785346985, -0.2500019073486328, -0.1871129870414734, -0.12422406673431396, -0.06133517622947693, 0.0015537142753601074, 0.06444239616394043, 0.12733130156993866, 0.1902202069759369, 0.2531090974807739, 0.31599801778793335, 0.3788869380950928, 0.4417758285999298, 0.5046647191047668, 0.5675536394119263, 0.6304425597190857, 0.6933314800262451, 0.7562203407287598, 0.8191092610359192, 0.8819981813430786, 0.9448870420455933, 1.0077760219573975, 1.070664882659912, 1.1335537433624268, 1.196442723274231, 1.2593315839767456, 1.3222205638885498, 1.3851094245910645, 1.447998285293579, 1.5108871459960938, 1.573776125907898, 1.6366649866104126, 1.6995539665222168, 1.7624428272247314, 1.825331687927246, 1.8882206678390503, 1.951109528541565, 2.013998508453369, 2.076887369155884]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 13.0, 15.0, 20.0, 28.0, 34.0, 67.0, 89.0, 120.0, 174.0, 222.0, 377.0, 589.0, 883.0, 1521.0, 2230.0, 4061.0, 7310.0, 13714.0, 27852.0, 61135.0, 158589.0, 369731.0, 235416.0, 87143.0, 37386.0, 17786.0, 9177.0, 5140.0, 2820.0, 1737.0, 1030.0, 712.0, 432.0, 284.0, 214.0, 125.0, 101.0, 82.0, 54.0, 32.0, 34.0, 20.0, 14.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22624588012695312, -0.21836090087890625, -0.21047592163085938, -0.2025909423828125, -0.19470596313476562, -0.18682098388671875, -0.17893600463867188, -0.171051025390625, -0.16316604614257812, -0.15528106689453125, -0.14739608764648438, -0.1395111083984375, -0.13162612915039062, -0.12374114990234375, -0.11585617065429688, -0.10797119140625, -0.10008621215820312, -0.09220123291015625, -0.08431625366210938, -0.0764312744140625, -0.06854629516601562, -0.06066131591796875, -0.052776336669921875, -0.044891357421875, -0.037006378173828125, -0.02912139892578125, -0.021236419677734375, -0.0133514404296875, -0.005466461181640625, 0.00241851806640625, 0.010303497314453125, 0.0181884765625, 0.026073455810546875, 0.03395843505859375, 0.041843414306640625, 0.0497283935546875, 0.057613372802734375, 0.06549835205078125, 0.07338333129882812, 0.081268310546875, 0.08915328979492188, 0.09703826904296875, 0.10492324829101562, 0.1128082275390625, 0.12069320678710938, 0.12857818603515625, 0.13646316528320312, 0.14434814453125, 0.15223312377929688, 0.16011810302734375, 0.16800308227539062, 0.1758880615234375, 0.18377304077148438, 0.19165802001953125, 0.19954299926757812, 0.207427978515625, 0.21531295776367188, 0.22319793701171875, 0.23108291625976562, 0.2389678955078125, 0.24685287475585938, 0.25473785400390625, 0.2626228332519531, 0.2705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 15.0, 10.0, 15.0, 20.0, 26.0, 34.0, 44.0, 40.0, 40.0, 35.0, 42.0, 40.0, 53.0, 48.0, 50.0, 60.0, 59.0, 42.0, 47.0, 36.0, 38.0, 44.0, 19.0, 23.0, 20.0, 11.0, 15.0, 8.0, 4.0, 5.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.118408203125, -0.11462688446044922, -0.11084556579589844, -0.10706424713134766, -0.10328292846679688, -0.0995016098022461, -0.09572029113769531, -0.09193897247314453, -0.08815765380859375, -0.08437633514404297, -0.08059501647949219, -0.0768136978149414, -0.07303237915039062, -0.06925106048583984, -0.06546974182128906, -0.06168842315673828, -0.0579071044921875, -0.05412578582763672, -0.05034446716308594, -0.046563148498535156, -0.042781829833984375, -0.039000511169433594, -0.03521919250488281, -0.03143787384033203, -0.02765655517578125, -0.02387523651123047, -0.020093917846679688, -0.016312599182128906, -0.012531280517578125, -0.008749961853027344, -0.0049686431884765625, -0.0011873245239257812, 0.002593994140625, 0.006375312805175781, 0.010156631469726562, 0.013937950134277344, 0.017719268798828125, 0.021500587463378906, 0.025281906127929688, 0.02906322479248047, 0.03284454345703125, 0.03662586212158203, 0.04040718078613281, 0.044188499450683594, 0.047969818115234375, 0.051751136779785156, 0.05553245544433594, 0.05931377410888672, 0.0630950927734375, 0.06687641143798828, 0.07065773010253906, 0.07443904876708984, 0.07822036743164062, 0.0820016860961914, 0.08578300476074219, 0.08956432342529297, 0.09334564208984375, 0.09712696075439453, 0.10090827941894531, 0.1046895980834961, 0.10847091674804688, 0.11225223541259766, 0.11603355407714844, 0.11981487274169922, 0.12359619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 7.0, 20.0, 26.0, 25.0, 40.0, 50.0, 68.0, 115.0, 176.0, 296.0, 440.0, 781.0, 1585.0, 3636.0, 9932.0, 41545.0, 408950.0, 517094.0, 45615.0, 10598.0, 3777.0, 1592.0, 867.0, 470.0, 262.0, 191.0, 110.0, 70.0, 61.0, 37.0, 23.0, 18.0, 12.0, 19.0, 6.0, 2.0, 4.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48876953125, -0.47193145751953125, -0.4550933837890625, -0.43825531005859375, -0.421417236328125, -0.40457916259765625, -0.3877410888671875, -0.37090301513671875, -0.35406494140625, -0.33722686767578125, -0.3203887939453125, -0.30355072021484375, -0.286712646484375, -0.26987457275390625, -0.2530364990234375, -0.23619842529296875, -0.2193603515625, -0.20252227783203125, -0.1856842041015625, -0.16884613037109375, -0.152008056640625, -0.13516998291015625, -0.1183319091796875, -0.10149383544921875, -0.08465576171875, -0.06781768798828125, -0.0509796142578125, -0.03414154052734375, -0.017303466796875, -0.00046539306640625, 0.0163726806640625, 0.03321075439453125, 0.050048828125, 0.06688690185546875, 0.0837249755859375, 0.10056304931640625, 0.117401123046875, 0.13423919677734375, 0.1510772705078125, 0.16791534423828125, 0.18475341796875, 0.20159149169921875, 0.2184295654296875, 0.23526763916015625, 0.252105712890625, 0.26894378662109375, 0.2857818603515625, 0.30261993408203125, 0.3194580078125, 0.33629608154296875, 0.3531341552734375, 0.36997222900390625, 0.386810302734375, 0.40364837646484375, 0.4204864501953125, 0.43732452392578125, 0.45416259765625, 0.47100067138671875, 0.4878387451171875, 0.5046768188476562, 0.521514892578125, 0.5383529663085938, 0.5551910400390625, 0.5720291137695312, 0.5888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 10.0, 3.0, 7.0, 9.0, 13.0, 11.0, 20.0, 26.0, 33.0, 38.0, 41.0, 39.0, 55.0, 50.0, 57.0, 63.0, 58.0, 59.0, 54.0, 59.0, 53.0, 37.0, 41.0, 33.0, 28.0, 30.0, 23.0, 14.0, 8.0, 11.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6480941772460938, -0.6282196044921875, -0.6083450317382812, -0.588470458984375, -0.5685958862304688, -0.5487213134765625, -0.5288467407226562, -0.50897216796875, -0.48909759521484375, -0.4692230224609375, -0.44934844970703125, -0.429473876953125, -0.40959930419921875, -0.3897247314453125, -0.36985015869140625, -0.3499755859375, -0.33010101318359375, -0.3102264404296875, -0.29035186767578125, -0.270477294921875, -0.25060272216796875, -0.2307281494140625, -0.21085357666015625, -0.19097900390625, -0.17110443115234375, -0.1512298583984375, -0.13135528564453125, -0.111480712890625, -0.09160614013671875, -0.0717315673828125, -0.05185699462890625, -0.031982421875, -0.01210784912109375, 0.0077667236328125, 0.02764129638671875, 0.047515869140625, 0.06739044189453125, 0.0872650146484375, 0.10713958740234375, 0.12701416015625, 0.14688873291015625, 0.1667633056640625, 0.18663787841796875, 0.206512451171875, 0.22638702392578125, 0.2462615966796875, 0.26613616943359375, 0.2860107421875, 0.30588531494140625, 0.3257598876953125, 0.34563446044921875, 0.365509033203125, 0.38538360595703125, 0.4052581787109375, 0.42513275146484375, 0.44500732421875, 0.46488189697265625, 0.4847564697265625, 0.5046310424804688, 0.524505615234375, 0.5443801879882812, 0.5642547607421875, 0.5841293334960938, 0.60400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 12.0, 14.0, 16.0, 18.0, 34.0, 45.0, 57.0, 116.0, 205.0, 316.0, 643.0, 1180.0, 2778.0, 7044.0, 22480.0, 113065.0, 716136.0, 144543.0, 25970.0, 7936.0, 3055.0, 1351.0, 650.0, 358.0, 195.0, 121.0, 65.0, 41.0, 33.0, 20.0, 20.0, 6.0, 10.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.2412242889404297, -0.23403549194335938, -0.22684669494628906, -0.21965789794921875, -0.21246910095214844, -0.20528030395507812, -0.1980915069580078, -0.1909027099609375, -0.1837139129638672, -0.17652511596679688, -0.16933631896972656, -0.16214752197265625, -0.15495872497558594, -0.14776992797851562, -0.1405811309814453, -0.133392333984375, -0.1262035369873047, -0.11901473999023438, -0.11182594299316406, -0.10463714599609375, -0.09744834899902344, -0.09025955200195312, -0.08307075500488281, -0.0758819580078125, -0.06869316101074219, -0.061504364013671875, -0.05431556701660156, -0.04712677001953125, -0.03993797302246094, -0.032749176025390625, -0.025560379028320312, -0.01837158203125, -0.011182785034179688, -0.003993988037109375, 0.0031948089599609375, 0.01038360595703125, 0.017572402954101562, 0.024761199951171875, 0.03194999694824219, 0.0391387939453125, 0.04632759094238281, 0.053516387939453125, 0.06070518493652344, 0.06789398193359375, 0.07508277893066406, 0.08227157592773438, 0.08946037292480469, 0.096649169921875, 0.10383796691894531, 0.11102676391601562, 0.11821556091308594, 0.12540435791015625, 0.13259315490722656, 0.13978195190429688, 0.1469707489013672, 0.1541595458984375, 0.1613483428955078, 0.16853713989257812, 0.17572593688964844, 0.18291473388671875, 0.19010353088378906, 0.19729232788085938, 0.2044811248779297, 0.211669921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 9.0, 11.0, 13.0, 15.0, 23.0, 32.0, 33.0, 57.0, 114.0, 149.0, 131.0, 125.0, 72.0, 59.0, 37.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.957220077514648e-05, -7.724948227405548e-05, -7.492676377296448e-05, -7.260404527187347e-05, -7.028132677078247e-05, -6.795860826969147e-05, -6.563588976860046e-05, -6.331317126750946e-05, -6.099045276641846e-05, -5.8667734265327454e-05, -5.634501576423645e-05, -5.402229726314545e-05, -5.169957876205444e-05, -4.937686026096344e-05, -4.7054141759872437e-05, -4.473142325878143e-05, -4.240870475769043e-05, -4.0085986256599426e-05, -3.776326775550842e-05, -3.544054925441742e-05, -3.3117830753326416e-05, -3.079511225223541e-05, -2.847239375114441e-05, -2.6149675250053406e-05, -2.3826956748962402e-05, -2.15042382478714e-05, -1.9181519746780396e-05, -1.6858801245689392e-05, -1.4536082744598389e-05, -1.2213364243507385e-05, -9.890645742416382e-06, -7.567927241325378e-06, -5.245208740234375e-06, -2.9224902391433716e-06, -5.997717380523682e-07, 1.7229467630386353e-06, 4.045665264129639e-06, 6.368383765220642e-06, 8.691102266311646e-06, 1.1013820767402649e-05, 1.3336539268493652e-05, 1.5659257769584656e-05, 1.798197627067566e-05, 2.0304694771766663e-05, 2.2627413272857666e-05, 2.495013177394867e-05, 2.7272850275039673e-05, 2.9595568776130676e-05, 3.191828727722168e-05, 3.424100577831268e-05, 3.6563724279403687e-05, 3.888644278049469e-05, 4.120916128158569e-05, 4.35318797826767e-05, 4.58545982837677e-05, 4.8177316784858704e-05, 5.050003528594971e-05, 5.282275378704071e-05, 5.5145472288131714e-05, 5.746819078922272e-05, 5.979090929031372e-05, 6.211362779140472e-05, 6.443634629249573e-05, 6.675906479358673e-05, 6.908178329467773e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 16.0, 19.0, 31.0, 46.0, 66.0, 118.0, 181.0, 333.0, 621.0, 1247.0, 3229.0, 10143.0, 51304.0, 628873.0, 309141.0, 31158.0, 7334.0, 2414.0, 1030.0, 494.0, 236.0, 160.0, 106.0, 60.0, 42.0, 32.0, 20.0, 19.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2553977966308594, -0.24712371826171875, -0.23884963989257812, -0.2305755615234375, -0.22230148315429688, -0.21402740478515625, -0.20575332641601562, -0.197479248046875, -0.18920516967773438, -0.18093109130859375, -0.17265701293945312, -0.1643829345703125, -0.15610885620117188, -0.14783477783203125, -0.13956069946289062, -0.13128662109375, -0.12301254272460938, -0.11473846435546875, -0.10646438598632812, -0.0981903076171875, -0.08991622924804688, -0.08164215087890625, -0.07336807250976562, -0.065093994140625, -0.056819915771484375, -0.04854583740234375, -0.040271759033203125, -0.0319976806640625, -0.023723602294921875, -0.01544952392578125, -0.007175445556640625, 0.0010986328125, 0.009372711181640625, 0.01764678955078125, 0.025920867919921875, 0.0341949462890625, 0.042469024658203125, 0.05074310302734375, 0.059017181396484375, 0.067291259765625, 0.07556533813476562, 0.08383941650390625, 0.09211349487304688, 0.1003875732421875, 0.10866165161132812, 0.11693572998046875, 0.12520980834960938, 0.13348388671875, 0.14175796508789062, 0.15003204345703125, 0.15830612182617188, 0.1665802001953125, 0.17485427856445312, 0.18312835693359375, 0.19140243530273438, 0.199676513671875, 0.20795059204101562, 0.21622467041015625, 0.22449874877929688, 0.2327728271484375, 0.24104690551757812, 0.24932098388671875, 0.2575950622558594, 0.265869140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 2.0, 8.0, 11.0, 24.0, 27.0, 25.0, 51.0, 40.0, 69.0, 91.0, 85.0, 111.0, 92.0, 72.0, 66.0, 49.0, 34.0, 33.0, 15.0, 18.0, 9.0, 6.0, 10.0, 3.0, 9.0, 8.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2310791015625, -0.22455596923828125, -0.2180328369140625, -0.21150970458984375, -0.204986572265625, -0.19846343994140625, -0.1919403076171875, -0.18541717529296875, -0.17889404296875, -0.17237091064453125, -0.1658477783203125, -0.15932464599609375, -0.152801513671875, -0.14627838134765625, -0.1397552490234375, -0.13323211669921875, -0.126708984375, -0.12018585205078125, -0.1136627197265625, -0.10713958740234375, -0.100616455078125, -0.09409332275390625, -0.0875701904296875, -0.08104705810546875, -0.07452392578125, -0.06800079345703125, -0.0614776611328125, -0.05495452880859375, -0.048431396484375, -0.04190826416015625, -0.0353851318359375, -0.02886199951171875, -0.0223388671875, -0.01581573486328125, -0.0092926025390625, -0.00276947021484375, 0.003753662109375, 0.01027679443359375, 0.0167999267578125, 0.02332305908203125, 0.02984619140625, 0.03636932373046875, 0.0428924560546875, 0.04941558837890625, 0.055938720703125, 0.06246185302734375, 0.0689849853515625, 0.07550811767578125, 0.08203125, 0.08855438232421875, 0.0950775146484375, 0.10160064697265625, 0.108123779296875, 0.11464691162109375, 0.1211700439453125, 0.12769317626953125, 0.13421630859375, 0.14073944091796875, 0.1472625732421875, 0.15378570556640625, 0.160308837890625, 0.16683197021484375, 0.1733551025390625, 0.17987823486328125, 0.1864013671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 6.0, 11.0, 17.0, 42.0, 75.0, 130.0, 217.0, 185.0, 119.0, 94.0, 41.0, 21.0, 17.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6024069786071777, -2.4645769596099854, -2.326746940612793, -2.1889171600341797, -2.0510871410369873, -1.913257122039795, -1.775427222251892, -1.6375973224639893, -1.4997673034667969, -1.3619372844696045, -1.2241073846817017, -1.0862774848937988, -0.9484474658966064, -0.8106175065040588, -0.6727875471115112, -0.5349575877189636, -0.397127628326416, -0.2592976689338684, -0.1214677095413208, 0.016362249851226807, 0.15419220924377441, 0.292022168636322, 0.42985212802886963, 0.5676820874214172, 0.7055120468139648, 0.8433420062065125, 0.9811719655990601, 1.119001865386963, 1.2568318843841553, 1.3946619033813477, 1.5324918031692505, 1.6703217029571533, 1.808152198791504, 1.9459822177886963, 2.0838122367858887, 2.221642017364502, 2.3594720363616943, 2.4973020553588867, 2.6351318359375, 2.7729618549346924, 2.9107918739318848, 3.048621892929077, 3.1864519119262695, 3.324281692504883, 3.462111711502075, 3.5999417304992676, 3.737771511077881, 3.8756015300750732, 4.013431549072266, 4.151261329650879, 4.28909158706665, 4.426921367645264, 4.564751625061035, 4.702581405639648, 4.840411186218262, 4.978241443634033, 5.1160712242126465, 5.25390100479126, 5.391731262207031, 5.5295610427856445, 5.667390823364258, 5.805221080780029, 5.943050861358643, 6.080881118774414, 6.218710899353027]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 16.0, 14.0, 30.0, 27.0, 27.0, 35.0, 38.0, 44.0, 44.0, 54.0, 54.0, 78.0, 61.0, 64.0, 48.0, 47.0, 41.0, 35.0, 39.0, 28.0, 24.0, 18.0, 20.0, 17.0, 16.0, 12.0, 16.0, 7.0, 5.0, 0.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.039203643798828, -2.964172840118408, -2.8891422748565674, -2.8141114711761475, -2.7390806674957275, -2.6640501022338867, -2.589019298553467, -2.513988494873047, -2.438957691192627, -2.363926887512207, -2.288896322250366, -2.2138655185699463, -2.1388347148895264, -2.0638041496276855, -1.9887733459472656, -1.9137425422668457, -1.8387119770050049, -1.7636812925338745, -1.6886504888534546, -1.6136198043823242, -1.5385890007019043, -1.463558316230774, -1.3885276317596436, -1.3134968280792236, -1.2384661436080933, -1.163435459136963, -1.088404655456543, -1.0133739709854126, -0.9383432269096375, -0.8633124828338623, -0.7882817983627319, -0.7132510542869568, -0.6382205486297607, -0.5631898045539856, -0.48815909028053284, -0.4131283760070801, -0.33809763193130493, -0.2630668878555298, -0.18803617358207703, -0.11300545930862427, -0.03797471523284912, 0.03705601394176483, 0.11208674311637878, 0.18711747229099274, 0.2621482014656067, 0.33717894554138184, 0.4122096598148346, 0.48724037408828735, 0.5622711181640625, 0.6373018622398376, 0.7123326063156128, 0.7873632907867432, 0.8623940348625183, 0.9374247789382935, 1.0124554634094238, 1.0874862670898438, 1.1625169515609741, 1.2375476360321045, 1.3125784397125244, 1.3876091241836548, 1.4626398086547852, 1.537670612335205, 1.6127012968063354, 1.6877319812774658, 1.7627627849578857]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 12.0, 17.0, 24.0, 31.0, 69.0, 100.0, 186.0, 509.0, 1667.0, 8631.0, 130687.0, 4003160.0, 42550.0, 4765.0, 1106.0, 329.0, 143.0, 76.0, 46.0, 32.0, 34.0, 12.0, 14.0, 5.0, 10.0, 12.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.0673828125, -1.040252685546875, -1.01312255859375, -0.985992431640625, -0.9588623046875, -0.931732177734375, -0.90460205078125, -0.877471923828125, -0.850341796875, -0.823211669921875, -0.79608154296875, -0.768951416015625, -0.7418212890625, -0.714691162109375, -0.68756103515625, -0.660430908203125, -0.63330078125, -0.606170654296875, -0.57904052734375, -0.551910400390625, -0.5247802734375, -0.497650146484375, -0.47052001953125, -0.443389892578125, -0.416259765625, -0.389129638671875, -0.36199951171875, -0.334869384765625, -0.3077392578125, -0.280609130859375, -0.25347900390625, -0.226348876953125, -0.19921875, -0.172088623046875, -0.14495849609375, -0.117828369140625, -0.0906982421875, -0.063568115234375, -0.03643798828125, -0.009307861328125, 0.017822265625, 0.044952392578125, 0.07208251953125, 0.099212646484375, 0.1263427734375, 0.153472900390625, 0.18060302734375, 0.207733154296875, 0.23486328125, 0.261993408203125, 0.28912353515625, 0.316253662109375, 0.3433837890625, 0.370513916015625, 0.39764404296875, 0.424774169921875, 0.451904296875, 0.479034423828125, 0.50616455078125, 0.533294677734375, 0.5604248046875, 0.587554931640625, 0.61468505859375, 0.641815185546875, 0.6689453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 6.0, 9.0, 18.0, 21.0, 28.0, 50.0, 45.0, 52.0, 68.0, 67.0, 78.0, 68.0, 76.0, 64.0, 83.0, 53.0, 49.0, 42.0, 39.0, 28.0, 11.0, 13.0, 11.0, 12.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2256460189819336, -0.2200908660888672, -0.21453571319580078, -0.20898056030273438, -0.20342540740966797, -0.19787025451660156, -0.19231510162353516, -0.18675994873046875, -0.18120479583740234, -0.17564964294433594, -0.17009449005126953, -0.16453933715820312, -0.15898418426513672, -0.1534290313720703, -0.1478738784790039, -0.1423187255859375, -0.1367635726928711, -0.1312084197998047, -0.12565326690673828, -0.12009811401367188, -0.11454296112060547, -0.10898780822753906, -0.10343265533447266, -0.09787750244140625, -0.09232234954833984, -0.08676719665527344, -0.08121204376220703, -0.07565689086914062, -0.07010173797607422, -0.06454658508300781, -0.058991432189941406, -0.053436279296875, -0.047881126403808594, -0.04232597351074219, -0.03677082061767578, -0.031215667724609375, -0.02566051483154297, -0.020105361938476562, -0.014550209045410156, -0.00899505615234375, -0.0034399032592773438, 0.0021152496337890625, 0.007670402526855469, 0.013225555419921875, 0.01878070831298828, 0.024335861206054688, 0.029891014099121094, 0.0354461669921875, 0.041001319885253906, 0.04655647277832031, 0.05211162567138672, 0.057666778564453125, 0.06322193145751953, 0.06877708435058594, 0.07433223724365234, 0.07988739013671875, 0.08544254302978516, 0.09099769592285156, 0.09655284881591797, 0.10210800170898438, 0.10766315460205078, 0.11321830749511719, 0.1187734603881836, 0.12432861328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 12.0, 9.0, 19.0, 37.0, 61.0, 112.0, 219.0, 399.0, 955.0, 2148.0, 5832.0, 17944.0, 71740.0, 786245.0, 3109867.0, 152278.0, 30674.0, 9494.0, 3439.0, 1447.0, 635.0, 305.0, 161.0, 90.0, 55.0, 32.0, 15.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.3169097900390625, -0.303253173828125, -0.2895965576171875, -0.27593994140625, -0.2622833251953125, -0.248626708984375, -0.2349700927734375, -0.2213134765625, -0.2076568603515625, -0.194000244140625, -0.1803436279296875, -0.16668701171875, -0.1530303955078125, -0.139373779296875, -0.1257171630859375, -0.112060546875, -0.0984039306640625, -0.084747314453125, -0.0710906982421875, -0.05743408203125, -0.0437774658203125, -0.030120849609375, -0.0164642333984375, -0.0028076171875, 0.0108489990234375, 0.024505615234375, 0.0381622314453125, 0.05181884765625, 0.0654754638671875, 0.079132080078125, 0.0927886962890625, 0.1064453125, 0.1201019287109375, 0.133758544921875, 0.1474151611328125, 0.16107177734375, 0.1747283935546875, 0.188385009765625, 0.2020416259765625, 0.2156982421875, 0.2293548583984375, 0.243011474609375, 0.2566680908203125, 0.27032470703125, 0.2839813232421875, 0.297637939453125, 0.3112945556640625, 0.324951171875, 0.3386077880859375, 0.352264404296875, 0.3659210205078125, 0.37957763671875, 0.3932342529296875, 0.406890869140625, 0.4205474853515625, 0.4342041015625, 0.4478607177734375, 0.461517333984375, 0.4751739501953125, 0.48883056640625, 0.5024871826171875, 0.516143798828125, 0.5298004150390625, 0.54345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 8.0, 21.0, 14.0, 25.0, 29.0, 53.0, 89.0, 124.0, 183.0, 381.0, 734.0, 1073.0, 515.0, 289.0, 155.0, 93.0, 74.0, 51.0, 33.0, 20.0, 18.0, 11.0, 16.0, 9.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2823333740234375, -0.270233154296875, -0.2581329345703125, -0.24603271484375, -0.2339324951171875, -0.221832275390625, -0.2097320556640625, -0.1976318359375, -0.1855316162109375, -0.173431396484375, -0.1613311767578125, -0.14923095703125, -0.1371307373046875, -0.125030517578125, -0.1129302978515625, -0.100830078125, -0.0887298583984375, -0.076629638671875, -0.0645294189453125, -0.05242919921875, -0.0403289794921875, -0.028228759765625, -0.0161285400390625, -0.0040283203125, 0.0080718994140625, 0.020172119140625, 0.0322723388671875, 0.04437255859375, 0.0564727783203125, 0.068572998046875, 0.0806732177734375, 0.0927734375, 0.1048736572265625, 0.116973876953125, 0.1290740966796875, 0.14117431640625, 0.1532745361328125, 0.165374755859375, 0.1774749755859375, 0.1895751953125, 0.2016754150390625, 0.213775634765625, 0.2258758544921875, 0.23797607421875, 0.2500762939453125, 0.262176513671875, 0.2742767333984375, 0.286376953125, 0.2984771728515625, 0.310577392578125, 0.3226776123046875, 0.33477783203125, 0.3468780517578125, 0.358978271484375, 0.3710784912109375, 0.3831787109375, 0.3952789306640625, 0.407379150390625, 0.4194793701171875, 0.43157958984375, 0.4436798095703125, 0.455780029296875, 0.4678802490234375, 0.47998046875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 21.0, 31.0, 39.0, 70.0, 97.0, 133.0, 117.0, 124.0, 98.0, 73.0, 60.0, 38.0, 23.0, 5.0, 9.0, 5.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.598886013031006, -2.520750045776367, -2.4426143169403076, -2.364478349685669, -2.2863426208496094, -2.2082066535949707, -2.130070924758911, -2.0519349575042725, -1.973799228668213, -1.8956633806228638, -1.8175275325775146, -1.7393916845321655, -1.6612558364868164, -1.5831199884414673, -1.5049841403961182, -1.4268481731414795, -1.3487123250961304, -1.2705764770507812, -1.1924406290054321, -1.114304780960083, -1.0361689329147339, -0.9580330848693848, -0.8798971772193909, -0.8017613291740417, -0.7236254811286926, -0.6454896330833435, -0.5673537850379944, -0.4892179071903229, -0.41108205914497375, -0.33294621109962463, -0.2548103332519531, -0.176674485206604, -0.09853863716125488, -0.020402781665325165, 0.05773307383060455, 0.13586893677711487, 0.214004784822464, 0.2921406328678131, 0.3702765107154846, 0.44841235876083374, 0.5265482068061829, 0.604684054851532, 0.6828199028968811, 0.760955810546875, 0.8390916585922241, 0.9172275066375732, 0.9953633546829224, 1.0734992027282715, 1.1516350507736206, 1.2297708988189697, 1.3079067468643188, 1.386042594909668, 1.464178442955017, 1.5423142910003662, 1.6204502582550049, 1.6985859870910645, 1.7767219543457031, 1.8548578023910522, 1.9329936504364014, 2.01112961769104, 2.0892653465270996, 2.1674013137817383, 2.245537042617798, 2.3236730098724365, 2.401808738708496]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 7.0, 13.0, 13.0, 10.0, 20.0, 28.0, 15.0, 18.0, 25.0, 35.0, 45.0, 42.0, 50.0, 48.0, 44.0, 49.0, 40.0, 51.0, 51.0, 49.0, 31.0, 26.0, 37.0, 38.0, 34.0, 25.0, 17.0, 21.0, 19.0, 14.0, 17.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.406076192855835, -1.3600701093673706, -1.3140639066696167, -1.2680578231811523, -1.222051739692688, -1.176045536994934, -1.1300394535064697, -1.0840332508087158, -1.0380271673202515, -0.9920210242271423, -0.946014940738678, -0.9000087976455688, -0.8540026545524597, -0.8079965114593506, -0.7619904279708862, -0.7159842848777771, -0.6699782013893127, -0.6239720582962036, -0.5779659748077393, -0.5319598317146301, -0.485953688621521, -0.43994757533073425, -0.3939414620399475, -0.3479353189468384, -0.30192920565605164, -0.2559230923652649, -0.20991694927215576, -0.16391083598136902, -0.11790470778942108, -0.07189857959747314, -0.0258924663066864, 0.02011367678642273, 0.06611979007720947, 0.11212591826915741, 0.15813204646110535, 0.2041381597518921, 0.2501443028450012, 0.29615041613578796, 0.3421565294265747, 0.38816267251968384, 0.4341687858104706, 0.4801748991012573, 0.5261810421943665, 0.5721871852874756, 0.6181932687759399, 0.6641994118690491, 0.7102055549621582, 0.7562116384506226, 0.8022177815437317, 0.8482239246368408, 0.8942300081253052, 0.9402361512184143, 0.9862422943115234, 1.0322483777999878, 1.0782544612884521, 1.124260663986206, 1.1702667474746704, 1.2162728309631348, 1.2622790336608887, 1.308285117149353, 1.3542912006378174, 1.4002974033355713, 1.4463034868240356, 1.4923095703125, 1.538315773010254]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 14.0, 24.0, 32.0, 29.0, 60.0, 85.0, 98.0, 151.0, 213.0, 335.0, 455.0, 757.0, 1058.0, 1775.0, 2787.0, 4700.0, 8160.0, 14775.0, 29853.0, 68487.0, 190056.0, 403697.0, 187652.0, 67843.0, 29967.0, 14956.0, 8102.0, 4692.0, 2755.0, 1687.0, 1082.0, 738.0, 447.0, 309.0, 205.0, 169.0, 97.0, 60.0, 56.0, 36.0, 25.0, 23.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.2395801544189453, -0.23172378540039062, -0.22386741638183594, -0.21601104736328125, -0.20815467834472656, -0.20029830932617188, -0.1924419403076172, -0.1845855712890625, -0.1767292022705078, -0.16887283325195312, -0.16101646423339844, -0.15316009521484375, -0.14530372619628906, -0.13744735717773438, -0.1295909881591797, -0.121734619140625, -0.11387825012207031, -0.10602188110351562, -0.09816551208496094, -0.09030914306640625, -0.08245277404785156, -0.07459640502929688, -0.06674003601074219, -0.0588836669921875, -0.05102729797363281, -0.043170928955078125, -0.03531455993652344, -0.02745819091796875, -0.019601821899414062, -0.011745452880859375, -0.0038890838623046875, 0.00396728515625, 0.011823654174804688, 0.019680023193359375, 0.027536392211914062, 0.03539276123046875, 0.04324913024902344, 0.051105499267578125, 0.05896186828613281, 0.0668182373046875, 0.07467460632324219, 0.08253097534179688, 0.09038734436035156, 0.09824371337890625, 0.10610008239746094, 0.11395645141601562, 0.12181282043457031, 0.129669189453125, 0.1375255584716797, 0.14538192749023438, 0.15323829650878906, 0.16109466552734375, 0.16895103454589844, 0.17680740356445312, 0.1846637725830078, 0.1925201416015625, 0.2003765106201172, 0.20823287963867188, 0.21608924865722656, 0.22394561767578125, 0.23180198669433594, 0.23965835571289062, 0.2475147247314453, 0.25537109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 18.0, 18.0, 18.0, 40.0, 43.0, 50.0, 58.0, 61.0, 65.0, 65.0, 63.0, 74.0, 70.0, 55.0, 59.0, 36.0, 42.0, 37.0, 21.0, 22.0, 20.0, 8.0, 6.0, 9.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.22412109375, -0.21869850158691406, -0.21327590942382812, -0.2078533172607422, -0.20243072509765625, -0.1970081329345703, -0.19158554077148438, -0.18616294860839844, -0.1807403564453125, -0.17531776428222656, -0.16989517211914062, -0.1644725799560547, -0.15904998779296875, -0.1536273956298828, -0.14820480346679688, -0.14278221130371094, -0.137359619140625, -0.13193702697753906, -0.12651443481445312, -0.12109184265136719, -0.11566925048828125, -0.11024665832519531, -0.10482406616210938, -0.09940147399902344, -0.0939788818359375, -0.08855628967285156, -0.08313369750976562, -0.07771110534667969, -0.07228851318359375, -0.06686592102050781, -0.061443328857421875, -0.05602073669433594, -0.05059814453125, -0.04517555236816406, -0.039752960205078125, -0.03433036804199219, -0.02890777587890625, -0.023485183715820312, -0.018062591552734375, -0.012639999389648438, -0.0072174072265625, -0.0017948150634765625, 0.003627777099609375, 0.009050369262695312, 0.01447296142578125, 0.019895553588867188, 0.025318145751953125, 0.030740737915039062, 0.036163330078125, 0.04158592224121094, 0.047008514404296875, 0.05243110656738281, 0.05785369873046875, 0.06327629089355469, 0.06869888305664062, 0.07412147521972656, 0.0795440673828125, 0.08496665954589844, 0.09038925170898438, 0.09581184387207031, 0.10123443603515625, 0.10665702819824219, 0.11207962036132812, 0.11750221252441406, 0.1229248046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 14.0, 19.0, 31.0, 35.0, 44.0, 71.0, 92.0, 146.0, 188.0, 331.0, 499.0, 869.0, 1621.0, 3403.0, 8548.0, 24844.0, 98805.0, 656414.0, 192052.0, 38542.0, 12223.0, 4744.0, 2105.0, 1111.0, 612.0, 339.0, 252.0, 165.0, 94.0, 79.0, 51.0, 51.0, 38.0, 18.0, 17.0, 14.0, 11.0, 5.0, 2.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.431640625, -0.4180145263671875, -0.404388427734375, -0.3907623291015625, -0.37713623046875, -0.3635101318359375, -0.349884033203125, -0.3362579345703125, -0.3226318359375, -0.3090057373046875, -0.295379638671875, -0.2817535400390625, -0.26812744140625, -0.2545013427734375, -0.240875244140625, -0.2272491455078125, -0.213623046875, -0.1999969482421875, -0.186370849609375, -0.1727447509765625, -0.15911865234375, -0.1454925537109375, -0.131866455078125, -0.1182403564453125, -0.1046142578125, -0.0909881591796875, -0.077362060546875, -0.0637359619140625, -0.05010986328125, -0.0364837646484375, -0.022857666015625, -0.0092315673828125, 0.00439453125, 0.0180206298828125, 0.031646728515625, 0.0452728271484375, 0.05889892578125, 0.0725250244140625, 0.086151123046875, 0.0997772216796875, 0.1134033203125, 0.1270294189453125, 0.140655517578125, 0.1542816162109375, 0.16790771484375, 0.1815338134765625, 0.195159912109375, 0.2087860107421875, 0.222412109375, 0.2360382080078125, 0.249664306640625, 0.2632904052734375, 0.27691650390625, 0.2905426025390625, 0.304168701171875, 0.3177947998046875, 0.3314208984375, 0.3450469970703125, 0.358673095703125, 0.3722991943359375, 0.38592529296875, 0.3995513916015625, 0.413177490234375, 0.4268035888671875, 0.4404296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 21.0, 13.0, 15.0, 19.0, 24.0, 30.0, 28.0, 29.0, 38.0, 50.0, 51.0, 58.0, 62.0, 50.0, 47.0, 46.0, 58.0, 61.0, 49.0, 40.0, 41.0, 29.0, 29.0, 16.0, 12.0, 9.0, 8.0, 6.0, 7.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5829925537109375, -0.564910888671875, -0.5468292236328125, -0.52874755859375, -0.5106658935546875, -0.492584228515625, -0.4745025634765625, -0.4564208984375, -0.4383392333984375, -0.420257568359375, -0.4021759033203125, -0.38409423828125, -0.3660125732421875, -0.347930908203125, -0.3298492431640625, -0.311767578125, -0.2936859130859375, -0.275604248046875, -0.2575225830078125, -0.23944091796875, -0.2213592529296875, -0.203277587890625, -0.1851959228515625, -0.1671142578125, -0.1490325927734375, -0.130950927734375, -0.1128692626953125, -0.09478759765625, -0.0767059326171875, -0.058624267578125, -0.0405426025390625, -0.0224609375, -0.0043792724609375, 0.013702392578125, 0.0317840576171875, 0.04986572265625, 0.0679473876953125, 0.086029052734375, 0.1041107177734375, 0.1221923828125, 0.1402740478515625, 0.158355712890625, 0.1764373779296875, 0.19451904296875, 0.2126007080078125, 0.230682373046875, 0.2487640380859375, 0.266845703125, 0.2849273681640625, 0.303009033203125, 0.3210906982421875, 0.33917236328125, 0.3572540283203125, 0.375335693359375, 0.3934173583984375, 0.4114990234375, 0.4295806884765625, 0.447662353515625, 0.4657440185546875, 0.48382568359375, 0.5019073486328125, 0.519989013671875, 0.5380706787109375, 0.55615234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 7.0, 13.0, 17.0, 18.0, 42.0, 105.0, 227.0, 552.0, 1737.0, 7587.0, 75188.0, 864464.0, 87383.0, 8246.0, 1856.0, 617.0, 245.0, 101.0, 54.0, 24.0, 21.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.3939056396484375, -0.380096435546875, -0.3662872314453125, -0.35247802734375, -0.3386688232421875, -0.324859619140625, -0.3110504150390625, -0.2972412109375, -0.2834320068359375, -0.269622802734375, -0.2558135986328125, -0.24200439453125, -0.2281951904296875, -0.214385986328125, -0.2005767822265625, -0.186767578125, -0.1729583740234375, -0.159149169921875, -0.1453399658203125, -0.13153076171875, -0.1177215576171875, -0.103912353515625, -0.0901031494140625, -0.0762939453125, -0.0624847412109375, -0.048675537109375, -0.0348663330078125, -0.02105712890625, -0.0072479248046875, 0.006561279296875, 0.0203704833984375, 0.0341796875, 0.0479888916015625, 0.061798095703125, 0.0756072998046875, 0.08941650390625, 0.1032257080078125, 0.117034912109375, 0.1308441162109375, 0.1446533203125, 0.1584625244140625, 0.172271728515625, 0.1860809326171875, 0.19989013671875, 0.2136993408203125, 0.227508544921875, 0.2413177490234375, 0.255126953125, 0.2689361572265625, 0.282745361328125, 0.2965545654296875, 0.31036376953125, 0.3241729736328125, 0.337982177734375, 0.3517913818359375, 0.3656005859375, 0.3794097900390625, 0.393218994140625, 0.4070281982421875, 0.42083740234375, 0.4346466064453125, 0.448455810546875, 0.4622650146484375, 0.47607421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 7.0, 10.0, 8.0, 9.0, 23.0, 25.0, 41.0, 60.0, 69.0, 93.0, 117.0, 123.0, 102.0, 71.0, 63.0, 43.0, 30.0, 31.0, 19.0, 13.0, 6.0, 4.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.900859832763672e-05, -5.699321627616882e-05, -5.497783422470093e-05, -5.296245217323303e-05, -5.094707012176514e-05, -4.893168807029724e-05, -4.6916306018829346e-05, -4.490092396736145e-05, -4.2885541915893555e-05, -4.087015986442566e-05, -3.8854777812957764e-05, -3.683939576148987e-05, -3.482401371002197e-05, -3.280863165855408e-05, -3.079324960708618e-05, -2.8777867555618286e-05, -2.676248550415039e-05, -2.4747103452682495e-05, -2.27317214012146e-05, -2.0716339349746704e-05, -1.870095729827881e-05, -1.6685575246810913e-05, -1.4670193195343018e-05, -1.2654811143875122e-05, -1.0639429092407227e-05, -8.624047040939331e-06, -6.6086649894714355e-06, -4.59328293800354e-06, -2.5779008865356445e-06, -5.62518835067749e-07, 1.4528632164001465e-06, 3.468245267868042e-06, 5.4836273193359375e-06, 7.499009370803833e-06, 9.514391422271729e-06, 1.1529773473739624e-05, 1.354515552520752e-05, 1.5560537576675415e-05, 1.757591962814331e-05, 1.9591301679611206e-05, 2.16066837310791e-05, 2.3622065782546997e-05, 2.5637447834014893e-05, 2.7652829885482788e-05, 2.9668211936950684e-05, 3.168359398841858e-05, 3.3698976039886475e-05, 3.571435809135437e-05, 3.7729740142822266e-05, 3.974512219429016e-05, 4.176050424575806e-05, 4.377588629722595e-05, 4.579126834869385e-05, 4.780665040016174e-05, 4.982203245162964e-05, 5.1837414503097534e-05, 5.385279655456543e-05, 5.5868178606033325e-05, 5.788356065750122e-05, 5.9898942708969116e-05, 6.191432476043701e-05, 6.392970681190491e-05, 6.59450888633728e-05, 6.79604709148407e-05, 6.99758529663086e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 24.0, 45.0, 68.0, 124.0, 180.0, 271.0, 490.0, 1007.0, 2215.0, 6206.0, 22785.0, 143713.0, 706437.0, 133068.0, 21515.0, 6052.0, 2073.0, 952.0, 486.0, 258.0, 165.0, 100.0, 87.0, 33.0, 35.0, 16.0, 22.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2754402160644531, -0.26767730712890625, -0.2599143981933594, -0.2521514892578125, -0.24438858032226562, -0.23662567138671875, -0.22886276245117188, -0.221099853515625, -0.21333694458007812, -0.20557403564453125, -0.19781112670898438, -0.1900482177734375, -0.18228530883789062, -0.17452239990234375, -0.16675949096679688, -0.15899658203125, -0.15123367309570312, -0.14347076416015625, -0.13570785522460938, -0.1279449462890625, -0.12018203735351562, -0.11241912841796875, -0.10465621948242188, -0.096893310546875, -0.08913040161132812, -0.08136749267578125, -0.07360458374023438, -0.0658416748046875, -0.058078765869140625, -0.05031585693359375, -0.042552947998046875, -0.0347900390625, -0.027027130126953125, -0.01926422119140625, -0.011501312255859375, -0.0037384033203125, 0.004024505615234375, 0.01178741455078125, 0.019550323486328125, 0.027313232421875, 0.035076141357421875, 0.04283905029296875, 0.050601959228515625, 0.0583648681640625, 0.06612777709960938, 0.07389068603515625, 0.08165359497070312, 0.08941650390625, 0.09717941284179688, 0.10494232177734375, 0.11270523071289062, 0.1204681396484375, 0.12823104858398438, 0.13599395751953125, 0.14375686645507812, 0.151519775390625, 0.15928268432617188, 0.16704559326171875, 0.17480850219726562, 0.1825714111328125, 0.19033432006835938, 0.19809722900390625, 0.20586013793945312, 0.213623046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 3.0, 8.0, 10.0, 18.0, 20.0, 24.0, 40.0, 39.0, 57.0, 47.0, 68.0, 96.0, 88.0, 79.0, 81.0, 59.0, 49.0, 47.0, 34.0, 24.0, 18.0, 12.0, 12.0, 7.0, 9.0, 7.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2423095703125, -0.2360210418701172, -0.22973251342773438, -0.22344398498535156, -0.21715545654296875, -0.21086692810058594, -0.20457839965820312, -0.1982898712158203, -0.1920013427734375, -0.1857128143310547, -0.17942428588867188, -0.17313575744628906, -0.16684722900390625, -0.16055870056152344, -0.15427017211914062, -0.1479816436767578, -0.141693115234375, -0.1354045867919922, -0.12911605834960938, -0.12282752990722656, -0.11653900146484375, -0.11025047302246094, -0.10396194458007812, -0.09767341613769531, -0.0913848876953125, -0.08509635925292969, -0.07880783081054688, -0.07251930236816406, -0.06623077392578125, -0.05994224548339844, -0.053653717041015625, -0.04736518859863281, -0.04107666015625, -0.03478813171386719, -0.028499603271484375, -0.022211074829101562, -0.01592254638671875, -0.009634017944335938, -0.003345489501953125, 0.0029430389404296875, 0.0092315673828125, 0.015520095825195312, 0.021808624267578125, 0.028097152709960938, 0.03438568115234375, 0.04067420959472656, 0.046962738037109375, 0.05325126647949219, 0.059539794921875, 0.06582832336425781, 0.07211685180664062, 0.07840538024902344, 0.08469390869140625, 0.09098243713378906, 0.09727096557617188, 0.10355949401855469, 0.1098480224609375, 0.11613655090332031, 0.12242507934570312, 0.12871360778808594, 0.13500213623046875, 0.14129066467285156, 0.14757919311523438, 0.1538677215576172, 0.16015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 10.0, 13.0, 20.0, 48.0, 60.0, 96.0, 118.0, 157.0, 140.0, 115.0, 70.0, 55.0, 31.0, 19.0, 15.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.539969444274902, -4.439096927642822, -4.338224411010742, -4.237351894378662, -4.136479377746582, -4.035606861114502, -3.934734582901001, -3.833862066268921, -3.732989549636841, -3.6321170330047607, -3.5312445163726807, -3.4303722381591797, -3.3294997215270996, -3.2286272048950195, -3.1277546882629395, -3.0268821716308594, -2.9260096549987793, -2.825137138366699, -2.724264621734619, -2.623392105102539, -2.522519826889038, -2.421647310256958, -2.320774793624878, -2.219902276992798, -2.119029998779297, -2.018157482147217, -1.9172850847244263, -1.8164125680923462, -1.7155400514602661, -1.6146676540374756, -1.5137951374053955, -1.4129226207733154, -1.3120501041412354, -1.2111775875091553, -1.1103051900863647, -1.0094326734542847, -0.9085601568222046, -0.8076876997947693, -0.706815242767334, -0.6059427261352539, -0.5050702691078186, -0.4041977822780609, -0.3033252954483032, -0.20245283842086792, -0.10158035159111023, -0.0007078647613525391, 0.10016459226608276, 0.20103710889816284, 0.30190956592559814, 0.40278205275535583, 0.5036545395851135, 0.6045269966125488, 0.7053995132446289, 0.8062719702720642, 0.9071444272994995, 1.0080169439315796, 1.1088893413543701, 1.2097618579864502, 1.3106342554092407, 1.4115067720413208, 1.5123792886734009, 1.6132516860961914, 1.7141242027282715, 1.8149967193603516, 1.9158692359924316]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 9.0, 13.0, 20.0, 19.0, 18.0, 16.0, 22.0, 21.0, 28.0, 26.0, 33.0, 30.0, 38.0, 47.0, 42.0, 49.0, 46.0, 43.0, 41.0, 44.0, 44.0, 31.0, 33.0, 36.0, 26.0, 18.0, 26.0, 31.0, 15.0, 21.0, 17.0, 11.0, 11.0, 12.0, 4.0, 11.0, 3.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.971482753753662, -1.9116636514663696, -1.8518446683883667, -1.7920255661010742, -1.7322065830230713, -1.6723874807357788, -1.6125683784484863, -1.5527493953704834, -1.4929304122924805, -1.433111310005188, -1.373292326927185, -1.3134732246398926, -1.2536542415618896, -1.1938351392745972, -1.1340160369873047, -1.0741970539093018, -1.0143779516220093, -0.9545589089393616, -0.8947398662567139, -0.8349207639694214, -0.7751017808914185, -0.715282678604126, -0.6554636359214783, -0.5956445932388306, -0.5358255505561829, -0.47600650787353516, -0.41618746519088745, -0.35636839270591736, -0.29654935002326965, -0.23673030734062195, -0.17691123485565186, -0.11709219217300415, -0.057273030281066895, 0.0025460198521614075, 0.06236506998538971, 0.12218412756919861, 0.1820031702518463, 0.24182221293449402, 0.3016412854194641, 0.3614603281021118, 0.4212793707847595, 0.4810984134674072, 0.5409174561500549, 0.6007364988327026, 0.6605556011199951, 0.720374584197998, 0.7801936864852905, 0.8400127291679382, 0.8998317718505859, 0.9596508145332336, 1.0194698572158813, 1.0792889595031738, 1.1391079425811768, 1.1989270448684692, 1.2587461471557617, 1.3185651302337646, 1.3783841133117676, 1.43820321559906, 1.498022198677063, 1.5578413009643555, 1.6176602840423584, 1.6774793863296509, 1.7372984886169434, 1.7971174716949463, 1.8569365739822388]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 15.0, 22.0, 32.0, 42.0, 76.0, 117.0, 171.0, 319.0, 417.0, 704.0, 1192.0, 1962.0, 3469.0, 6523.0, 12811.0, 29526.0, 84100.0, 374297.0, 2225782.0, 1167311.0, 189165.0, 53749.0, 20990.0, 9645.0, 5053.0, 2709.0, 1534.0, 954.0, 561.0, 374.0, 232.0, 164.0, 91.0, 55.0, 42.0, 27.0, 12.0, 14.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.26953125, -0.2629241943359375, -0.256317138671875, -0.2497100830078125, -0.24310302734375, -0.2364959716796875, -0.229888916015625, -0.2232818603515625, -0.2166748046875, -0.2100677490234375, -0.203460693359375, -0.1968536376953125, -0.19024658203125, -0.1836395263671875, -0.177032470703125, -0.1704254150390625, -0.163818359375, -0.1572113037109375, -0.150604248046875, -0.1439971923828125, -0.13739013671875, -0.1307830810546875, -0.124176025390625, -0.1175689697265625, -0.1109619140625, -0.1043548583984375, -0.097747802734375, -0.0911407470703125, -0.08453369140625, -0.0779266357421875, -0.071319580078125, -0.0647125244140625, -0.05810546875, -0.0514984130859375, -0.044891357421875, -0.0382843017578125, -0.03167724609375, -0.0250701904296875, -0.018463134765625, -0.0118560791015625, -0.0052490234375, 0.0013580322265625, 0.007965087890625, 0.0145721435546875, 0.02117919921875, 0.0277862548828125, 0.034393310546875, 0.0410003662109375, 0.047607421875, 0.0542144775390625, 0.060821533203125, 0.0674285888671875, 0.07403564453125, 0.0806427001953125, 0.087249755859375, 0.0938568115234375, 0.1004638671875, 0.1070709228515625, 0.113677978515625, 0.1202850341796875, 0.12689208984375, 0.1334991455078125, 0.140106201171875, 0.1467132568359375, 0.1533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 10.0, 11.0, 13.0, 24.0, 33.0, 22.0, 39.0, 44.0, 51.0, 41.0, 55.0, 60.0, 55.0, 60.0, 53.0, 58.0, 48.0, 39.0, 47.0, 45.0, 32.0, 25.0, 29.0, 15.0, 21.0, 18.0, 12.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14482784271240234, -0.1406078338623047, -0.13638782501220703, -0.13216781616210938, -0.12794780731201172, -0.12372779846191406, -0.1195077896118164, -0.11528778076171875, -0.1110677719116211, -0.10684776306152344, -0.10262775421142578, -0.09840774536132812, -0.09418773651123047, -0.08996772766113281, -0.08574771881103516, -0.0815277099609375, -0.07730770111083984, -0.07308769226074219, -0.06886768341064453, -0.06464767456054688, -0.06042766571044922, -0.05620765686035156, -0.051987648010253906, -0.04776763916015625, -0.043547630310058594, -0.03932762145996094, -0.03510761260986328, -0.030887603759765625, -0.02666759490966797, -0.022447586059570312, -0.018227577209472656, -0.014007568359375, -0.009787559509277344, -0.0055675506591796875, -0.0013475418090820312, 0.002872467041015625, 0.007092475891113281, 0.011312484741210938, 0.015532493591308594, 0.01975250244140625, 0.023972511291503906, 0.028192520141601562, 0.03241252899169922, 0.036632537841796875, 0.04085254669189453, 0.04507255554199219, 0.049292564392089844, 0.0535125732421875, 0.057732582092285156, 0.06195259094238281, 0.06617259979248047, 0.07039260864257812, 0.07461261749267578, 0.07883262634277344, 0.0830526351928711, 0.08727264404296875, 0.0914926528930664, 0.09571266174316406, 0.09993267059326172, 0.10415267944335938, 0.10837268829345703, 0.11259269714355469, 0.11681270599365234, 0.12103271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 6.0, 8.0, 20.0, 21.0, 40.0, 75.0, 117.0, 226.0, 417.0, 980.0, 2549.0, 7829.0, 31170.0, 184446.0, 2961484.0, 898544.0, 81404.0, 16999.0, 4849.0, 1732.0, 665.0, 287.0, 143.0, 96.0, 54.0, 34.0, 22.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.515625, -0.5016098022460938, -0.4875946044921875, -0.47357940673828125, -0.459564208984375, -0.44554901123046875, -0.4315338134765625, -0.41751861572265625, -0.40350341796875, -0.38948822021484375, -0.3754730224609375, -0.36145782470703125, -0.347442626953125, -0.33342742919921875, -0.3194122314453125, -0.30539703369140625, -0.2913818359375, -0.27736663818359375, -0.2633514404296875, -0.24933624267578125, -0.235321044921875, -0.22130584716796875, -0.2072906494140625, -0.19327545166015625, -0.17926025390625, -0.16524505615234375, -0.1512298583984375, -0.13721466064453125, -0.123199462890625, -0.10918426513671875, -0.0951690673828125, -0.08115386962890625, -0.067138671875, -0.05312347412109375, -0.0391082763671875, -0.02509307861328125, -0.011077880859375, 0.00293731689453125, 0.0169525146484375, 0.03096771240234375, 0.04498291015625, 0.05899810791015625, 0.0730133056640625, 0.08702850341796875, 0.101043701171875, 0.11505889892578125, 0.1290740966796875, 0.14308929443359375, 0.1571044921875, 0.17111968994140625, 0.1851348876953125, 0.19915008544921875, 0.213165283203125, 0.22718048095703125, 0.2411956787109375, 0.25521087646484375, 0.26922607421875, 0.28324127197265625, 0.2972564697265625, 0.31127166748046875, 0.325286865234375, 0.33930206298828125, 0.3533172607421875, 0.36733245849609375, 0.38134765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 10.0, 10.0, 20.0, 27.0, 30.0, 34.0, 44.0, 60.0, 83.0, 124.0, 182.0, 277.0, 476.0, 666.0, 668.0, 453.0, 271.0, 187.0, 114.0, 83.0, 61.0, 42.0, 31.0, 27.0, 11.0, 16.0, 8.0, 12.0, 7.0, 5.0, 7.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36522674560546875, -0.3530120849609375, -0.34079742431640625, -0.328582763671875, -0.31636810302734375, -0.3041534423828125, -0.29193878173828125, -0.27972412109375, -0.26750946044921875, -0.2552947998046875, -0.24308013916015625, -0.230865478515625, -0.21865081787109375, -0.2064361572265625, -0.19422149658203125, -0.1820068359375, -0.16979217529296875, -0.1575775146484375, -0.14536285400390625, -0.133148193359375, -0.12093353271484375, -0.1087188720703125, -0.09650421142578125, -0.08428955078125, -0.07207489013671875, -0.0598602294921875, -0.04764556884765625, -0.035430908203125, -0.02321624755859375, -0.0110015869140625, 0.00121307373046875, 0.013427734375, 0.02564239501953125, 0.0378570556640625, 0.05007171630859375, 0.062286376953125, 0.07450103759765625, 0.0867156982421875, 0.09893035888671875, 0.11114501953125, 0.12335968017578125, 0.1355743408203125, 0.14778900146484375, 0.160003662109375, 0.17221832275390625, 0.1844329833984375, 0.19664764404296875, 0.2088623046875, 0.22107696533203125, 0.2332916259765625, 0.24550628662109375, 0.257720947265625, 0.26993560791015625, 0.2821502685546875, 0.29436492919921875, 0.30657958984375, 0.31879425048828125, 0.3310089111328125, 0.34322357177734375, 0.355438232421875, 0.36765289306640625, 0.3798675537109375, 0.39208221435546875, 0.404296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 10.0, 16.0, 12.0, 64.0, 123.0, 236.0, 244.0, 151.0, 66.0, 41.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.866659164428711, -7.679159164428711, -7.491659641265869, -7.304160118103027, -7.116660118103027, -6.929160118103027, -6.7416605949401855, -6.554161071777344, -6.366661071777344, -6.179161071777344, -5.991661548614502, -5.80416202545166, -5.61666202545166, -5.42916202545166, -5.241662502288818, -5.054162979125977, -4.866662979125977, -4.679162979125977, -4.491663455963135, -4.304163932800293, -4.116663932800293, -3.929164171218872, -3.741664409637451, -3.5541646480560303, -3.3666648864746094, -3.1791651248931885, -2.9916653633117676, -2.8041656017303467, -2.616665840148926, -2.429166078567505, -2.241666316986084, -2.054166555404663, -1.8666667938232422, -1.6791670322418213, -1.4916672706604004, -1.3041675090789795, -1.1166677474975586, -0.9291679859161377, -0.7416682243347168, -0.5541684627532959, -0.366668701171875, -0.1791689395904541, 0.008330821990966797, 0.1958305835723877, 0.3833303451538086, 0.5708301067352295, 0.7583298683166504, 0.9458296298980713, 1.1333293914794922, 1.320829153060913, 1.508328914642334, 1.6958286762237549, 1.8833284378051758, 2.0708281993865967, 2.2583279609680176, 2.4458277225494385, 2.6333274841308594, 2.8208272457122803, 3.008327007293701, 3.195826768875122, 3.383326530456543, 3.570826292037964, 3.7583260536193848, 3.9458258152008057, 4.133325576782227]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 15.0, 16.0, 22.0, 23.0, 26.0, 26.0, 33.0, 32.0, 40.0, 45.0, 42.0, 42.0, 52.0, 49.0, 45.0, 49.0, 50.0, 53.0, 52.0, 37.0, 31.0, 28.0, 38.0, 24.0, 29.0, 13.0, 16.0, 9.0, 14.0, 9.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.54189133644104, -2.473738670349121, -2.405586004257202, -2.337433338165283, -2.2692806720733643, -2.2011280059814453, -2.1329753398895264, -2.0648226737976074, -1.996670126914978, -1.928517460823059, -1.8603647947311401, -1.7922121286392212, -1.7240595817565918, -1.6559069156646729, -1.587754249572754, -1.519601583480835, -1.451448917388916, -1.383296251296997, -1.3151435852050781, -1.2469909191131592, -1.1788382530212402, -1.1106855869293213, -1.042533040046692, -0.974380373954773, -0.906227707862854, -0.8380750417709351, -0.7699223756790161, -0.7017697691917419, -0.633617103099823, -0.565464437007904, -0.4973118007183075, -0.42915916442871094, -0.3610062599182129, -0.29285359382629395, -0.2247009575366974, -0.15654830634593964, -0.08839565515518188, -0.02024298906326294, 0.04790964722633362, 0.11606228351593018, 0.18421494960784912, 0.25236761569976807, 0.3205202519893646, 0.3886728882789612, 0.4568255543708801, 0.5249782204627991, 0.5931308269500732, 0.6612834930419922, 0.7294361591339111, 0.7975888252258301, 0.865741491317749, 0.9338940978050232, 1.002046823501587, 1.0701994895935059, 1.1383520364761353, 1.2065047025680542, 1.2746573686599731, 1.342810034751892, 1.410962700843811, 1.47911536693573, 1.5472679138183594, 1.6154205799102783, 1.6835732460021973, 1.7517259120941162, 1.8198785781860352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 5.0, 16.0, 20.0, 30.0, 32.0, 62.0, 90.0, 136.0, 193.0, 252.0, 409.0, 681.0, 966.0, 1451.0, 2437.0, 3995.0, 6966.0, 11797.0, 21835.0, 41057.0, 80007.0, 167887.0, 312523.0, 197987.0, 92835.0, 46604.0, 25000.0, 13607.0, 7663.0, 4436.0, 2740.0, 1681.0, 1066.0, 714.0, 451.0, 301.0, 212.0, 143.0, 68.0, 54.0, 42.0, 29.0, 27.0, 15.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.220947265625, -0.2137279510498047, -0.20650863647460938, -0.19928932189941406, -0.19207000732421875, -0.18485069274902344, -0.17763137817382812, -0.1704120635986328, -0.1631927490234375, -0.1559734344482422, -0.14875411987304688, -0.14153480529785156, -0.13431549072265625, -0.12709617614746094, -0.11987686157226562, -0.11265754699707031, -0.105438232421875, -0.09821891784667969, -0.09099960327148438, -0.08378028869628906, -0.07656097412109375, -0.06934165954589844, -0.062122344970703125, -0.05490303039550781, -0.0476837158203125, -0.04046440124511719, -0.033245086669921875, -0.026025772094726562, -0.01880645751953125, -0.011587142944335938, -0.004367828369140625, 0.0028514862060546875, 0.01007080078125, 0.017290115356445312, 0.024509429931640625, 0.03172874450683594, 0.03894805908203125, 0.04616737365722656, 0.053386688232421875, 0.06060600280761719, 0.0678253173828125, 0.07504463195800781, 0.08226394653320312, 0.08948326110839844, 0.09670257568359375, 0.10392189025878906, 0.11114120483398438, 0.11836051940917969, 0.125579833984375, 0.1327991485595703, 0.14001846313476562, 0.14723777770996094, 0.15445709228515625, 0.16167640686035156, 0.16889572143554688, 0.1761150360107422, 0.1833343505859375, 0.1905536651611328, 0.19777297973632812, 0.20499229431152344, 0.21221160888671875, 0.21943092346191406, 0.22665023803710938, 0.2338695526123047, 0.2410888671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 13.0, 12.0, 12.0, 14.0, 18.0, 17.0, 28.0, 32.0, 35.0, 43.0, 41.0, 45.0, 50.0, 58.0, 48.0, 39.0, 65.0, 35.0, 41.0, 48.0, 51.0, 57.0, 43.0, 20.0, 16.0, 22.0, 22.0, 13.0, 15.0, 11.0, 11.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11138916015625, -0.10715198516845703, -0.10291481018066406, -0.0986776351928711, -0.09444046020507812, -0.09020328521728516, -0.08596611022949219, -0.08172893524169922, -0.07749176025390625, -0.07325458526611328, -0.06901741027832031, -0.06478023529052734, -0.060543060302734375, -0.056305885314941406, -0.05206871032714844, -0.04783153533935547, -0.0435943603515625, -0.03935718536376953, -0.03512001037597656, -0.030882835388183594, -0.026645660400390625, -0.022408485412597656, -0.018171310424804688, -0.013934135437011719, -0.00969696044921875, -0.005459785461425781, -0.0012226104736328125, 0.0030145645141601562, 0.007251739501953125, 0.011488914489746094, 0.015726089477539062, 0.01996326446533203, 0.024200439453125, 0.02843761444091797, 0.03267478942871094, 0.036911964416503906, 0.041149139404296875, 0.045386314392089844, 0.04962348937988281, 0.05386066436767578, 0.05809783935546875, 0.06233501434326172, 0.06657218933105469, 0.07080936431884766, 0.07504653930664062, 0.0792837142944336, 0.08352088928222656, 0.08775806427001953, 0.0919952392578125, 0.09623241424560547, 0.10046958923339844, 0.1047067642211914, 0.10894393920898438, 0.11318111419677734, 0.11741828918457031, 0.12165546417236328, 0.12589263916015625, 0.13012981414794922, 0.1343669891357422, 0.13860416412353516, 0.14284133911132812, 0.1470785140991211, 0.15131568908691406, 0.15555286407470703, 0.1597900390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 20.0, 17.0, 22.0, 38.0, 36.0, 39.0, 64.0, 87.0, 130.0, 172.0, 240.0, 320.0, 537.0, 839.0, 1409.0, 2575.0, 5433.0, 15115.0, 58780.0, 491457.0, 389110.0, 55641.0, 14581.0, 5482.0, 2491.0, 1378.0, 766.0, 554.0, 310.0, 258.0, 179.0, 122.0, 89.0, 75.0, 44.0, 31.0, 33.0, 19.0, 8.0, 12.0, 14.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0], "bins": [-0.58349609375, -0.567718505859375, -0.55194091796875, -0.536163330078125, -0.5203857421875, -0.504608154296875, -0.48883056640625, -0.473052978515625, -0.457275390625, -0.441497802734375, -0.42572021484375, -0.409942626953125, -0.3941650390625, -0.378387451171875, -0.36260986328125, -0.346832275390625, -0.3310546875, -0.315277099609375, -0.29949951171875, -0.283721923828125, -0.2679443359375, -0.252166748046875, -0.23638916015625, -0.220611572265625, -0.204833984375, -0.189056396484375, -0.17327880859375, -0.157501220703125, -0.1417236328125, -0.125946044921875, -0.11016845703125, -0.094390869140625, -0.07861328125, -0.062835693359375, -0.04705810546875, -0.031280517578125, -0.0155029296875, 0.000274658203125, 0.01605224609375, 0.031829833984375, 0.047607421875, 0.063385009765625, 0.07916259765625, 0.094940185546875, 0.1107177734375, 0.126495361328125, 0.14227294921875, 0.158050537109375, 0.173828125, 0.189605712890625, 0.20538330078125, 0.221160888671875, 0.2369384765625, 0.252716064453125, 0.26849365234375, 0.284271240234375, 0.300048828125, 0.315826416015625, 0.33160400390625, 0.347381591796875, 0.3631591796875, 0.378936767578125, 0.39471435546875, 0.410491943359375, 0.42626953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 10.0, 7.0, 9.0, 14.0, 7.0, 23.0, 20.0, 21.0, 25.0, 35.0, 37.0, 48.0, 44.0, 31.0, 40.0, 38.0, 55.0, 48.0, 49.0, 40.0, 46.0, 40.0, 48.0, 40.0, 37.0, 28.0, 26.0, 29.0, 19.0, 16.0, 12.0, 9.0, 8.0, 12.0, 4.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5719680786132812, -0.5536041259765625, -0.5352401733398438, -0.516876220703125, -0.49851226806640625, -0.4801483154296875, -0.46178436279296875, -0.44342041015625, -0.42505645751953125, -0.4066925048828125, -0.38832855224609375, -0.369964599609375, -0.35160064697265625, -0.3332366943359375, -0.31487274169921875, -0.2965087890625, -0.27814483642578125, -0.2597808837890625, -0.24141693115234375, -0.223052978515625, -0.20468902587890625, -0.1863250732421875, -0.16796112060546875, -0.14959716796875, -0.13123321533203125, -0.1128692626953125, -0.09450531005859375, -0.076141357421875, -0.05777740478515625, -0.0394134521484375, -0.02104949951171875, -0.002685546875, 0.01567840576171875, 0.0340423583984375, 0.05240631103515625, 0.070770263671875, 0.08913421630859375, 0.1074981689453125, 0.12586212158203125, 0.14422607421875, 0.16259002685546875, 0.1809539794921875, 0.19931793212890625, 0.217681884765625, 0.23604583740234375, 0.2544097900390625, 0.27277374267578125, 0.2911376953125, 0.30950164794921875, 0.3278656005859375, 0.34622955322265625, 0.364593505859375, 0.38295745849609375, 0.4013214111328125, 0.41968536376953125, 0.43804931640625, 0.45641326904296875, 0.4747772216796875, 0.49314117431640625, 0.511505126953125, 0.5298690795898438, 0.5482330322265625, 0.5665969848632812, 0.5849609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 10.0, 7.0, 17.0, 42.0, 51.0, 104.0, 146.0, 329.0, 652.0, 1443.0, 4244.0, 16462.0, 88921.0, 657308.0, 230269.0, 36202.0, 8079.0, 2436.0, 939.0, 392.0, 201.0, 106.0, 57.0, 45.0, 15.0, 18.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21511077880859375, -0.2085418701171875, -0.20197296142578125, -0.195404052734375, -0.18883514404296875, -0.1822662353515625, -0.17569732666015625, -0.16912841796875, -0.16255950927734375, -0.1559906005859375, -0.14942169189453125, -0.142852783203125, -0.13628387451171875, -0.1297149658203125, -0.12314605712890625, -0.1165771484375, -0.11000823974609375, -0.1034393310546875, -0.09687042236328125, -0.090301513671875, -0.08373260498046875, -0.0771636962890625, -0.07059478759765625, -0.06402587890625, -0.05745697021484375, -0.0508880615234375, -0.04431915283203125, -0.037750244140625, -0.03118133544921875, -0.0246124267578125, -0.01804351806640625, -0.011474609375, -0.00490570068359375, 0.0016632080078125, 0.00823211669921875, 0.014801025390625, 0.02136993408203125, 0.0279388427734375, 0.03450775146484375, 0.04107666015625, 0.04764556884765625, 0.0542144775390625, 0.06078338623046875, 0.067352294921875, 0.07392120361328125, 0.0804901123046875, 0.08705902099609375, 0.0936279296875, 0.10019683837890625, 0.1067657470703125, 0.11333465576171875, 0.119903564453125, 0.12647247314453125, 0.1330413818359375, 0.13961029052734375, 0.14617919921875, 0.15274810791015625, 0.1593170166015625, 0.16588592529296875, 0.172454833984375, 0.17902374267578125, 0.1855926513671875, 0.19216156005859375, 0.19873046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 10.0, 7.0, 10.0, 5.0, 15.0, 15.0, 15.0, 28.0, 21.0, 31.0, 39.0, 47.0, 57.0, 68.0, 77.0, 100.0, 70.0, 61.0, 49.0, 46.0, 33.0, 36.0, 32.0, 18.0, 16.0, 15.0, 13.0, 8.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.857778549194336e-05, -4.704948514699936e-05, -4.552118480205536e-05, -4.399288445711136e-05, -4.246458411216736e-05, -4.093628376722336e-05, -3.940798342227936e-05, -3.787968307733536e-05, -3.635138273239136e-05, -3.482308238744736e-05, -3.329478204250336e-05, -3.176648169755936e-05, -3.0238181352615356e-05, -2.8709881007671356e-05, -2.7181580662727356e-05, -2.5653280317783356e-05, -2.4124979972839355e-05, -2.2596679627895355e-05, -2.1068379282951355e-05, -1.9540078938007355e-05, -1.8011778593063354e-05, -1.6483478248119354e-05, -1.4955177903175354e-05, -1.3426877558231354e-05, -1.1898577213287354e-05, -1.0370276868343353e-05, -8.841976523399353e-06, -7.313676178455353e-06, -5.7853758335113525e-06, -4.257075488567352e-06, -2.728775143623352e-06, -1.2004747986793518e-06, 3.2782554626464844e-07, 1.8561258912086487e-06, 3.384426236152649e-06, 4.912726581096649e-06, 6.441026926040649e-06, 7.96932727098465e-06, 9.49762761592865e-06, 1.102592796087265e-05, 1.255422830581665e-05, 1.408252865076065e-05, 1.561082899570465e-05, 1.713912934064865e-05, 1.866742968559265e-05, 2.019573003053665e-05, 2.1724030375480652e-05, 2.3252330720424652e-05, 2.4780631065368652e-05, 2.6308931410312653e-05, 2.7837231755256653e-05, 2.9365532100200653e-05, 3.089383244514465e-05, 3.2422132790088654e-05, 3.3950433135032654e-05, 3.5478733479976654e-05, 3.7007033824920654e-05, 3.8535334169864655e-05, 4.0063634514808655e-05, 4.1591934859752655e-05, 4.3120235204696655e-05, 4.4648535549640656e-05, 4.6176835894584656e-05, 4.7705136239528656e-05, 4.9233436584472656e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 11.0, 18.0, 30.0, 52.0, 95.0, 185.0, 332.0, 769.0, 1861.0, 5715.0, 29937.0, 367690.0, 593314.0, 37961.0, 6715.0, 2160.0, 865.0, 414.0, 224.0, 99.0, 45.0, 35.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184326171875, -0.17633056640625, -0.1683349609375, -0.16033935546875, -0.15234375, -0.14434814453125, -0.1363525390625, -0.12835693359375, -0.120361328125, -0.11236572265625, -0.1043701171875, -0.09637451171875, -0.08837890625, -0.08038330078125, -0.0723876953125, -0.06439208984375, -0.056396484375, -0.04840087890625, -0.0404052734375, -0.03240966796875, -0.0244140625, -0.01641845703125, -0.0084228515625, -0.00042724609375, 0.007568359375, 0.01556396484375, 0.0235595703125, 0.03155517578125, 0.03955078125, 0.04754638671875, 0.0555419921875, 0.06353759765625, 0.071533203125, 0.07952880859375, 0.0875244140625, 0.09552001953125, 0.103515625, 0.11151123046875, 0.1195068359375, 0.12750244140625, 0.135498046875, 0.14349365234375, 0.1514892578125, 0.15948486328125, 0.16748046875, 0.17547607421875, 0.1834716796875, 0.19146728515625, 0.199462890625, 0.20745849609375, 0.2154541015625, 0.22344970703125, 0.2314453125, 0.23944091796875, 0.2474365234375, 0.25543212890625, 0.263427734375, 0.27142333984375, 0.2794189453125, 0.28741455078125, 0.29541015625, 0.30340576171875, 0.3114013671875, 0.31939697265625, 0.327392578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 7.0, 15.0, 13.0, 14.0, 8.0, 16.0, 20.0, 25.0, 33.0, 31.0, 38.0, 39.0, 44.0, 54.0, 65.0, 62.0, 53.0, 57.0, 46.0, 45.0, 46.0, 44.0, 27.0, 30.0, 21.0, 25.0, 17.0, 16.0, 19.0, 14.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1414794921875, -0.13768291473388672, -0.13388633728027344, -0.13008975982666016, -0.12629318237304688, -0.1224966049194336, -0.11870002746582031, -0.11490345001220703, -0.11110687255859375, -0.10731029510498047, -0.10351371765136719, -0.0997171401977539, -0.09592056274414062, -0.09212398529052734, -0.08832740783691406, -0.08453083038330078, -0.0807342529296875, -0.07693767547607422, -0.07314109802246094, -0.06934452056884766, -0.06554794311523438, -0.061751365661621094, -0.05795478820800781, -0.05415821075439453, -0.05036163330078125, -0.04656505584716797, -0.04276847839355469, -0.038971900939941406, -0.035175323486328125, -0.031378746032714844, -0.027582168579101562, -0.02378559112548828, -0.019989013671875, -0.01619243621826172, -0.012395858764648438, -0.008599281311035156, -0.004802703857421875, -0.0010061264038085938, 0.0027904510498046875, 0.006587028503417969, 0.01038360595703125, 0.014180183410644531, 0.017976760864257812, 0.021773338317871094, 0.025569915771484375, 0.029366493225097656, 0.03316307067871094, 0.03695964813232422, 0.0407562255859375, 0.04455280303955078, 0.04834938049316406, 0.052145957946777344, 0.055942535400390625, 0.059739112854003906, 0.06353569030761719, 0.06733226776123047, 0.07112884521484375, 0.07492542266845703, 0.07872200012207031, 0.0825185775756836, 0.08631515502929688, 0.09011173248291016, 0.09390830993652344, 0.09770488739013672, 0.10150146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 12.0, 11.0, 17.0, 43.0, 70.0, 80.0, 142.0, 246.0, 145.0, 97.0, 60.0, 24.0, 16.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6263699531555176, -3.50262713432312, -3.3788843154907227, -3.255141496658325, -3.1313986778259277, -3.0076558589935303, -2.883913040161133, -2.7601704597473145, -2.636427402496338, -2.5126845836639404, -2.388941764831543, -2.2651989459991455, -2.141456127166748, -2.0177133083343506, -1.8939706087112427, -1.7702277898788452, -1.6464850902557373, -1.5227422714233398, -1.3989994525909424, -1.275256633758545, -1.1515138149261475, -1.02777099609375, -0.9040282964706421, -0.7802854776382446, -0.6565426588058472, -0.5327998399734497, -0.40905705094337463, -0.28531426191329956, -0.1615714430809021, -0.03782862424850464, 0.08591413497924805, 0.2096569538116455, 0.33339977264404297, 0.45714259147644043, 0.5808854103088379, 0.7046281695365906, 0.828370988368988, 0.9521138072013855, 1.0758565664291382, 1.1995993852615356, 1.323342204093933, 1.4470850229263306, 1.570827841758728, 1.694570541381836, 1.8183133602142334, 1.9420561790466309, 2.0657989978790283, 2.189541816711426, 2.3132846355438232, 2.4370274543762207, 2.560770273208618, 2.6845130920410156, 2.808255910873413, 2.9319987297058105, 3.055741310119629, 3.1794843673706055, 3.303226947784424, 3.4269697666168213, 3.5507125854492188, 3.674455404281616, 3.7981982231140137, 3.921941041946411, 4.045683860778809, 4.169426441192627, 4.2931694984436035]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 9.0, 13.0, 14.0, 21.0, 10.0, 22.0, 26.0, 30.0, 27.0, 34.0, 36.0, 37.0, 53.0, 54.0, 59.0, 76.0, 73.0, 55.0, 39.0, 41.0, 35.0, 30.0, 31.0, 24.0, 23.0, 18.0, 18.0, 11.0, 11.0, 11.0, 7.0, 12.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5546655654907227, -2.4808285236358643, -2.406991481781006, -2.3331542015075684, -2.25931715965271, -2.1854801177978516, -2.111642837524414, -2.0378057956695557, -1.9639687538146973, -1.8901317119598389, -1.816294550895691, -1.742457389831543, -1.6686203479766846, -1.5947833061218262, -1.5209461450576782, -1.4471089839935303, -1.3732719421386719, -1.2994349002838135, -1.2255977392196655, -1.1517605781555176, -1.0779235363006592, -1.0040864944458008, -0.9302493333816528, -0.8564122319221497, -0.7825751304626465, -0.7087380290031433, -0.6349009275436401, -0.561063826084137, -0.4872267246246338, -0.4133896231651306, -0.33955252170562744, -0.26571542024612427, -0.191878080368042, -0.11804097890853882, -0.044203877449035645, 0.02963322401046753, 0.1034703254699707, 0.17730742692947388, 0.25114452838897705, 0.3249816298484802, 0.3988187313079834, 0.4726558327674866, 0.5464929342269897, 0.6203300356864929, 0.6941671371459961, 0.7680042386054993, 0.8418413400650024, 0.9156784415245056, 0.9895155429840088, 1.0633525848388672, 1.1371897459030151, 1.211026906967163, 1.2848639488220215, 1.3587009906768799, 1.4325381517410278, 1.5063753128051758, 1.5802123546600342, 1.6540493965148926, 1.7278865575790405, 1.8017237186431885, 1.8755607604980469, 1.9493978023529053, 2.0232348442077637, 2.097072124481201, 2.1709091663360596]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 35.0, 48.0, 75.0, 140.0, 226.0, 386.0, 668.0, 1412.0, 2940.0, 7077.0, 18012.0, 55475.0, 245241.0, 1584984.0, 1889823.0, 292761.0, 61198.0, 19378.0, 7568.0, 3226.0, 1510.0, 872.0, 456.0, 264.0, 167.0, 106.0, 77.0, 42.0, 19.0, 24.0, 14.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.2039642333984375, -0.197601318359375, -0.1912384033203125, -0.18487548828125, -0.1785125732421875, -0.172149658203125, -0.1657867431640625, -0.159423828125, -0.1530609130859375, -0.146697998046875, -0.1403350830078125, -0.13397216796875, -0.1276092529296875, -0.121246337890625, -0.1148834228515625, -0.1085205078125, -0.1021575927734375, -0.095794677734375, -0.0894317626953125, -0.08306884765625, -0.0767059326171875, -0.070343017578125, -0.0639801025390625, -0.0576171875, -0.0512542724609375, -0.044891357421875, -0.0385284423828125, -0.03216552734375, -0.0258026123046875, -0.019439697265625, -0.0130767822265625, -0.0067138671875, -0.0003509521484375, 0.006011962890625, 0.0123748779296875, 0.01873779296875, 0.0251007080078125, 0.031463623046875, 0.0378265380859375, 0.044189453125, 0.0505523681640625, 0.056915283203125, 0.0632781982421875, 0.06964111328125, 0.0760040283203125, 0.082366943359375, 0.0887298583984375, 0.0950927734375, 0.1014556884765625, 0.107818603515625, 0.1141815185546875, 0.12054443359375, 0.1269073486328125, 0.133270263671875, 0.1396331787109375, 0.14599609375, 0.1523590087890625, 0.158721923828125, 0.1650848388671875, 0.17144775390625, 0.1778106689453125, 0.184173583984375, 0.1905364990234375, 0.1968994140625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 9.0, 12.0, 10.0, 12.0, 14.0, 21.0, 33.0, 30.0, 33.0, 46.0, 48.0, 54.0, 65.0, 67.0, 77.0, 60.0, 59.0, 59.0, 43.0, 39.0, 30.0, 32.0, 27.0, 21.0, 22.0, 20.0, 16.0, 15.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11224365234375, -0.10732555389404297, -0.10240745544433594, -0.0974893569946289, -0.09257125854492188, -0.08765316009521484, -0.08273506164550781, -0.07781696319580078, -0.07289886474609375, -0.06798076629638672, -0.06306266784667969, -0.058144569396972656, -0.053226470947265625, -0.048308372497558594, -0.04339027404785156, -0.03847217559814453, -0.0335540771484375, -0.02863597869873047, -0.023717880249023438, -0.018799781799316406, -0.013881683349609375, -0.008963584899902344, -0.0040454864501953125, 0.0008726119995117188, 0.00579071044921875, 0.010708808898925781, 0.015626907348632812, 0.020545005798339844, 0.025463104248046875, 0.030381202697753906, 0.03529930114746094, 0.04021739959716797, 0.045135498046875, 0.05005359649658203, 0.05497169494628906, 0.059889793395996094, 0.06480789184570312, 0.06972599029541016, 0.07464408874511719, 0.07956218719482422, 0.08448028564453125, 0.08939838409423828, 0.09431648254394531, 0.09923458099365234, 0.10415267944335938, 0.1090707778930664, 0.11398887634277344, 0.11890697479248047, 0.1238250732421875, 0.12874317169189453, 0.13366127014160156, 0.1385793685913086, 0.14349746704101562, 0.14841556549072266, 0.1533336639404297, 0.15825176239013672, 0.16316986083984375, 0.16808795928955078, 0.1730060577392578, 0.17792415618896484, 0.18284225463867188, 0.1877603530883789, 0.19267845153808594, 0.19759654998779297, 0.2025146484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 31.0, 54.0, 64.0, 112.0, 238.0, 492.0, 1437.0, 4415.0, 16917.0, 88505.0, 1210431.0, 2684663.0, 154346.0, 23710.0, 5707.0, 1808.0, 680.0, 276.0, 114.0, 97.0, 48.0, 30.0, 17.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.400146484375, -0.3876991271972656, -0.37525177001953125, -0.3628044128417969, -0.3503570556640625, -0.3379096984863281, -0.32546234130859375, -0.3130149841308594, -0.300567626953125, -0.2881202697753906, -0.27567291259765625, -0.2632255554199219, -0.2507781982421875, -0.23833084106445312, -0.22588348388671875, -0.21343612670898438, -0.20098876953125, -0.18854141235351562, -0.17609405517578125, -0.16364669799804688, -0.1511993408203125, -0.13875198364257812, -0.12630462646484375, -0.11385726928710938, -0.101409912109375, -0.08896255493164062, -0.07651519775390625, -0.06406784057617188, -0.0516204833984375, -0.039173126220703125, -0.02672576904296875, -0.014278411865234375, -0.0018310546875, 0.010616302490234375, 0.02306365966796875, 0.035511016845703125, 0.0479583740234375, 0.060405731201171875, 0.07285308837890625, 0.08530044555664062, 0.097747802734375, 0.11019515991210938, 0.12264251708984375, 0.13508987426757812, 0.1475372314453125, 0.15998458862304688, 0.17243194580078125, 0.18487930297851562, 0.19732666015625, 0.20977401733398438, 0.22222137451171875, 0.23466873168945312, 0.2471160888671875, 0.2595634460449219, 0.27201080322265625, 0.2844581604003906, 0.296905517578125, 0.3093528747558594, 0.32180023193359375, 0.3342475891113281, 0.3466949462890625, 0.3591423034667969, 0.37158966064453125, 0.3840370178222656, 0.396484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 10.0, 4.0, 12.0, 9.0, 13.0, 16.0, 29.0, 36.0, 41.0, 69.0, 90.0, 126.0, 159.0, 243.0, 336.0, 494.0, 585.0, 537.0, 362.0, 272.0, 192.0, 117.0, 92.0, 55.0, 30.0, 35.0, 18.0, 19.0, 12.0, 12.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2677803039550781, -0.25772857666015625, -0.24767684936523438, -0.2376251220703125, -0.22757339477539062, -0.21752166748046875, -0.20746994018554688, -0.197418212890625, -0.18736648559570312, -0.17731475830078125, -0.16726303100585938, -0.1572113037109375, -0.14715957641601562, -0.13710784912109375, -0.12705612182617188, -0.11700439453125, -0.10695266723632812, -0.09690093994140625, -0.08684921264648438, -0.0767974853515625, -0.06674575805664062, -0.05669403076171875, -0.046642303466796875, -0.036590576171875, -0.026538848876953125, -0.01648712158203125, -0.006435394287109375, 0.0036163330078125, 0.013668060302734375, 0.02371978759765625, 0.033771514892578125, 0.0438232421875, 0.053874969482421875, 0.06392669677734375, 0.07397842407226562, 0.0840301513671875, 0.09408187866210938, 0.10413360595703125, 0.11418533325195312, 0.124237060546875, 0.13428878784179688, 0.14434051513671875, 0.15439224243164062, 0.1644439697265625, 0.17449569702148438, 0.18454742431640625, 0.19459915161132812, 0.20465087890625, 0.21470260620117188, 0.22475433349609375, 0.23480606079101562, 0.2448577880859375, 0.2549095153808594, 0.26496124267578125, 0.2750129699707031, 0.285064697265625, 0.2951164245605469, 0.30516815185546875, 0.3152198791503906, 0.3252716064453125, 0.3353233337402344, 0.34537506103515625, 0.3554267883300781, 0.365478515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 14.0, 23.0, 38.0, 81.0, 147.0, 195.0, 207.0, 138.0, 72.0, 28.0, 15.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.727634906768799, -3.5950684547424316, -3.4625022411346436, -3.3299360275268555, -3.1973695755004883, -3.064803123474121, -2.932236909866333, -2.799670696258545, -2.6671042442321777, -2.5345377922058105, -2.4019715785980225, -2.2694053649902344, -2.136838912963867, -2.0042724609375, -1.871706247329712, -1.7391399145126343, -1.6065735816955566, -1.474007248878479, -1.3414409160614014, -1.2088745832443237, -1.076308250427246, -0.9437419176101685, -0.8111755847930908, -0.6786092519760132, -0.5460429191589355, -0.4134765863418579, -0.2809102535247803, -0.14834392070770264, -0.015777587890625, 0.11678874492645264, 0.24935507774353027, 0.3819214105606079, 0.5144882202148438, 0.6470545530319214, 0.779620885848999, 0.9121872186660767, 1.0447535514831543, 1.177319884300232, 1.3098862171173096, 1.4424525499343872, 1.5750188827514648, 1.7075852155685425, 1.8401515483856201, 1.9727178812026978, 2.1052842140197754, 2.2378506660461426, 2.3704168796539307, 2.5029830932617188, 2.635549545288086, 2.768115997314453, 2.900682210922241, 3.0332484245300293, 3.1658148765563965, 3.2983813285827637, 3.4309475421905518, 3.56351375579834, 3.696080207824707, 3.828646659851074, 3.9612128734588623, 4.09377908706665, 4.226345539093018, 4.358911991119385, 4.491477966308594, 4.624044418334961, 4.756610870361328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 8.0, 11.0, 14.0, 11.0, 11.0, 19.0, 21.0, 24.0, 27.0, 36.0, 39.0, 53.0, 36.0, 60.0, 53.0, 37.0, 42.0, 49.0, 64.0, 50.0, 41.0, 26.0, 43.0, 44.0, 29.0, 29.0, 19.0, 19.0, 10.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666301965713501, -1.609972596168518, -1.5536432266235352, -1.4973138570785522, -1.4409844875335693, -1.384655237197876, -1.328325867652893, -1.2719964981079102, -1.2156671285629272, -1.1593377590179443, -1.1030083894729614, -1.0466790199279785, -0.9903497099876404, -0.9340203404426575, -0.8776910305023193, -0.8213616609573364, -0.7650322914123535, -0.7087029218673706, -0.6523735523223877, -0.5960442423820496, -0.5397148728370667, -0.48338550329208374, -0.4270561635494232, -0.3707268238067627, -0.3143974542617798, -0.2580680847167969, -0.20173874497413635, -0.14540939033031464, -0.08908003568649292, -0.03275066614151001, 0.023578673601150513, 0.07990801334381104, 0.13623738288879395, 0.19256673753261566, 0.24889609217643738, 0.3052254319190979, 0.3615548014640808, 0.4178841710090637, 0.47421351075172424, 0.5305428504943848, 0.5868722200393677, 0.6432015895843506, 0.6995309591293335, 0.7558602690696716, 0.8121896386146545, 0.8685190081596375, 0.9248483180999756, 0.9811776876449585, 1.0375070571899414, 1.0938364267349243, 1.1501657962799072, 1.2064951658248901, 1.262824535369873, 1.3191537857055664, 1.3754831552505493, 1.4318125247955322, 1.4881418943405151, 1.544471263885498, 1.600800633430481, 1.6571300029754639, 1.7134592533111572, 1.7697887420654297, 1.826117992401123, 1.882447361946106, 1.9387767314910889]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 11.0, 15.0, 20.0, 23.0, 50.0, 44.0, 56.0, 128.0, 144.0, 221.0, 353.0, 544.0, 881.0, 1341.0, 2262.0, 3728.0, 7031.0, 14129.0, 30714.0, 76185.0, 224629.0, 417329.0, 159960.0, 58179.0, 24651.0, 11326.0, 5928.0, 3328.0, 1870.0, 1193.0, 703.0, 506.0, 339.0, 226.0, 152.0, 105.0, 78.0, 39.0, 38.0, 23.0, 21.0, 9.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.23987579345703125, -0.2317047119140625, -0.22353363037109375, -0.215362548828125, -0.20719146728515625, -0.1990203857421875, -0.19084930419921875, -0.18267822265625, -0.17450714111328125, -0.1663360595703125, -0.15816497802734375, -0.149993896484375, -0.14182281494140625, -0.1336517333984375, -0.12548065185546875, -0.1173095703125, -0.10913848876953125, -0.1009674072265625, -0.09279632568359375, -0.084625244140625, -0.07645416259765625, -0.0682830810546875, -0.06011199951171875, -0.05194091796875, -0.04376983642578125, -0.0355987548828125, -0.02742767333984375, -0.019256591796875, -0.01108551025390625, -0.0029144287109375, 0.00525665283203125, 0.013427734375, 0.02159881591796875, 0.0297698974609375, 0.03794097900390625, 0.046112060546875, 0.05428314208984375, 0.0624542236328125, 0.07062530517578125, 0.07879638671875, 0.08696746826171875, 0.0951385498046875, 0.10330963134765625, 0.111480712890625, 0.11965179443359375, 0.1278228759765625, 0.13599395751953125, 0.1441650390625, 0.15233612060546875, 0.1605072021484375, 0.16867828369140625, 0.176849365234375, 0.18502044677734375, 0.1931915283203125, 0.20136260986328125, 0.20953369140625, 0.21770477294921875, 0.2258758544921875, 0.23404693603515625, 0.242218017578125, 0.25038909912109375, 0.2585601806640625, 0.26673126220703125, 0.27490234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 16.0, 18.0, 18.0, 24.0, 30.0, 40.0, 38.0, 60.0, 39.0, 57.0, 48.0, 55.0, 60.0, 60.0, 45.0, 48.0, 30.0, 42.0, 43.0, 27.0, 28.0, 25.0, 20.0, 22.0, 15.0, 19.0, 10.0, 5.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12234115600585938, -0.11785125732421875, -0.11336135864257812, -0.1088714599609375, -0.10438156127929688, -0.09989166259765625, -0.09540176391601562, -0.090911865234375, -0.08642196655273438, -0.08193206787109375, -0.07744216918945312, -0.0729522705078125, -0.06846237182617188, -0.06397247314453125, -0.059482574462890625, -0.05499267578125, -0.050502777099609375, -0.04601287841796875, -0.041522979736328125, -0.0370330810546875, -0.032543182373046875, -0.02805328369140625, -0.023563385009765625, -0.019073486328125, -0.014583587646484375, -0.01009368896484375, -0.005603790283203125, -0.0011138916015625, 0.003376007080078125, 0.00786590576171875, 0.012355804443359375, 0.016845703125, 0.021335601806640625, 0.02582550048828125, 0.030315399169921875, 0.0348052978515625, 0.039295196533203125, 0.04378509521484375, 0.048274993896484375, 0.052764892578125, 0.057254791259765625, 0.06174468994140625, 0.06623458862304688, 0.0707244873046875, 0.07521438598632812, 0.07970428466796875, 0.08419418334960938, 0.08868408203125, 0.09317398071289062, 0.09766387939453125, 0.10215377807617188, 0.1066436767578125, 0.11113357543945312, 0.11562347412109375, 0.12011337280273438, 0.124603271484375, 0.12909317016601562, 0.13358306884765625, 0.13807296752929688, 0.1425628662109375, 0.14705276489257812, 0.15154266357421875, 0.15603256225585938, 0.1605224609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 10.0, 12.0, 17.0, 14.0, 22.0, 32.0, 35.0, 61.0, 73.0, 102.0, 129.0, 185.0, 257.0, 361.0, 620.0, 1052.0, 1832.0, 3929.0, 9715.0, 32124.0, 166642.0, 702983.0, 92613.0, 21187.0, 7250.0, 3041.0, 1502.0, 903.0, 565.0, 375.0, 243.0, 167.0, 119.0, 97.0, 60.0, 60.0, 43.0, 26.0, 22.0, 17.0, 14.0, 7.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.4008979797363281, -0.38675689697265625, -0.3726158142089844, -0.3584747314453125, -0.3443336486816406, -0.33019256591796875, -0.3160514831542969, -0.301910400390625, -0.2877693176269531, -0.27362823486328125, -0.2594871520996094, -0.2453460693359375, -0.23120498657226562, -0.21706390380859375, -0.20292282104492188, -0.18878173828125, -0.17464065551757812, -0.16049957275390625, -0.14635848999023438, -0.1322174072265625, -0.11807632446289062, -0.10393524169921875, -0.08979415893554688, -0.075653076171875, -0.061511993408203125, -0.04737091064453125, -0.033229827880859375, -0.0190887451171875, -0.004947662353515625, 0.00919342041015625, 0.023334503173828125, 0.0374755859375, 0.051616668701171875, 0.06575775146484375, 0.07989883422851562, 0.0940399169921875, 0.10818099975585938, 0.12232208251953125, 0.13646316528320312, 0.150604248046875, 0.16474533081054688, 0.17888641357421875, 0.19302749633789062, 0.2071685791015625, 0.22130966186523438, 0.23545074462890625, 0.24959182739257812, 0.26373291015625, 0.2778739929199219, 0.29201507568359375, 0.3061561584472656, 0.3202972412109375, 0.3344383239746094, 0.34857940673828125, 0.3627204895019531, 0.376861572265625, 0.3910026550292969, 0.40514373779296875, 0.4192848205566406, 0.4334259033203125, 0.4475669860839844, 0.46170806884765625, 0.4758491516113281, 0.489990234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 13.0, 17.0, 11.0, 17.0, 21.0, 31.0, 35.0, 28.0, 37.0, 25.0, 39.0, 50.0, 55.0, 49.0, 53.0, 69.0, 46.0, 49.0, 36.0, 39.0, 42.0, 33.0, 31.0, 21.0, 22.0, 16.0, 16.0, 16.0, 15.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.63525390625, -0.61700439453125, -0.5987548828125, -0.58050537109375, -0.562255859375, -0.54400634765625, -0.5257568359375, -0.50750732421875, -0.4892578125, -0.47100830078125, -0.4527587890625, -0.43450927734375, -0.416259765625, -0.39801025390625, -0.3797607421875, -0.36151123046875, -0.34326171875, -0.32501220703125, -0.3067626953125, -0.28851318359375, -0.270263671875, -0.25201416015625, -0.2337646484375, -0.21551513671875, -0.197265625, -0.17901611328125, -0.1607666015625, -0.14251708984375, -0.124267578125, -0.10601806640625, -0.0877685546875, -0.06951904296875, -0.05126953125, -0.03302001953125, -0.0147705078125, 0.00347900390625, 0.021728515625, 0.03997802734375, 0.0582275390625, 0.07647705078125, 0.0947265625, 0.11297607421875, 0.1312255859375, 0.14947509765625, 0.167724609375, 0.18597412109375, 0.2042236328125, 0.22247314453125, 0.24072265625, 0.25897216796875, 0.2772216796875, 0.29547119140625, 0.313720703125, 0.33197021484375, 0.3502197265625, 0.36846923828125, 0.38671875, 0.40496826171875, 0.4232177734375, 0.44146728515625, 0.459716796875, 0.47796630859375, 0.4962158203125, 0.51446533203125, 0.53271484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 6.0, 15.0, 10.0, 22.0, 22.0, 36.0, 42.0, 80.0, 96.0, 138.0, 295.0, 454.0, 878.0, 1852.0, 4548.0, 14288.0, 57714.0, 332995.0, 540610.0, 68509.0, 16520.0, 5128.0, 1996.0, 930.0, 508.0, 322.0, 169.0, 124.0, 64.0, 48.0, 32.0, 22.0, 19.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1895751953125, -0.1838397979736328, -0.17810440063476562, -0.17236900329589844, -0.16663360595703125, -0.16089820861816406, -0.15516281127929688, -0.1494274139404297, -0.1436920166015625, -0.1379566192626953, -0.13222122192382812, -0.12648582458496094, -0.12075042724609375, -0.11501502990722656, -0.10927963256835938, -0.10354423522949219, -0.097808837890625, -0.09207344055175781, -0.08633804321289062, -0.08060264587402344, -0.07486724853515625, -0.06913185119628906, -0.06339645385742188, -0.05766105651855469, -0.0519256591796875, -0.04619026184082031, -0.040454864501953125, -0.03471946716308594, -0.02898406982421875, -0.023248672485351562, -0.017513275146484375, -0.011777877807617188, -0.00604248046875, -0.0003070831298828125, 0.005428314208984375, 0.011163711547851562, 0.01689910888671875, 0.022634506225585938, 0.028369903564453125, 0.03410530090332031, 0.0398406982421875, 0.04557609558105469, 0.051311492919921875, 0.05704689025878906, 0.06278228759765625, 0.06851768493652344, 0.07425308227539062, 0.07998847961425781, 0.085723876953125, 0.09145927429199219, 0.09719467163085938, 0.10293006896972656, 0.10866546630859375, 0.11440086364746094, 0.12013626098632812, 0.1258716583251953, 0.1316070556640625, 0.1373424530029297, 0.14307785034179688, 0.14881324768066406, 0.15454864501953125, 0.16028404235839844, 0.16601943969726562, 0.1717548370361328, 0.177490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 3.0, 13.0, 10.0, 17.0, 20.0, 32.0, 23.0, 22.0, 26.0, 44.0, 51.0, 72.0, 92.0, 81.0, 86.0, 78.0, 59.0, 49.0, 35.0, 30.0, 23.0, 16.0, 17.0, 17.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.792213439941406e-05, -4.640687257051468e-05, -4.4891610741615295e-05, -4.337634891271591e-05, -4.186108708381653e-05, -4.0345825254917145e-05, -3.883056342601776e-05, -3.731530159711838e-05, -3.5800039768218994e-05, -3.428477793931961e-05, -3.276951611042023e-05, -3.1254254281520844e-05, -2.973899245262146e-05, -2.8223730623722076e-05, -2.6708468794822693e-05, -2.519320696592331e-05, -2.3677945137023926e-05, -2.2162683308124542e-05, -2.064742147922516e-05, -1.9132159650325775e-05, -1.761689782142639e-05, -1.6101635992527008e-05, -1.4586374163627625e-05, -1.3071112334728241e-05, -1.1555850505828857e-05, -1.0040588676929474e-05, -8.52532684803009e-06, -7.010065019130707e-06, -5.494803190231323e-06, -3.97954136133194e-06, -2.464279532432556e-06, -9.490177035331726e-07, 5.662441253662109e-07, 2.0815059542655945e-06, 3.596767783164978e-06, 5.1120296120643616e-06, 6.627291440963745e-06, 8.142553269863129e-06, 9.657815098762512e-06, 1.1173076927661896e-05, 1.268833875656128e-05, 1.4203600585460663e-05, 1.5718862414360046e-05, 1.723412424325943e-05, 1.8749386072158813e-05, 2.0264647901058197e-05, 2.177990972995758e-05, 2.3295171558856964e-05, 2.4810433387756348e-05, 2.632569521665573e-05, 2.7840957045555115e-05, 2.9356218874454498e-05, 3.087148070335388e-05, 3.2386742532253265e-05, 3.390200436115265e-05, 3.541726619005203e-05, 3.6932528018951416e-05, 3.84477898478508e-05, 3.996305167675018e-05, 4.147831350564957e-05, 4.299357533454895e-05, 4.4508837163448334e-05, 4.602409899234772e-05, 4.75393608212471e-05, 4.9054622650146484e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 12.0, 7.0, 14.0, 15.0, 34.0, 49.0, 75.0, 148.0, 251.0, 530.0, 1123.0, 2807.0, 9899.0, 67518.0, 765898.0, 174414.0, 18267.0, 4308.0, 1622.0, 728.0, 358.0, 199.0, 106.0, 73.0, 46.0, 14.0, 6.0, 12.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.274658203125, -0.26696205139160156, -0.2592658996582031, -0.2515697479248047, -0.24387359619140625, -0.2361774444580078, -0.22848129272460938, -0.22078514099121094, -0.2130889892578125, -0.20539283752441406, -0.19769668579101562, -0.1900005340576172, -0.18230438232421875, -0.1746082305908203, -0.16691207885742188, -0.15921592712402344, -0.151519775390625, -0.14382362365722656, -0.13612747192382812, -0.1284313201904297, -0.12073516845703125, -0.11303901672363281, -0.10534286499023438, -0.09764671325683594, -0.0899505615234375, -0.08225440979003906, -0.07455825805664062, -0.06686210632324219, -0.05916595458984375, -0.05146980285644531, -0.043773651123046875, -0.03607749938964844, -0.02838134765625, -0.020685195922851562, -0.012989044189453125, -0.0052928924560546875, 0.00240325927734375, 0.010099411010742188, 0.017795562744140625, 0.025491714477539062, 0.0331878662109375, 0.04088401794433594, 0.048580169677734375, 0.05627632141113281, 0.06397247314453125, 0.07166862487792969, 0.07936477661132812, 0.08706092834472656, 0.094757080078125, 0.10245323181152344, 0.11014938354492188, 0.11784553527832031, 0.12554168701171875, 0.1332378387451172, 0.14093399047851562, 0.14863014221191406, 0.1563262939453125, 0.16402244567871094, 0.17171859741210938, 0.1794147491455078, 0.18711090087890625, 0.1948070526123047, 0.20250320434570312, 0.21019935607910156, 0.2178955078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 11.0, 15.0, 13.0, 16.0, 24.0, 37.0, 52.0, 49.0, 94.0, 96.0, 107.0, 92.0, 82.0, 58.0, 48.0, 54.0, 28.0, 34.0, 28.0, 13.0, 15.0, 5.0, 11.0, 7.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24586868286132812, -0.23954010009765625, -0.23321151733398438, -0.2268829345703125, -0.22055435180664062, -0.21422576904296875, -0.20789718627929688, -0.201568603515625, -0.19524002075195312, -0.18891143798828125, -0.18258285522460938, -0.1762542724609375, -0.16992568969726562, -0.16359710693359375, -0.15726852416992188, -0.15093994140625, -0.14461135864257812, -0.13828277587890625, -0.13195419311523438, -0.1256256103515625, -0.11929702758789062, -0.11296844482421875, -0.10663986206054688, -0.100311279296875, -0.09398269653320312, -0.08765411376953125, -0.08132553100585938, -0.0749969482421875, -0.06866836547851562, -0.06233978271484375, -0.056011199951171875, -0.0496826171875, -0.043354034423828125, -0.03702545166015625, -0.030696868896484375, -0.0243682861328125, -0.018039703369140625, -0.01171112060546875, -0.005382537841796875, 0.000946044921875, 0.007274627685546875, 0.01360321044921875, 0.019931793212890625, 0.0262603759765625, 0.032588958740234375, 0.03891754150390625, 0.045246124267578125, 0.05157470703125, 0.057903289794921875, 0.06423187255859375, 0.07056045532226562, 0.0768890380859375, 0.08321762084960938, 0.08954620361328125, 0.09587478637695312, 0.102203369140625, 0.10853195190429688, 0.11486053466796875, 0.12118911743164062, 0.1275177001953125, 0.13384628295898438, 0.14017486572265625, 0.14650344848632812, 0.15283203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 11.0, 54.0, 93.0, 216.0, 302.0, 139.0, 82.0, 34.0, 11.0, 14.0, 5.0, 3.0, 2.0, 1.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9421443939208984, -3.7858171463012695, -3.6294896602630615, -3.4731624126434326, -3.3168351650238037, -3.1605076789855957, -3.004180431365967, -2.847853183746338, -2.691525936126709, -2.53519868850708, -2.378871202468872, -2.222543954849243, -2.0662167072296143, -1.9098893404006958, -1.7535619735717773, -1.5972347259521484, -1.4409072399139404, -1.284579873085022, -1.128252625465393, -0.9719252586364746, -0.8155979514122009, -0.6592706441879272, -0.5029432773590088, -0.3466160297393799, -0.19028866291046143, -0.03396134078502655, 0.12236598134040833, 0.2786933183670044, 0.4350206255912781, 0.5913479328155518, 0.7476752996444702, 0.9040025472640991, 1.0603299140930176, 1.216657280921936, 1.372984528541565, 1.5293118953704834, 1.6856391429901123, 1.8419665098190308, 1.9982938766479492, 2.154621124267578, 2.310948371887207, 2.467275619506836, 2.623603105545044, 2.779930353164673, 2.9362576007843018, 3.0925850868225098, 3.2489123344421387, 3.4052395820617676, 3.5615670680999756, 3.7178943157196045, 3.8742218017578125, 4.030549049377441, 4.18687629699707, 4.343203544616699, 4.499530792236328, 4.655858039855957, 4.812185764312744, 4.968513011932373, 5.124840259552002, 5.281167984008789, 5.437495231628418, 5.593822479248047, 5.750149726867676, 5.906476974487305, 6.062804222106934]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 21.0, 17.0, 19.0, 22.0, 20.0, 21.0, 21.0, 31.0, 21.0, 23.0, 36.0, 42.0, 61.0, 66.0, 72.0, 67.0, 52.0, 38.0, 29.0, 29.0, 28.0, 33.0, 30.0, 22.0, 16.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 7.0, 7.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.110687255859375, -2.04278564453125, -1.9748839139938354, -1.906982183456421, -1.839080572128296, -1.7711788415908813, -1.7032771110534668, -1.6353754997253418, -1.5674738883972168, -1.4995721578598022, -1.4316705465316772, -1.3637688159942627, -1.2958672046661377, -1.2279654741287231, -1.1600637435913086, -1.0921621322631836, -1.024260401725769, -0.9563587307929993, -0.8884570598602295, -0.8205553293228149, -0.7526537179946899, -0.6847519874572754, -0.6168503165245056, -0.5489486455917358, -0.48104697465896606, -0.4131453037261963, -0.3452436327934265, -0.27734193205833435, -0.20944026112556458, -0.1415385901927948, -0.07363688945770264, -0.005735218524932861, 0.062166452407836914, 0.1300681233406067, 0.19796980917453766, 0.26587149500846863, 0.3337731659412384, 0.4016748368740082, 0.46957653760910034, 0.5374782085418701, 0.6053798794746399, 0.6732815504074097, 0.7411832213401794, 0.8090848922729492, 0.8769866228103638, 0.9448882341384888, 1.0127899646759033, 1.0806915760040283, 1.1485933065414429, 1.2164950370788574, 1.2843966484069824, 1.352298378944397, 1.420199990272522, 1.4881017208099365, 1.5560033321380615, 1.623905062675476, 1.6918067932128906, 1.7597085237503052, 1.8276101350784302, 1.8955118656158447, 1.9634134769439697, 2.0313150882720947, 2.099216938018799, 2.167118549346924, 2.235020160675049]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 6.0, 2.0, 6.0, 15.0, 12.0, 18.0, 22.0, 38.0, 50.0, 77.0, 111.0, 155.0, 256.0, 358.0, 487.0, 786.0, 1268.0, 2067.0, 3427.0, 6115.0, 11941.0, 26535.0, 71113.0, 251183.0, 1056670.0, 1943632.0, 586790.0, 145980.0, 45999.0, 18379.0, 8929.0, 4590.0, 2716.0, 1604.0, 966.0, 627.0, 436.0, 286.0, 188.0, 147.0, 87.0, 62.0, 42.0, 33.0, 27.0, 16.0, 7.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0], "bins": [-0.15380859375, -0.14957046508789062, -0.14533233642578125, -0.14109420776367188, -0.1368560791015625, -0.13261795043945312, -0.12837982177734375, -0.12414169311523438, -0.119903564453125, -0.11566543579101562, -0.11142730712890625, -0.10718917846679688, -0.1029510498046875, -0.09871292114257812, -0.09447479248046875, -0.09023666381835938, -0.08599853515625, -0.08176040649414062, -0.07752227783203125, -0.07328414916992188, -0.0690460205078125, -0.06480789184570312, -0.06056976318359375, -0.056331634521484375, -0.052093505859375, -0.047855377197265625, -0.04361724853515625, -0.039379119873046875, -0.0351409912109375, -0.030902862548828125, -0.02666473388671875, -0.022426605224609375, -0.0181884765625, -0.013950347900390625, -0.00971221923828125, -0.005474090576171875, -0.0012359619140625, 0.003002166748046875, 0.00724029541015625, 0.011478424072265625, 0.015716552734375, 0.019954681396484375, 0.02419281005859375, 0.028430938720703125, 0.0326690673828125, 0.036907196044921875, 0.04114532470703125, 0.045383453369140625, 0.04962158203125, 0.053859710693359375, 0.05809783935546875, 0.062335968017578125, 0.0665740966796875, 0.07081222534179688, 0.07505035400390625, 0.07928848266601562, 0.083526611328125, 0.08776473999023438, 0.09200286865234375, 0.09624099731445312, 0.1004791259765625, 0.10471725463867188, 0.10895538330078125, 0.11319351196289062, 0.117431640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 9.0, 3.0, 10.0, 12.0, 16.0, 12.0, 11.0, 22.0, 17.0, 30.0, 36.0, 40.0, 45.0, 46.0, 55.0, 75.0, 56.0, 59.0, 72.0, 47.0, 54.0, 39.0, 36.0, 33.0, 33.0, 24.0, 29.0, 16.0, 13.0, 13.0, 15.0, 13.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11724853515625, -0.11259746551513672, -0.10794639587402344, -0.10329532623291016, -0.09864425659179688, -0.0939931869506836, -0.08934211730957031, -0.08469104766845703, -0.08003997802734375, -0.07538890838623047, -0.07073783874511719, -0.0660867691040039, -0.061435699462890625, -0.056784629821777344, -0.05213356018066406, -0.04748249053955078, -0.0428314208984375, -0.03818035125732422, -0.03352928161621094, -0.028878211975097656, -0.024227142333984375, -0.019576072692871094, -0.014925003051757812, -0.010273933410644531, -0.00562286376953125, -0.0009717941284179688, 0.0036792755126953125, 0.008330345153808594, 0.012981414794921875, 0.017632484436035156, 0.022283554077148438, 0.02693462371826172, 0.031585693359375, 0.03623676300048828, 0.04088783264160156, 0.045538902282714844, 0.050189971923828125, 0.054841041564941406, 0.05949211120605469, 0.06414318084716797, 0.06879425048828125, 0.07344532012939453, 0.07809638977050781, 0.0827474594116211, 0.08739852905273438, 0.09204959869384766, 0.09670066833496094, 0.10135173797607422, 0.1060028076171875, 0.11065387725830078, 0.11530494689941406, 0.11995601654052734, 0.12460708618164062, 0.1292581558227539, 0.1339092254638672, 0.13856029510498047, 0.14321136474609375, 0.14786243438720703, 0.1525135040283203, 0.1571645736694336, 0.16181564331054688, 0.16646671295166016, 0.17111778259277344, 0.17576885223388672, 0.180419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 13.0, 11.0, 26.0, 52.0, 75.0, 153.0, 294.0, 909.0, 3242.0, 16298.0, 193329.0, 3755111.0, 204587.0, 15798.0, 2954.0, 821.0, 307.0, 121.0, 67.0, 44.0, 23.0, 18.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.58984375, -0.57275390625, -0.5556640625, -0.53857421875, -0.521484375, -0.50439453125, -0.4873046875, -0.47021484375, -0.453125, -0.43603515625, -0.4189453125, -0.40185546875, -0.384765625, -0.36767578125, -0.3505859375, -0.33349609375, -0.31640625, -0.29931640625, -0.2822265625, -0.26513671875, -0.248046875, -0.23095703125, -0.2138671875, -0.19677734375, -0.1796875, -0.16259765625, -0.1455078125, -0.12841796875, -0.111328125, -0.09423828125, -0.0771484375, -0.06005859375, -0.04296875, -0.02587890625, -0.0087890625, 0.00830078125, 0.025390625, 0.04248046875, 0.0595703125, 0.07666015625, 0.09375, 0.11083984375, 0.1279296875, 0.14501953125, 0.162109375, 0.17919921875, 0.1962890625, 0.21337890625, 0.23046875, 0.24755859375, 0.2646484375, 0.28173828125, 0.298828125, 0.31591796875, 0.3330078125, 0.35009765625, 0.3671875, 0.38427734375, 0.4013671875, 0.41845703125, 0.435546875, 0.45263671875, 0.4697265625, 0.48681640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 3.0, 11.0, 6.0, 9.0, 9.0, 20.0, 27.0, 29.0, 38.0, 39.0, 70.0, 118.0, 154.0, 224.0, 358.0, 562.0, 682.0, 558.0, 400.0, 236.0, 165.0, 89.0, 80.0, 50.0, 28.0, 30.0, 17.0, 9.0, 15.0, 8.0, 11.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.26811981201171875, -0.2584075927734375, -0.24869537353515625, -0.238983154296875, -0.22927093505859375, -0.2195587158203125, -0.20984649658203125, -0.20013427734375, -0.19042205810546875, -0.1807098388671875, -0.17099761962890625, -0.161285400390625, -0.15157318115234375, -0.1418609619140625, -0.13214874267578125, -0.1224365234375, -0.11272430419921875, -0.1030120849609375, -0.09329986572265625, -0.083587646484375, -0.07387542724609375, -0.0641632080078125, -0.05445098876953125, -0.04473876953125, -0.03502655029296875, -0.0253143310546875, -0.01560211181640625, -0.005889892578125, 0.00382232666015625, 0.0135345458984375, 0.02324676513671875, 0.032958984375, 0.04267120361328125, 0.0523834228515625, 0.06209564208984375, 0.071807861328125, 0.08152008056640625, 0.0912322998046875, 0.10094451904296875, 0.11065673828125, 0.12036895751953125, 0.1300811767578125, 0.13979339599609375, 0.149505615234375, 0.15921783447265625, 0.1689300537109375, 0.17864227294921875, 0.1883544921875, 0.19806671142578125, 0.2077789306640625, 0.21749114990234375, 0.227203369140625, 0.23691558837890625, 0.2466278076171875, 0.25634002685546875, 0.26605224609375, 0.27576446533203125, 0.2854766845703125, 0.29518890380859375, 0.304901123046875, 0.31461334228515625, 0.3243255615234375, 0.33403778076171875, 0.34375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 12.0, 29.0, 51.0, 129.0, 235.0, 273.0, 154.0, 60.0, 22.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.281395435333252, -7.127960205078125, -6.97452449798584, -6.821089267730713, -6.667653560638428, -6.514218330383301, -6.360782623291016, -6.207347393035889, -6.053912162780762, -5.900476932525635, -5.74704122543335, -5.593605995178223, -5.4401702880859375, -5.2867350578308105, -5.133299350738525, -4.979864120483398, -4.826428413391113, -4.672993183135986, -4.519557476043701, -4.366122245788574, -4.212686538696289, -4.059251308441162, -3.905815839767456, -3.75238037109375, -3.598944902420044, -3.445509433746338, -3.292073965072632, -3.138638496398926, -2.985203266143799, -2.8317675590515137, -2.6783323287963867, -2.5248968601226807, -2.371461868286133, -2.2180263996124268, -2.0645909309387207, -1.9111555814743042, -1.7577201128005981, -1.604284644126892, -1.4508492946624756, -1.2974138259887695, -1.1439783573150635, -0.9905428886413574, -0.8371074795722961, -0.6836720705032349, -0.5302366018295288, -0.37680113315582275, -0.22336572408676147, -0.0699303150177002, 0.08350515365600586, 0.23694059252738953, 0.3903760313987732, 0.5438114404678345, 0.6972469091415405, 0.8506823778152466, 1.004117727279663, 1.1575531959533691, 1.3109886646270752, 1.4644241333007812, 1.6178596019744873, 1.7712949514389038, 1.9247304201126099, 2.0781660079956055, 2.2316012382507324, 2.3850367069244385, 2.5384721755981445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 10.0, 16.0, 18.0, 10.0, 18.0, 19.0, 25.0, 30.0, 31.0, 34.0, 39.0, 42.0, 37.0, 39.0, 36.0, 48.0, 45.0, 30.0, 46.0, 35.0, 47.0, 39.0, 32.0, 30.0, 24.0, 20.0, 31.0, 20.0, 26.0, 18.0, 22.0, 12.0, 16.0, 7.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2125723361968994, -1.1690690517425537, -1.1255658864974976, -1.0820626020431519, -1.0385594367980957, -0.99505615234375, -0.9515529274940491, -0.9080497026443481, -0.8645464777946472, -0.8210432529449463, -0.7775400280952454, -0.7340368032455444, -0.6905335187911987, -0.6470303535461426, -0.6035270690917969, -0.560023844242096, -0.516520619392395, -0.4730173945426941, -0.42951416969299316, -0.38601091504096985, -0.3425076901912689, -0.299004465341568, -0.2555012106895447, -0.21199798583984375, -0.16849476099014282, -0.1249915286898613, -0.08148829638957977, -0.03798505663871765, 0.005518168210983276, 0.049021393060684204, 0.09252464771270752, 0.13602787256240845, 0.17953097820281982, 0.22303420305252075, 0.2665374279022217, 0.310040682554245, 0.3535439074039459, 0.39704713225364685, 0.44055038690567017, 0.4840536117553711, 0.527556836605072, 0.571060061454773, 0.6145632863044739, 0.6580665111541748, 0.7015697956085205, 0.7450729608535767, 0.7885762453079224, 0.8320794701576233, 0.8755826950073242, 0.9190859198570251, 0.9625891447067261, 1.0060924291610718, 1.049595594406128, 1.0930988788604736, 1.1366021633148193, 1.1801053285598755, 1.2236084938049316, 1.2671117782592773, 1.3106149435043335, 1.3541182279586792, 1.3976213932037354, 1.441124677658081, 1.4846279621124268, 1.528131127357483, 1.5716344118118286]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 12.0, 7.0, 10.0, 25.0, 39.0, 39.0, 72.0, 100.0, 164.0, 265.0, 371.0, 725.0, 1342.0, 2562.0, 5363.0, 12978.0, 34533.0, 112433.0, 351184.0, 353834.0, 113225.0, 35234.0, 12751.0, 5577.0, 2580.0, 1275.0, 740.0, 418.0, 254.0, 150.0, 95.0, 70.0, 44.0, 17.0, 22.0, 21.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17444801330566406, -0.16798782348632812, -0.1615276336669922, -0.15506744384765625, -0.1486072540283203, -0.14214706420898438, -0.13568687438964844, -0.1292266845703125, -0.12276649475097656, -0.11630630493164062, -0.10984611511230469, -0.10338592529296875, -0.09692573547363281, -0.09046554565429688, -0.08400535583496094, -0.077545166015625, -0.07108497619628906, -0.06462478637695312, -0.05816459655761719, -0.05170440673828125, -0.04524421691894531, -0.038784027099609375, -0.03232383728027344, -0.0258636474609375, -0.019403457641601562, -0.012943267822265625, -0.0064830780029296875, -2.288818359375e-05, 0.0064373016357421875, 0.012897491455078125, 0.019357681274414062, 0.02581787109375, 0.03227806091308594, 0.038738250732421875, 0.04519844055175781, 0.05165863037109375, 0.05811882019042969, 0.06457901000976562, 0.07103919982910156, 0.0774993896484375, 0.08395957946777344, 0.09041976928710938, 0.09687995910644531, 0.10334014892578125, 0.10980033874511719, 0.11626052856445312, 0.12272071838378906, 0.129180908203125, 0.13564109802246094, 0.14210128784179688, 0.1485614776611328, 0.15502166748046875, 0.1614818572998047, 0.16794204711914062, 0.17440223693847656, 0.1808624267578125, 0.18732261657714844, 0.19378280639648438, 0.2002429962158203, 0.20670318603515625, 0.2131633758544922, 0.21962356567382812, 0.22608375549316406, 0.2325439453125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 7.0, 10.0, 17.0, 23.0, 15.0, 29.0, 21.0, 42.0, 48.0, 29.0, 45.0, 52.0, 58.0, 70.0, 52.0, 51.0, 46.0, 44.0, 36.0, 33.0, 50.0, 35.0, 30.0, 29.0, 23.0, 24.0, 17.0, 13.0, 12.0, 8.0, 6.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12353515625, -0.11874961853027344, -0.11396408081054688, -0.10917854309082031, -0.10439300537109375, -0.09960746765136719, -0.09482192993164062, -0.09003639221191406, -0.0852508544921875, -0.08046531677246094, -0.07567977905273438, -0.07089424133300781, -0.06610870361328125, -0.06132316589355469, -0.056537628173828125, -0.05175209045410156, -0.046966552734375, -0.04218101501464844, -0.037395477294921875, -0.03260993957519531, -0.02782440185546875, -0.023038864135742188, -0.018253326416015625, -0.013467788696289062, -0.0086822509765625, -0.0038967132568359375, 0.000888824462890625, 0.0056743621826171875, 0.01045989990234375, 0.015245437622070312, 0.020030975341796875, 0.024816513061523438, 0.02960205078125, 0.03438758850097656, 0.039173126220703125, 0.04395866394042969, 0.04874420166015625, 0.05352973937988281, 0.058315277099609375, 0.06310081481933594, 0.0678863525390625, 0.07267189025878906, 0.07745742797851562, 0.08224296569824219, 0.08702850341796875, 0.09181404113769531, 0.09659957885742188, 0.10138511657714844, 0.106170654296875, 0.11095619201660156, 0.11574172973632812, 0.12052726745605469, 0.12531280517578125, 0.1300983428955078, 0.13488388061523438, 0.13966941833496094, 0.1444549560546875, 0.14924049377441406, 0.15402603149414062, 0.1588115692138672, 0.16359710693359375, 0.1683826446533203, 0.17316818237304688, 0.17795372009277344, 0.1827392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 10.0, 11.0, 7.0, 10.0, 15.0, 19.0, 32.0, 41.0, 52.0, 102.0, 180.0, 232.0, 474.0, 916.0, 2150.0, 6616.0, 27152.0, 191785.0, 701539.0, 93598.0, 15810.0, 4303.0, 1684.0, 796.0, 379.0, 197.0, 139.0, 81.0, 44.0, 42.0, 25.0, 25.0, 17.0, 18.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3359565734863281, -0.32523345947265625, -0.3145103454589844, -0.3037872314453125, -0.2930641174316406, -0.28234100341796875, -0.2716178894042969, -0.260894775390625, -0.2501716613769531, -0.23944854736328125, -0.22872543334960938, -0.2180023193359375, -0.20727920532226562, -0.19655609130859375, -0.18583297729492188, -0.17510986328125, -0.16438674926757812, -0.15366363525390625, -0.14294052124023438, -0.1322174072265625, -0.12149429321289062, -0.11077117919921875, -0.10004806518554688, -0.089324951171875, -0.07860183715820312, -0.06787872314453125, -0.057155609130859375, -0.0464324951171875, -0.035709381103515625, -0.02498626708984375, -0.014263153076171875, -0.0035400390625, 0.007183074951171875, 0.01790618896484375, 0.028629302978515625, 0.0393524169921875, 0.050075531005859375, 0.06079864501953125, 0.07152175903320312, 0.082244873046875, 0.09296798706054688, 0.10369110107421875, 0.11441421508789062, 0.1251373291015625, 0.13586044311523438, 0.14658355712890625, 0.15730667114257812, 0.16802978515625, 0.17875289916992188, 0.18947601318359375, 0.20019912719726562, 0.2109222412109375, 0.22164535522460938, 0.23236846923828125, 0.24309158325195312, 0.253814697265625, 0.2645378112792969, 0.27526092529296875, 0.2859840393066406, 0.2967071533203125, 0.3074302673339844, 0.31815338134765625, 0.3288764953613281, 0.339599609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 5.0, 12.0, 17.0, 23.0, 32.0, 36.0, 55.0, 66.0, 53.0, 64.0, 71.0, 71.0, 56.0, 65.0, 56.0, 48.0, 57.0, 40.0, 39.0, 25.0, 31.0, 16.0, 11.0, 8.0, 13.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6650238037109375, -0.642059326171875, -0.6190948486328125, -0.59613037109375, -0.5731658935546875, -0.550201416015625, -0.5272369384765625, -0.5042724609375, -0.4813079833984375, -0.458343505859375, -0.4353790283203125, -0.41241455078125, -0.3894500732421875, -0.366485595703125, -0.3435211181640625, -0.320556640625, -0.2975921630859375, -0.274627685546875, -0.2516632080078125, -0.22869873046875, -0.2057342529296875, -0.182769775390625, -0.1598052978515625, -0.1368408203125, -0.1138763427734375, -0.090911865234375, -0.0679473876953125, -0.04498291015625, -0.0220184326171875, 0.000946044921875, 0.0239105224609375, 0.046875, 0.0698394775390625, 0.092803955078125, 0.1157684326171875, 0.13873291015625, 0.1616973876953125, 0.184661865234375, 0.2076263427734375, 0.2305908203125, 0.2535552978515625, 0.276519775390625, 0.2994842529296875, 0.32244873046875, 0.3454132080078125, 0.368377685546875, 0.3913421630859375, 0.414306640625, 0.4372711181640625, 0.460235595703125, 0.4832000732421875, 0.50616455078125, 0.5291290283203125, 0.552093505859375, 0.5750579833984375, 0.5980224609375, 0.6209869384765625, 0.643951416015625, 0.6669158935546875, 0.68988037109375, 0.7128448486328125, 0.735809326171875, 0.7587738037109375, 0.78173828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 17.0, 10.0, 25.0, 35.0, 54.0, 92.0, 183.0, 309.0, 589.0, 1342.0, 3235.0, 9808.0, 39119.0, 229742.0, 649985.0, 86234.0, 18584.0, 5380.0, 1969.0, 894.0, 375.0, 237.0, 127.0, 75.0, 44.0, 23.0, 22.0, 16.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.1531085968017578, -0.14850234985351562, -0.14389610290527344, -0.13928985595703125, -0.13468360900878906, -0.13007736206054688, -0.1254711151123047, -0.1208648681640625, -0.11625862121582031, -0.11165237426757812, -0.10704612731933594, -0.10243988037109375, -0.09783363342285156, -0.09322738647460938, -0.08862113952636719, -0.084014892578125, -0.07940864562988281, -0.07480239868164062, -0.07019615173339844, -0.06558990478515625, -0.06098365783691406, -0.056377410888671875, -0.05177116394042969, -0.0471649169921875, -0.04255867004394531, -0.037952423095703125, -0.03334617614746094, -0.02873992919921875, -0.024133682250976562, -0.019527435302734375, -0.014921188354492188, -0.01031494140625, -0.0057086944580078125, -0.001102447509765625, 0.0035037994384765625, 0.00811004638671875, 0.012716293334960938, 0.017322540283203125, 0.021928787231445312, 0.0265350341796875, 0.031141281127929688, 0.035747528076171875, 0.04035377502441406, 0.04496002197265625, 0.04956626892089844, 0.054172515869140625, 0.05877876281738281, 0.063385009765625, 0.06799125671386719, 0.07259750366210938, 0.07720375061035156, 0.08180999755859375, 0.08641624450683594, 0.09102249145507812, 0.09562873840332031, 0.1002349853515625, 0.10484123229980469, 0.10944747924804688, 0.11405372619628906, 0.11865997314453125, 0.12326622009277344, 0.12787246704101562, 0.1324787139892578, 0.1370849609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 7.0, 8.0, 12.0, 7.0, 15.0, 23.0, 23.0, 42.0, 55.0, 67.0, 102.0, 104.0, 103.0, 103.0, 74.0, 74.0, 47.0, 28.0, 25.0, 17.0, 22.0, 16.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.13060188293457e-05, -3.999192267656326e-05, -3.867782652378082e-05, -3.736373037099838e-05, -3.604963421821594e-05, -3.47355380654335e-05, -3.342144191265106e-05, -3.210734575986862e-05, -3.079324960708618e-05, -2.947915345430374e-05, -2.81650573015213e-05, -2.685096114873886e-05, -2.553686499595642e-05, -2.422276884317398e-05, -2.290867269039154e-05, -2.15945765376091e-05, -2.028048038482666e-05, -1.896638423204422e-05, -1.765228807926178e-05, -1.633819192647934e-05, -1.50240957736969e-05, -1.370999962091446e-05, -1.2395903468132019e-05, -1.1081807315349579e-05, -9.767711162567139e-06, -8.453615009784698e-06, -7.139518857002258e-06, -5.825422704219818e-06, -4.511326551437378e-06, -3.1972303986549377e-06, -1.8831342458724976e-06, -5.690380930900574e-07, 7.450580596923828e-07, 2.059154212474823e-06, 3.373250365257263e-06, 4.687346518039703e-06, 6.0014426708221436e-06, 7.315538823604584e-06, 8.629634976387024e-06, 9.943731129169464e-06, 1.1257827281951904e-05, 1.2571923434734344e-05, 1.3886019587516785e-05, 1.5200115740299225e-05, 1.6514211893081665e-05, 1.7828308045864105e-05, 1.9142404198646545e-05, 2.0456500351428986e-05, 2.1770596504211426e-05, 2.3084692656993866e-05, 2.4398788809776306e-05, 2.5712884962558746e-05, 2.7026981115341187e-05, 2.8341077268123627e-05, 2.9655173420906067e-05, 3.096926957368851e-05, 3.228336572647095e-05, 3.359746187925339e-05, 3.491155803203583e-05, 3.622565418481827e-05, 3.753975033760071e-05, 3.885384649038315e-05, 4.016794264316559e-05, 4.148203879594803e-05, 4.279613494873047e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 9.0, 20.0, 27.0, 38.0, 58.0, 102.0, 186.0, 327.0, 661.0, 1336.0, 3280.0, 10837.0, 54130.0, 529903.0, 381067.0, 50328.0, 10320.0, 3151.0, 1315.0, 625.0, 323.0, 197.0, 114.0, 69.0, 36.0, 28.0, 13.0, 12.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.1150503158569336, -0.11004447937011719, -0.10503864288330078, -0.10003280639648438, -0.09502696990966797, -0.09002113342285156, -0.08501529693603516, -0.08000946044921875, -0.07500362396240234, -0.06999778747558594, -0.06499195098876953, -0.059986114501953125, -0.05498027801513672, -0.04997444152832031, -0.044968605041503906, -0.0399627685546875, -0.034956932067871094, -0.029951095581054688, -0.02494525909423828, -0.019939422607421875, -0.014933586120605469, -0.009927749633789062, -0.004921913146972656, 8.392333984375e-05, 0.005089759826660156, 0.010095596313476562, 0.015101432800292969, 0.020107269287109375, 0.02511310577392578, 0.030118942260742188, 0.035124778747558594, 0.040130615234375, 0.045136451721191406, 0.05014228820800781, 0.05514812469482422, 0.060153961181640625, 0.06515979766845703, 0.07016563415527344, 0.07517147064208984, 0.08017730712890625, 0.08518314361572266, 0.09018898010253906, 0.09519481658935547, 0.10020065307617188, 0.10520648956298828, 0.11021232604980469, 0.1152181625366211, 0.1202239990234375, 0.1252298355102539, 0.1302356719970703, 0.13524150848388672, 0.14024734497070312, 0.14525318145751953, 0.15025901794433594, 0.15526485443115234, 0.16027069091796875, 0.16527652740478516, 0.17028236389160156, 0.17528820037841797, 0.18029403686523438, 0.18529987335205078, 0.1903057098388672, 0.1953115463256836, 0.2003173828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 18.0, 28.0, 43.0, 62.0, 77.0, 90.0, 102.0, 106.0, 97.0, 76.0, 69.0, 52.0, 46.0, 27.0, 20.0, 13.0, 12.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13680076599121094, -0.13138961791992188, -0.1259784698486328, -0.12056732177734375, -0.11515617370605469, -0.10974502563476562, -0.10433387756347656, -0.0989227294921875, -0.09351158142089844, -0.08810043334960938, -0.08268928527832031, -0.07727813720703125, -0.07186698913574219, -0.06645584106445312, -0.06104469299316406, -0.055633544921875, -0.05022239685058594, -0.044811248779296875, -0.03940010070800781, -0.03398895263671875, -0.028577804565429688, -0.023166656494140625, -0.017755508422851562, -0.0123443603515625, -0.0069332122802734375, -0.001522064208984375, 0.0038890838623046875, 0.00930023193359375, 0.014711380004882812, 0.020122528076171875, 0.025533676147460938, 0.03094482421875, 0.03635597229003906, 0.041767120361328125, 0.04717826843261719, 0.05258941650390625, 0.05800056457519531, 0.06341171264648438, 0.06882286071777344, 0.0742340087890625, 0.07964515686035156, 0.08505630493164062, 0.09046745300292969, 0.09587860107421875, 0.10128974914550781, 0.10670089721679688, 0.11211204528808594, 0.117523193359375, 0.12293434143066406, 0.12834548950195312, 0.1337566375732422, 0.13916778564453125, 0.1445789337158203, 0.14999008178710938, 0.15540122985839844, 0.1608123779296875, 0.16622352600097656, 0.17163467407226562, 0.1770458221435547, 0.18245697021484375, 0.1878681182861328, 0.19327926635742188, 0.19869041442871094, 0.2041015625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 15.0, 53.0, 138.0, 368.0, 226.0, 98.0, 42.0, 22.0, 11.0, 3.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.138543128967285, -4.003957271575928, -3.869371175765991, -3.7347850799560547, -3.6001992225646973, -3.4656131267547607, -3.331027030944824, -3.196441173553467, -3.0618550777435303, -2.9272689819335938, -2.7926831245422363, -2.6580970287323, -2.5235109329223633, -2.388925075531006, -2.2543389797210693, -2.119752883911133, -1.9851670265197754, -1.8505810499191284, -1.7159950733184814, -1.581408977508545, -1.446823000907898, -1.312237024307251, -1.1776509284973145, -1.0430649518966675, -0.9084789752960205, -0.7738929986953735, -0.6393069624900818, -0.50472092628479, -0.37013494968414307, -0.2355489730834961, -0.10096293687820435, 0.0336230993270874, 0.16820955276489258, 0.30279555916786194, 0.4373815655708313, 0.571967601776123, 0.70655357837677, 0.841139554977417, 0.9757255911827087, 1.1103116273880005, 1.2448976039886475, 1.3794835805892944, 1.5140695571899414, 1.648655652999878, 1.783241629600525, 1.9178276062011719, 2.0524137020111084, 2.186999797821045, 2.3215856552124023, 2.456171751022339, 2.5907576084136963, 2.725343704223633, 2.8599295616149902, 2.9945156574249268, 3.1291017532348633, 3.2636876106262207, 3.3982737064361572, 3.5328598022460938, 3.667445659637451, 3.8020317554473877, 3.936617851257324, 4.071203708648682, 4.205789566040039, 4.340375900268555, 4.474961757659912]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 2.0, 7.0, 11.0, 9.0, 6.0, 18.0, 18.0, 6.0, 22.0, 18.0, 15.0, 18.0, 21.0, 25.0, 27.0, 34.0, 41.0, 58.0, 57.0, 69.0, 82.0, 69.0, 38.0, 29.0, 41.0, 23.0, 36.0, 27.0, 17.0, 20.0, 25.0, 13.0, 8.0, 12.0, 14.0, 10.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6017582416534424, -1.5445072650909424, -1.4872561693191528, -1.4300051927566528, -1.3727542161941528, -1.3155031204223633, -1.2582521438598633, -1.2010011672973633, -1.1437501907348633, -1.0864992141723633, -1.0292481184005737, -0.9719971418380737, -0.9147461652755737, -0.857495129108429, -0.8002440929412842, -0.7429931163787842, -0.6857420802116394, -0.6284910440444946, -0.5712400674819946, -0.5139890313148499, -0.45673805475234985, -0.3994870185852051, -0.3422360122203827, -0.2849850058555603, -0.22773399949073792, -0.17048299312591553, -0.11323197931051254, -0.05598096549510956, 0.0012700408697128296, 0.05852106213569641, 0.1157720685005188, 0.1730230748653412, 0.23027408123016357, 0.28752508759498596, 0.34477609395980835, 0.4020271301269531, 0.4592781066894531, 0.5165291428565979, 0.5737801790237427, 0.6310311555862427, 0.6882821321487427, 0.7455331683158875, 0.8027841448783875, 0.8600351810455322, 0.9172861576080322, 0.974537193775177, 1.0317882299423218, 1.0890392065048218, 1.1462903022766113, 1.2035412788391113, 1.2607923746109009, 1.3180433511734009, 1.3752943277359009, 1.4325454235076904, 1.4897964000701904, 1.5470473766326904, 1.6042983531951904, 1.6615493297576904, 1.71880042552948, 1.77605140209198, 1.83330237865448, 1.8905534744262695, 1.9478044509887695, 2.0050554275512695, 2.0623064041137695]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 5.0, 12.0, 24.0, 31.0, 32.0, 69.0, 108.0, 172.0, 280.0, 438.0, 675.0, 1161.0, 1893.0, 3447.0, 6629.0, 13700.0, 33753.0, 103302.0, 402006.0, 1646387.0, 1482275.0, 350428.0, 91498.0, 29836.0, 12356.0, 5959.0, 3134.0, 1875.0, 1073.0, 653.0, 408.0, 267.0, 150.0, 69.0, 59.0, 35.0, 27.0, 18.0, 14.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14013671875, -0.13600921630859375, -0.1318817138671875, -0.12775421142578125, -0.123626708984375, -0.11949920654296875, -0.1153717041015625, -0.11124420166015625, -0.10711669921875, -0.10298919677734375, -0.0988616943359375, -0.09473419189453125, -0.090606689453125, -0.08647918701171875, -0.0823516845703125, -0.07822418212890625, -0.0740966796875, -0.06996917724609375, -0.0658416748046875, -0.06171417236328125, -0.057586669921875, -0.05345916748046875, -0.0493316650390625, -0.04520416259765625, -0.04107666015625, -0.03694915771484375, -0.0328216552734375, -0.02869415283203125, -0.024566650390625, -0.02043914794921875, -0.0163116455078125, -0.01218414306640625, -0.008056640625, -0.00392913818359375, 0.0001983642578125, 0.00432586669921875, 0.008453369140625, 0.01258087158203125, 0.0167083740234375, 0.02083587646484375, 0.02496337890625, 0.02909088134765625, 0.0332183837890625, 0.03734588623046875, 0.041473388671875, 0.04560089111328125, 0.0497283935546875, 0.05385589599609375, 0.0579833984375, 0.06211090087890625, 0.0662384033203125, 0.07036590576171875, 0.074493408203125, 0.07862091064453125, 0.0827484130859375, 0.08687591552734375, 0.09100341796875, 0.09513092041015625, 0.0992584228515625, 0.10338592529296875, 0.107513427734375, 0.11164093017578125, 0.1157684326171875, 0.11989593505859375, 0.1240234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 5.0, 7.0, 11.0, 14.0, 20.0, 23.0, 29.0, 22.0, 38.0, 36.0, 63.0, 51.0, 60.0, 61.0, 54.0, 53.0, 62.0, 59.0, 50.0, 51.0, 45.0, 35.0, 37.0, 22.0, 18.0, 18.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.123931884765625, -0.11895751953125, -0.113983154296875, -0.1090087890625, -0.104034423828125, -0.09906005859375, -0.094085693359375, -0.089111328125, -0.084136962890625, -0.07916259765625, -0.074188232421875, -0.0692138671875, -0.064239501953125, -0.05926513671875, -0.054290771484375, -0.04931640625, -0.044342041015625, -0.03936767578125, -0.034393310546875, -0.0294189453125, -0.024444580078125, -0.01947021484375, -0.014495849609375, -0.009521484375, -0.004547119140625, 0.00042724609375, 0.005401611328125, 0.0103759765625, 0.015350341796875, 0.02032470703125, 0.025299072265625, 0.0302734375, 0.035247802734375, 0.04022216796875, 0.045196533203125, 0.0501708984375, 0.055145263671875, 0.06011962890625, 0.065093994140625, 0.070068359375, 0.075042724609375, 0.08001708984375, 0.084991455078125, 0.0899658203125, 0.094940185546875, 0.09991455078125, 0.104888916015625, 0.10986328125, 0.114837646484375, 0.11981201171875, 0.124786376953125, 0.1297607421875, 0.134735107421875, 0.13970947265625, 0.144683837890625, 0.149658203125, 0.154632568359375, 0.15960693359375, 0.164581298828125, 0.1695556640625, 0.174530029296875, 0.17950439453125, 0.184478759765625, 0.189453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 10.0, 14.0, 15.0, 28.0, 38.0, 43.0, 70.0, 129.0, 333.0, 940.0, 3906.0, 24059.0, 455195.0, 3603635.0, 92717.0, 10125.0, 1950.0, 569.0, 226.0, 105.0, 52.0, 42.0, 16.0, 21.0, 14.0, 11.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.3677482604980469, -0.35195159912109375, -0.3361549377441406, -0.3203582763671875, -0.3045616149902344, -0.28876495361328125, -0.2729682922363281, -0.257171630859375, -0.24137496948242188, -0.22557830810546875, -0.20978164672851562, -0.1939849853515625, -0.17818832397460938, -0.16239166259765625, -0.14659500122070312, -0.13079833984375, -0.11500167846679688, -0.09920501708984375, -0.08340835571289062, -0.0676116943359375, -0.051815032958984375, -0.03601837158203125, -0.020221710205078125, -0.004425048828125, 0.011371612548828125, 0.02716827392578125, 0.042964935302734375, 0.0587615966796875, 0.07455825805664062, 0.09035491943359375, 0.10615158081054688, 0.1219482421875, 0.13774490356445312, 0.15354156494140625, 0.16933822631835938, 0.1851348876953125, 0.20093154907226562, 0.21672821044921875, 0.23252487182617188, 0.248321533203125, 0.2641181945800781, 0.27991485595703125, 0.2957115173339844, 0.3115081787109375, 0.3273048400878906, 0.34310150146484375, 0.3588981628417969, 0.37469482421875, 0.3904914855957031, 0.40628814697265625, 0.4220848083496094, 0.4378814697265625, 0.4536781311035156, 0.46947479248046875, 0.4852714538574219, 0.501068115234375, 0.5168647766113281, 0.5326614379882812, 0.5484580993652344, 0.5642547607421875, 0.5800514221191406, 0.5958480834960938, 0.6116447448730469, 0.62744140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 6.0, 12.0, 10.0, 19.0, 19.0, 32.0, 42.0, 58.0, 100.0, 171.0, 275.0, 437.0, 746.0, 810.0, 524.0, 287.0, 167.0, 104.0, 64.0, 41.0, 34.0, 33.0, 17.0, 10.0, 10.0, 13.0, 5.0, 7.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3810615539550781, -0.37052154541015625, -0.3599815368652344, -0.3494415283203125, -0.3389015197753906, -0.32836151123046875, -0.3178215026855469, -0.307281494140625, -0.2967414855957031, -0.28620147705078125, -0.2756614685058594, -0.2651214599609375, -0.2545814514160156, -0.24404144287109375, -0.23350143432617188, -0.22296142578125, -0.21242141723632812, -0.20188140869140625, -0.19134140014648438, -0.1808013916015625, -0.17026138305664062, -0.15972137451171875, -0.14918136596679688, -0.138641357421875, -0.12810134887695312, -0.11756134033203125, -0.10702133178710938, -0.0964813232421875, -0.08594131469726562, -0.07540130615234375, -0.06486129760742188, -0.0543212890625, -0.043781280517578125, -0.03324127197265625, -0.022701263427734375, -0.0121612548828125, -0.001621246337890625, 0.00891876220703125, 0.019458770751953125, 0.029998779296875, 0.040538787841796875, 0.05107879638671875, 0.061618804931640625, 0.0721588134765625, 0.08269882202148438, 0.09323883056640625, 0.10377883911132812, 0.11431884765625, 0.12485885620117188, 0.13539886474609375, 0.14593887329101562, 0.1564788818359375, 0.16701889038085938, 0.17755889892578125, 0.18809890747070312, 0.198638916015625, 0.20917892456054688, 0.21971893310546875, 0.23025894165039062, 0.2407989501953125, 0.2513389587402344, 0.26187896728515625, 0.2724189758300781, 0.282958984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 3.0, 10.0, 24.0, 64.0, 145.0, 249.0, 246.0, 146.0, 69.0, 27.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0440897941589355, -4.911666393280029, -4.779242515563965, -4.646819114685059, -4.514395236968994, -4.381971836090088, -4.249547958374023, -4.117124557495117, -3.984700918197632, -3.8522772789001465, -3.719853639602661, -3.587430000305176, -3.4550065994262695, -3.322582721710205, -3.190159320831299, -3.0577356815338135, -2.925312042236328, -2.7928884029388428, -2.6604647636413574, -2.528041124343872, -2.3956174850463867, -2.2631940841674805, -2.130770444869995, -1.9983468055725098, -1.8659231662750244, -1.733499526977539, -1.6010758876800537, -1.468652367591858, -1.3362287282943726, -1.2038050889968872, -1.0713815689086914, -0.938957929611206, -0.8065338134765625, -0.6741101741790771, -0.5416865944862366, -0.4092629849910736, -0.27683937549591064, -0.1444157361984253, -0.011992156505584717, 0.12043142318725586, 0.2528550624847412, 0.3852786719799042, 0.5177022814750671, 0.6501258611679077, 0.7825495004653931, 0.9149731397628784, 1.0473966598510742, 1.1798202991485596, 1.312243938446045, 1.4446675777435303, 1.5770912170410156, 1.7095147371292114, 1.8419383764266968, 1.9743620157241821, 2.106785535812378, 2.2392091751098633, 2.3716328144073486, 2.504056453704834, 2.6364800930023193, 2.7689037322998047, 2.901327133178711, 3.0337510108947754, 3.1661744117736816, 3.298598051071167, 3.4310216903686523]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 6.0, 8.0, 9.0, 17.0, 17.0, 15.0, 25.0, 34.0, 31.0, 37.0, 46.0, 47.0, 49.0, 33.0, 54.0, 46.0, 53.0, 44.0, 46.0, 44.0, 52.0, 53.0, 33.0, 30.0, 29.0, 30.0, 25.0, 16.0, 16.0, 13.0, 6.0, 4.0, 2.0, 4.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3673722743988037, -1.3215018510818481, -1.2756314277648926, -1.229761004447937, -1.1838905811309814, -1.1380200386047363, -1.0921496152877808, -1.0462791919708252, -1.0004087686538696, -0.9545383453369141, -0.9086679220199585, -0.8627974390983582, -0.8169270157814026, -0.771056592464447, -0.7251861095428467, -0.6793156862258911, -0.6334452629089355, -0.58757483959198, -0.5417044162750244, -0.4958339333534241, -0.4499635100364685, -0.40409308671951294, -0.358222633600235, -0.31235218048095703, -0.26648175716400146, -0.2206113189458847, -0.17474088072776794, -0.12887044250965118, -0.08300000429153442, -0.037129566073417664, 0.008740872144699097, 0.05461132526397705, 0.10048174858093262, 0.14635218679904938, 0.19222262501716614, 0.2380930632352829, 0.28396350145339966, 0.3298339247703552, 0.3757043778896332, 0.42157483100891113, 0.4674452543258667, 0.5133156776428223, 0.5591861009597778, 0.6050565838813782, 0.6509270071983337, 0.6967974305152893, 0.7426679134368896, 0.7885383367538452, 0.8344087600708008, 0.8802791833877563, 0.9261496067047119, 0.9720200896263123, 1.017890453338623, 1.0637609958648682, 1.1096314191818237, 1.1555018424987793, 1.2013722658157349, 1.2472426891326904, 1.293113112449646, 1.3389835357666016, 1.3848540782928467, 1.4307245016098022, 1.4765949249267578, 1.5224653482437134, 1.568335771560669]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 16.0, 13.0, 24.0, 38.0, 45.0, 36.0, 69.0, 129.0, 173.0, 230.0, 398.0, 610.0, 1126.0, 2025.0, 4449.0, 10884.0, 30482.0, 105444.0, 432839.0, 338181.0, 79935.0, 24216.0, 8927.0, 3840.0, 1819.0, 969.0, 542.0, 338.0, 208.0, 145.0, 92.0, 80.0, 62.0, 39.0, 29.0, 33.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.239990234375, -0.23291015625, -0.225830078125, -0.21875, -0.211669921875, -0.20458984375, -0.197509765625, -0.1904296875, -0.183349609375, -0.17626953125, -0.169189453125, -0.162109375, -0.155029296875, -0.14794921875, -0.140869140625, -0.1337890625, -0.126708984375, -0.11962890625, -0.112548828125, -0.10546875, -0.098388671875, -0.09130859375, -0.084228515625, -0.0771484375, -0.070068359375, -0.06298828125, -0.055908203125, -0.048828125, -0.041748046875, -0.03466796875, -0.027587890625, -0.0205078125, -0.013427734375, -0.00634765625, 0.000732421875, 0.0078125, 0.014892578125, 0.02197265625, 0.029052734375, 0.0361328125, 0.043212890625, 0.05029296875, 0.057373046875, 0.064453125, 0.071533203125, 0.07861328125, 0.085693359375, 0.0927734375, 0.099853515625, 0.10693359375, 0.114013671875, 0.12109375, 0.128173828125, 0.13525390625, 0.142333984375, 0.1494140625, 0.156494140625, 0.16357421875, 0.170654296875, 0.177734375, 0.184814453125, 0.19189453125, 0.198974609375, 0.2060546875, 0.213134765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 12.0, 10.0, 14.0, 27.0, 15.0, 19.0, 28.0, 33.0, 46.0, 25.0, 37.0, 36.0, 46.0, 49.0, 50.0, 50.0, 38.0, 52.0, 63.0, 38.0, 39.0, 30.0, 35.0, 27.0, 29.0, 24.0, 16.0, 13.0, 15.0, 16.0, 15.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11859130859375, -0.11428546905517578, -0.10997962951660156, -0.10567378997802734, -0.10136795043945312, -0.0970621109008789, -0.09275627136230469, -0.08845043182373047, -0.08414459228515625, -0.07983875274658203, -0.07553291320800781, -0.0712270736694336, -0.06692123413085938, -0.06261539459228516, -0.05830955505371094, -0.05400371551513672, -0.0496978759765625, -0.04539203643798828, -0.04108619689941406, -0.036780357360839844, -0.032474517822265625, -0.028168678283691406, -0.023862838745117188, -0.01955699920654297, -0.01525115966796875, -0.010945320129394531, -0.0066394805908203125, -0.0023336410522460938, 0.001972198486328125, 0.006278038024902344, 0.010583877563476562, 0.014889717102050781, 0.019195556640625, 0.02350139617919922, 0.027807235717773438, 0.032113075256347656, 0.036418914794921875, 0.040724754333496094, 0.04503059387207031, 0.04933643341064453, 0.05364227294921875, 0.05794811248779297, 0.06225395202636719, 0.0665597915649414, 0.07086563110351562, 0.07517147064208984, 0.07947731018066406, 0.08378314971923828, 0.0880889892578125, 0.09239482879638672, 0.09670066833496094, 0.10100650787353516, 0.10531234741210938, 0.1096181869506836, 0.11392402648925781, 0.11822986602783203, 0.12253570556640625, 0.12684154510498047, 0.1311473846435547, 0.1354532241821289, 0.13975906372070312, 0.14406490325927734, 0.14837074279785156, 0.15267658233642578, 0.156982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 11.0, 9.0, 18.0, 28.0, 51.0, 64.0, 101.0, 153.0, 262.0, 496.0, 1004.0, 2531.0, 8028.0, 42743.0, 671849.0, 282905.0, 28249.0, 6195.0, 1935.0, 865.0, 433.0, 221.0, 137.0, 78.0, 48.0, 42.0, 34.0, 22.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27368927001953125, -0.2617340087890625, -0.24977874755859375, -0.237823486328125, -0.22586822509765625, -0.2139129638671875, -0.20195770263671875, -0.19000244140625, -0.17804718017578125, -0.1660919189453125, -0.15413665771484375, -0.142181396484375, -0.13022613525390625, -0.1182708740234375, -0.10631561279296875, -0.0943603515625, -0.08240509033203125, -0.0704498291015625, -0.05849456787109375, -0.046539306640625, -0.03458404541015625, -0.0226287841796875, -0.01067352294921875, 0.00128173828125, 0.01323699951171875, 0.0251922607421875, 0.03714752197265625, 0.049102783203125, 0.06105804443359375, 0.0730133056640625, 0.08496856689453125, 0.096923828125, 0.10887908935546875, 0.1208343505859375, 0.13278961181640625, 0.144744873046875, 0.15670013427734375, 0.1686553955078125, 0.18061065673828125, 0.19256591796875, 0.20452117919921875, 0.2164764404296875, 0.22843170166015625, 0.240386962890625, 0.25234222412109375, 0.2642974853515625, 0.27625274658203125, 0.2882080078125, 0.30016326904296875, 0.3121185302734375, 0.32407379150390625, 0.336029052734375, 0.34798431396484375, 0.3599395751953125, 0.37189483642578125, 0.38385009765625, 0.39580535888671875, 0.4077606201171875, 0.41971588134765625, 0.431671142578125, 0.44362640380859375, 0.4555816650390625, 0.46753692626953125, 0.4794921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 3.0, 10.0, 22.0, 13.0, 19.0, 23.0, 30.0, 38.0, 50.0, 32.0, 65.0, 50.0, 62.0, 61.0, 58.0, 52.0, 59.0, 52.0, 46.0, 44.0, 38.0, 26.0, 19.0, 17.0, 24.0, 14.0, 8.0, 12.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5231170654296875, -0.504730224609375, -0.4863433837890625, -0.46795654296875, -0.4495697021484375, -0.431182861328125, -0.4127960205078125, -0.3944091796875, -0.3760223388671875, -0.357635498046875, -0.3392486572265625, -0.32086181640625, -0.3024749755859375, -0.284088134765625, -0.2657012939453125, -0.247314453125, -0.2289276123046875, -0.210540771484375, -0.1921539306640625, -0.17376708984375, -0.1553802490234375, -0.136993408203125, -0.1186065673828125, -0.1002197265625, -0.0818328857421875, -0.063446044921875, -0.0450592041015625, -0.02667236328125, -0.0082855224609375, 0.010101318359375, 0.0284881591796875, 0.046875, 0.0652618408203125, 0.083648681640625, 0.1020355224609375, 0.12042236328125, 0.1388092041015625, 0.157196044921875, 0.1755828857421875, 0.1939697265625, 0.2123565673828125, 0.230743408203125, 0.2491302490234375, 0.26751708984375, 0.2859039306640625, 0.304290771484375, 0.3226776123046875, 0.341064453125, 0.3594512939453125, 0.377838134765625, 0.3962249755859375, 0.41461181640625, 0.4329986572265625, 0.451385498046875, 0.4697723388671875, 0.4881591796875, 0.5065460205078125, 0.524932861328125, 0.5433197021484375, 0.56170654296875, 0.5800933837890625, 0.598480224609375, 0.6168670654296875, 0.63525390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 9.0, 2.0, 6.0, 11.0, 14.0, 30.0, 28.0, 33.0, 44.0, 59.0, 100.0, 145.0, 196.0, 303.0, 529.0, 829.0, 1454.0, 2780.0, 5724.0, 12783.0, 31947.0, 99060.0, 586230.0, 209806.0, 57592.0, 20768.0, 8862.0, 4106.0, 2084.0, 1148.0, 673.0, 420.0, 249.0, 160.0, 107.0, 80.0, 46.0, 32.0, 23.0, 13.0, 8.0, 10.0, 7.0, 5.0, 7.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.08319091796875, -0.08065223693847656, -0.07811355590820312, -0.07557487487792969, -0.07303619384765625, -0.07049751281738281, -0.06795883178710938, -0.06542015075683594, -0.0628814697265625, -0.06034278869628906, -0.057804107666015625, -0.05526542663574219, -0.05272674560546875, -0.05018806457519531, -0.047649383544921875, -0.04511070251464844, -0.042572021484375, -0.04003334045410156, -0.037494659423828125, -0.03495597839355469, -0.03241729736328125, -0.029878616333007812, -0.027339935302734375, -0.024801254272460938, -0.0222625732421875, -0.019723892211914062, -0.017185211181640625, -0.014646530151367188, -0.01210784912109375, -0.009569168090820312, -0.007030487060546875, -0.0044918060302734375, -0.001953125, 0.0005855560302734375, 0.003124237060546875, 0.0056629180908203125, 0.00820159912109375, 0.010740280151367188, 0.013278961181640625, 0.015817642211914062, 0.0183563232421875, 0.020895004272460938, 0.023433685302734375, 0.025972366333007812, 0.02851104736328125, 0.031049728393554688, 0.033588409423828125, 0.03612709045410156, 0.038665771484375, 0.04120445251464844, 0.043743133544921875, 0.04628181457519531, 0.04882049560546875, 0.05135917663574219, 0.053897857666015625, 0.05643653869628906, 0.0589752197265625, 0.06151390075683594, 0.06405258178710938, 0.06659126281738281, 0.06912994384765625, 0.07166862487792969, 0.07420730590820312, 0.07674598693847656, 0.07928466796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 11.0, 10.0, 22.0, 24.0, 35.0, 39.0, 73.0, 83.0, 104.0, 117.0, 117.0, 100.0, 70.0, 46.0, 36.0, 23.0, 15.0, 16.0, 15.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.148110747337341e-05, -4.016607999801636e-05, -3.88510525226593e-05, -3.7536025047302246e-05, -3.622099757194519e-05, -3.4905970096588135e-05, -3.359094262123108e-05, -3.2275915145874023e-05, -3.096088767051697e-05, -2.9645860195159912e-05, -2.8330832719802856e-05, -2.70158052444458e-05, -2.5700777769088745e-05, -2.438575029373169e-05, -2.3070722818374634e-05, -2.1755695343017578e-05, -2.0440667867660522e-05, -1.9125640392303467e-05, -1.781061291694641e-05, -1.6495585441589355e-05, -1.51805579662323e-05, -1.3865530490875244e-05, -1.2550503015518188e-05, -1.1235475540161133e-05, -9.920448064804077e-06, -8.605420589447021e-06, -7.290393114089966e-06, -5.97536563873291e-06, -4.6603381633758545e-06, -3.345310688018799e-06, -2.030283212661743e-06, -7.152557373046875e-07, 5.997717380523682e-07, 1.914799213409424e-06, 3.2298266887664795e-06, 4.544854164123535e-06, 5.859881639480591e-06, 7.1749091148376465e-06, 8.489936590194702e-06, 9.804964065551758e-06, 1.1119991540908813e-05, 1.2435019016265869e-05, 1.3750046491622925e-05, 1.506507396697998e-05, 1.6380101442337036e-05, 1.7695128917694092e-05, 1.9010156393051147e-05, 2.0325183868408203e-05, 2.164021134376526e-05, 2.2955238819122314e-05, 2.427026629447937e-05, 2.5585293769836426e-05, 2.690032124519348e-05, 2.8215348720550537e-05, 2.9530376195907593e-05, 3.084540367126465e-05, 3.2160431146621704e-05, 3.347545862197876e-05, 3.4790486097335815e-05, 3.610551357269287e-05, 3.742054104804993e-05, 3.873556852340698e-05, 4.005059599876404e-05, 4.1365623474121094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 10.0, 9.0, 11.0, 15.0, 25.0, 46.0, 51.0, 95.0, 140.0, 179.0, 314.0, 582.0, 1192.0, 2235.0, 4990.0, 12902.0, 39959.0, 177229.0, 657557.0, 106219.0, 27575.0, 9382.0, 3827.0, 1788.0, 896.0, 475.0, 317.0, 184.0, 116.0, 55.0, 51.0, 46.0, 27.0, 14.0, 15.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11260986328125, -0.10942363739013672, -0.10623741149902344, -0.10305118560791016, -0.09986495971679688, -0.0966787338256836, -0.09349250793457031, -0.09030628204345703, -0.08712005615234375, -0.08393383026123047, -0.08074760437011719, -0.0775613784790039, -0.07437515258789062, -0.07118892669677734, -0.06800270080566406, -0.06481647491455078, -0.0616302490234375, -0.05844402313232422, -0.05525779724121094, -0.052071571350097656, -0.048885345458984375, -0.045699119567871094, -0.04251289367675781, -0.03932666778564453, -0.03614044189453125, -0.03295421600341797, -0.029767990112304688, -0.026581764221191406, -0.023395538330078125, -0.020209312438964844, -0.017023086547851562, -0.013836860656738281, -0.010650634765625, -0.007464408874511719, -0.0042781829833984375, -0.0010919570922851562, 0.002094268798828125, 0.005280494689941406, 0.008466720581054688, 0.011652946472167969, 0.01483917236328125, 0.01802539825439453, 0.021211624145507812, 0.024397850036621094, 0.027584075927734375, 0.030770301818847656, 0.03395652770996094, 0.03714275360107422, 0.0403289794921875, 0.04351520538330078, 0.04670143127441406, 0.049887657165527344, 0.053073883056640625, 0.056260108947753906, 0.05944633483886719, 0.06263256072998047, 0.06581878662109375, 0.06900501251220703, 0.07219123840332031, 0.0753774642944336, 0.07856369018554688, 0.08174991607666016, 0.08493614196777344, 0.08812236785888672, 0.09130859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 14.0, 19.0, 17.0, 24.0, 39.0, 50.0, 54.0, 76.0, 89.0, 101.0, 87.0, 86.0, 60.0, 73.0, 53.0, 24.0, 22.0, 22.0, 14.0, 11.0, 8.0, 7.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112060546875, -0.10832786560058594, -0.10459518432617188, -0.10086250305175781, -0.09712982177734375, -0.09339714050292969, -0.08966445922851562, -0.08593177795410156, -0.0821990966796875, -0.07846641540527344, -0.07473373413085938, -0.07100105285644531, -0.06726837158203125, -0.06353569030761719, -0.059803009033203125, -0.05607032775878906, -0.052337646484375, -0.04860496520996094, -0.044872283935546875, -0.04113960266113281, -0.03740692138671875, -0.03367424011230469, -0.029941558837890625, -0.026208877563476562, -0.0224761962890625, -0.018743515014648438, -0.015010833740234375, -0.011278152465820312, -0.00754547119140625, -0.0038127899169921875, -8.0108642578125e-05, 0.0036525726318359375, 0.00738525390625, 0.011117935180664062, 0.014850616455078125, 0.018583297729492188, 0.02231597900390625, 0.026048660278320312, 0.029781341552734375, 0.03351402282714844, 0.0372467041015625, 0.04097938537597656, 0.044712066650390625, 0.04844474792480469, 0.05217742919921875, 0.05591011047363281, 0.059642791748046875, 0.06337547302246094, 0.067108154296875, 0.07084083557128906, 0.07457351684570312, 0.07830619812011719, 0.08203887939453125, 0.08577156066894531, 0.08950424194335938, 0.09323692321777344, 0.0969696044921875, 0.10070228576660156, 0.10443496704101562, 0.10816764831542969, 0.11190032958984375, 0.11563301086425781, 0.11936569213867188, 0.12309837341308594, 0.1268310546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 69.0, 148.0, 346.0, 197.0, 100.0, 42.0, 29.0, 11.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.927361011505127, -3.8200178146362305, -3.712674617767334, -3.6053314208984375, -3.497988224029541, -3.3906450271606445, -3.283301830291748, -3.1759586334228516, -3.068615436553955, -2.9612722396850586, -2.853929042816162, -2.7465858459472656, -2.639242649078369, -2.5318994522094727, -2.424556255340576, -2.3172130584716797, -2.209869861602783, -2.1025266647338867, -1.9951834678649902, -1.8878402709960938, -1.7804970741271973, -1.6731538772583008, -1.5658106803894043, -1.4584674835205078, -1.3511242866516113, -1.2437810897827148, -1.1364378929138184, -1.0290946960449219, -0.9217514991760254, -0.8144083023071289, -0.7070651054382324, -0.5997219085693359, -0.49237847328186035, -0.38503527641296387, -0.2776920795440674, -0.1703488826751709, -0.06300568580627441, 0.04433751106262207, 0.15168070793151855, 0.25902390480041504, 0.3663671016693115, 0.473710298538208, 0.5810534954071045, 0.688396692276001, 0.7957398891448975, 0.903083086013794, 1.0104262828826904, 1.117769479751587, 1.2251126766204834, 1.3324558734893799, 1.4397990703582764, 1.5471422672271729, 1.6544854640960693, 1.7618286609649658, 1.8691718578338623, 1.9765150547027588, 2.0838582515716553, 2.1912014484405518, 2.2985446453094482, 2.4058878421783447, 2.513231039047241, 2.6205742359161377, 2.727917432785034, 2.8352606296539307, 2.942603826522827]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 18.0, 8.0, 24.0, 12.0, 20.0, 26.0, 27.0, 32.0, 27.0, 41.0, 40.0, 88.0, 98.0, 86.0, 71.0, 51.0, 31.0, 36.0, 33.0, 30.0, 36.0, 18.0, 19.0, 17.0, 13.0, 8.0, 8.0, 12.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.4488959312438965, -2.380946159362793, -2.3129966259002686, -2.245047092437744, -2.1770973205566406, -2.109147548675537, -2.0411980152130127, -1.9732483625411987, -1.9052987098693848, -1.8373490571975708, -1.7693994045257568, -1.7014497518539429, -1.633500099182129, -1.565550446510315, -1.497600793838501, -1.429651141166687, -1.361701488494873, -1.293751835823059, -1.2258021831512451, -1.1578525304794312, -1.0899028778076172, -1.0219532251358032, -0.9540035724639893, -0.8860539197921753, -0.8181042671203613, -0.7501546144485474, -0.6822049617767334, -0.6142553091049194, -0.5463056564331055, -0.4783560037612915, -0.41040635108947754, -0.3424566984176636, -0.2745072841644287, -0.20655763149261475, -0.13860797882080078, -0.07065832614898682, -0.0027086734771728516, 0.06524097919464111, 0.13319063186645508, 0.20114028453826904, 0.269089937210083, 0.337039589881897, 0.40498924255371094, 0.4729388952255249, 0.5408885478973389, 0.6088382005691528, 0.6767878532409668, 0.7447375059127808, 0.8126871585845947, 0.8806368112564087, 0.9485864639282227, 1.0165361166000366, 1.0844857692718506, 1.1524354219436646, 1.2203850746154785, 1.2883347272872925, 1.3562843799591064, 1.4242340326309204, 1.4921836853027344, 1.5601333379745483, 1.6280829906463623, 1.6960326433181763, 1.7639822959899902, 1.8319319486618042, 1.8998816013336182]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 16.0, 4.0, 12.0, 13.0, 27.0, 38.0, 47.0, 68.0, 116.0, 162.0, 260.0, 405.0, 569.0, 1023.0, 1918.0, 3807.0, 9282.0, 26173.0, 100880.0, 550573.0, 2311126.0, 965677.0, 163309.0, 36321.0, 11928.0, 5015.0, 2350.0, 1246.0, 679.0, 424.0, 247.0, 174.0, 114.0, 97.0, 59.0, 35.0, 23.0, 23.0, 11.0, 8.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.183349609375, -0.1782073974609375, -0.173065185546875, -0.1679229736328125, -0.16278076171875, -0.1576385498046875, -0.152496337890625, -0.1473541259765625, -0.1422119140625, -0.1370697021484375, -0.131927490234375, -0.1267852783203125, -0.12164306640625, -0.1165008544921875, -0.111358642578125, -0.1062164306640625, -0.10107421875, -0.0959320068359375, -0.090789794921875, -0.0856475830078125, -0.08050537109375, -0.0753631591796875, -0.070220947265625, -0.0650787353515625, -0.0599365234375, -0.0547943115234375, -0.049652099609375, -0.0445098876953125, -0.03936767578125, -0.0342254638671875, -0.029083251953125, -0.0239410400390625, -0.018798828125, -0.0136566162109375, -0.008514404296875, -0.0033721923828125, 0.00177001953125, 0.0069122314453125, 0.012054443359375, 0.0171966552734375, 0.0223388671875, 0.0274810791015625, 0.032623291015625, 0.0377655029296875, 0.04290771484375, 0.0480499267578125, 0.053192138671875, 0.0583343505859375, 0.0634765625, 0.0686187744140625, 0.073760986328125, 0.0789031982421875, 0.08404541015625, 0.0891876220703125, 0.094329833984375, 0.0994720458984375, 0.1046142578125, 0.1097564697265625, 0.114898681640625, 0.1200408935546875, 0.12518310546875, 0.1303253173828125, 0.135467529296875, 0.1406097412109375, 0.145751953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 17.0, 16.0, 24.0, 31.0, 36.0, 40.0, 35.0, 47.0, 46.0, 49.0, 55.0, 60.0, 52.0, 50.0, 50.0, 50.0, 46.0, 41.0, 39.0, 34.0, 29.0, 19.0, 22.0, 29.0, 11.0, 14.0, 9.0, 10.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.13487815856933594, -0.13010787963867188, -0.1253376007080078, -0.12056732177734375, -0.11579704284667969, -0.11102676391601562, -0.10625648498535156, -0.1014862060546875, -0.09671592712402344, -0.09194564819335938, -0.08717536926269531, -0.08240509033203125, -0.07763481140136719, -0.07286453247070312, -0.06809425354003906, -0.063323974609375, -0.05855369567871094, -0.053783416748046875, -0.04901313781738281, -0.04424285888671875, -0.03947257995605469, -0.034702301025390625, -0.029932022094726562, -0.0251617431640625, -0.020391464233398438, -0.015621185302734375, -0.010850906372070312, -0.00608062744140625, -0.0013103485107421875, 0.003459930419921875, 0.008230209350585938, 0.01300048828125, 0.017770767211914062, 0.022541046142578125, 0.027311325073242188, 0.03208160400390625, 0.03685188293457031, 0.041622161865234375, 0.04639244079589844, 0.0511627197265625, 0.05593299865722656, 0.060703277587890625, 0.06547355651855469, 0.07024383544921875, 0.07501411437988281, 0.07978439331054688, 0.08455467224121094, 0.089324951171875, 0.09409523010253906, 0.09886550903320312, 0.10363578796386719, 0.10840606689453125, 0.11317634582519531, 0.11794662475585938, 0.12271690368652344, 0.1274871826171875, 0.13225746154785156, 0.13702774047851562, 0.1417980194091797, 0.14656829833984375, 0.1513385772705078, 0.15610885620117188, 0.16087913513183594, 0.1656494140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 15.0, 7.0, 20.0, 30.0, 28.0, 62.0, 87.0, 159.0, 379.0, 927.0, 3276.0, 15552.0, 157508.0, 3681146.0, 307217.0, 21876.0, 4076.0, 1067.0, 364.0, 176.0, 95.0, 57.0, 34.0, 24.0, 20.0, 18.0, 8.0, 6.0, 9.0, 7.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.424713134765625, -0.41168212890625, -0.398651123046875, -0.3856201171875, -0.372589111328125, -0.35955810546875, -0.346527099609375, -0.33349609375, -0.320465087890625, -0.30743408203125, -0.294403076171875, -0.2813720703125, -0.268341064453125, -0.25531005859375, -0.242279052734375, -0.229248046875, -0.216217041015625, -0.20318603515625, -0.190155029296875, -0.1771240234375, -0.164093017578125, -0.15106201171875, -0.138031005859375, -0.125, -0.111968994140625, -0.09893798828125, -0.085906982421875, -0.0728759765625, -0.059844970703125, -0.04681396484375, -0.033782958984375, -0.020751953125, -0.007720947265625, 0.00531005859375, 0.018341064453125, 0.0313720703125, 0.044403076171875, 0.05743408203125, 0.070465087890625, 0.08349609375, 0.096527099609375, 0.10955810546875, 0.122589111328125, 0.1356201171875, 0.148651123046875, 0.16168212890625, 0.174713134765625, 0.187744140625, 0.200775146484375, 0.21380615234375, 0.226837158203125, 0.2398681640625, 0.252899169921875, 0.26593017578125, 0.278961181640625, 0.2919921875, 0.305023193359375, 0.31805419921875, 0.331085205078125, 0.3441162109375, 0.357147216796875, 0.37017822265625, 0.383209228515625, 0.396240234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 8.0, 14.0, 16.0, 21.0, 24.0, 33.0, 59.0, 86.0, 141.0, 222.0, 367.0, 613.0, 753.0, 627.0, 400.0, 252.0, 143.0, 89.0, 59.0, 33.0, 27.0, 11.0, 15.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2664604187011719, -0.25679779052734375, -0.24713516235351562, -0.2374725341796875, -0.22780990600585938, -0.21814727783203125, -0.20848464965820312, -0.198822021484375, -0.18915939331054688, -0.17949676513671875, -0.16983413696289062, -0.1601715087890625, -0.15050888061523438, -0.14084625244140625, -0.13118362426757812, -0.12152099609375, -0.11185836791992188, -0.10219573974609375, -0.09253311157226562, -0.0828704833984375, -0.07320785522460938, -0.06354522705078125, -0.053882598876953125, -0.044219970703125, -0.034557342529296875, -0.02489471435546875, -0.015232086181640625, -0.0055694580078125, 0.004093170166015625, 0.01375579833984375, 0.023418426513671875, 0.0330810546875, 0.042743682861328125, 0.05240631103515625, 0.062068939208984375, 0.0717315673828125, 0.08139419555664062, 0.09105682373046875, 0.10071945190429688, 0.110382080078125, 0.12004470825195312, 0.12970733642578125, 0.13936996459960938, 0.1490325927734375, 0.15869522094726562, 0.16835784912109375, 0.17802047729492188, 0.18768310546875, 0.19734573364257812, 0.20700836181640625, 0.21667098999023438, 0.2263336181640625, 0.23599624633789062, 0.24565887451171875, 0.2553215026855469, 0.264984130859375, 0.2746467590332031, 0.28430938720703125, 0.2939720153808594, 0.3036346435546875, 0.3132972717285156, 0.32295989990234375, 0.3326225280761719, 0.34228515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 17.0, 26.0, 35.0, 80.0, 148.0, 194.0, 168.0, 143.0, 79.0, 42.0, 17.0, 6.0, 7.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.446486234664917, -3.3627686500549316, -3.2790513038635254, -3.19533371925354, -3.1116161346435547, -3.0278987884521484, -2.944181203842163, -2.8604636192321777, -2.7767462730407715, -2.693028688430786, -2.60931134223938, -2.5255937576293945, -2.4418764114379883, -2.358158826828003, -2.2744412422180176, -2.1907238960266113, -2.107006311416626, -2.0232887268066406, -1.9395713806152344, -1.855853796005249, -1.7721363306045532, -1.6884188652038574, -1.604701280593872, -1.5209838151931763, -1.4372663497924805, -1.3535488843917847, -1.2698314189910889, -1.1861138343811035, -1.1023963689804077, -1.018678903579712, -0.9349613785743713, -0.8512438535690308, -0.7675262689590454, -0.6838088035583496, -0.600091278553009, -0.5163737535476685, -0.43265628814697266, -0.34893879294395447, -0.2652212977409363, -0.1815037727355957, -0.0977863073348999, -0.014068812131881714, 0.06964868307113647, 0.15336617827415466, 0.23708367347717285, 0.32080116868019104, 0.40451866388320923, 0.4882361888885498, 0.5719536542892456, 0.6556711196899414, 0.739388644695282, 0.8231061697006226, 0.9068236351013184, 0.9905411005020142, 1.07425856590271, 1.1579761505126953, 1.2416936159133911, 1.325411081314087, 1.4091286659240723, 1.492846131324768, 1.5765635967254639, 1.6602810621261597, 1.7439985275268555, 1.8277161121368408, 1.9114335775375366]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 6.0, 9.0, 15.0, 7.0, 13.0, 23.0, 23.0, 14.0, 21.0, 25.0, 35.0, 33.0, 30.0, 38.0, 49.0, 50.0, 43.0, 60.0, 45.0, 41.0, 43.0, 35.0, 28.0, 37.0, 34.0, 34.0, 18.0, 33.0, 20.0, 16.0, 14.0, 11.0, 11.0, 13.0, 7.0, 6.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.135279655456543, -1.0982357263565063, -1.0611919164657593, -1.0241479873657227, -0.9871041774749756, -0.950060248374939, -0.9130163788795471, -0.8759725093841553, -0.8389286398887634, -0.8018847703933716, -0.7648409008979797, -0.7277970314025879, -0.6907531023025513, -0.6537092924118042, -0.6166653633117676, -0.5796214938163757, -0.5425776243209839, -0.505533754825592, -0.4684898853302002, -0.43144598603248596, -0.3944021165370941, -0.35735824704170227, -0.32031434774398804, -0.2832704782485962, -0.24622660875320435, -0.2091827392578125, -0.17213885486125946, -0.13509497046470642, -0.09805110096931458, -0.06100723147392273, -0.02396334707736969, 0.01308053731918335, 0.050124406814575195, 0.08716828376054764, 0.12421216070652008, 0.16125604510307312, 0.19829991459846497, 0.2353437840938568, 0.27238768339157104, 0.3094315528869629, 0.34647542238235474, 0.3835192918777466, 0.4205631613731384, 0.45760706067085266, 0.4946509301662445, 0.531694769859314, 0.5687386989593506, 0.6057825684547424, 0.6428264379501343, 0.6798703074455261, 0.716914176940918, 0.7539580464363098, 0.7910019159317017, 0.8280458450317383, 0.8650897145271301, 0.902133584022522, 0.9391774535179138, 0.9762213230133057, 1.0132652521133423, 1.0503090620040894, 1.087352991104126, 1.124396800994873, 1.1614407300949097, 1.1984846591949463, 1.2355284690856934]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 5.0, 5.0, 11.0, 5.0, 17.0, 28.0, 29.0, 43.0, 43.0, 69.0, 105.0, 188.0, 250.0, 439.0, 774.0, 1364.0, 2631.0, 5794.0, 13820.0, 37773.0, 131265.0, 478820.0, 268692.0, 67010.0, 22275.0, 8767.0, 3848.0, 1929.0, 928.0, 561.0, 382.0, 203.0, 140.0, 91.0, 66.0, 51.0, 29.0, 34.0, 17.0, 14.0, 8.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.2301025390625, -0.2232837677001953, -0.21646499633789062, -0.20964622497558594, -0.20282745361328125, -0.19600868225097656, -0.18918991088867188, -0.1823711395263672, -0.1755523681640625, -0.1687335968017578, -0.16191482543945312, -0.15509605407714844, -0.14827728271484375, -0.14145851135253906, -0.13463973999023438, -0.1278209686279297, -0.121002197265625, -0.11418342590332031, -0.10736465454101562, -0.10054588317871094, -0.09372711181640625, -0.08690834045410156, -0.08008956909179688, -0.07327079772949219, -0.0664520263671875, -0.05963325500488281, -0.052814483642578125, -0.04599571228027344, -0.03917694091796875, -0.03235816955566406, -0.025539398193359375, -0.018720626831054688, -0.01190185546875, -0.0050830841064453125, 0.001735687255859375, 0.008554458618164062, 0.01537322998046875, 0.022192001342773438, 0.029010772705078125, 0.03582954406738281, 0.0426483154296875, 0.04946708679199219, 0.056285858154296875, 0.06310462951660156, 0.06992340087890625, 0.07674217224121094, 0.08356094360351562, 0.09037971496582031, 0.097198486328125, 0.10401725769042969, 0.11083602905273438, 0.11765480041503906, 0.12447357177734375, 0.13129234313964844, 0.13811111450195312, 0.1449298858642578, 0.1517486572265625, 0.1585674285888672, 0.16538619995117188, 0.17220497131347656, 0.17902374267578125, 0.18584251403808594, 0.19266128540039062, 0.1994800567626953, 0.206298828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 3.0, 10.0, 21.0, 18.0, 19.0, 27.0, 32.0, 49.0, 49.0, 51.0, 59.0, 57.0, 58.0, 56.0, 64.0, 58.0, 46.0, 52.0, 55.0, 44.0, 20.0, 26.0, 31.0, 24.0, 21.0, 16.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1547107696533203, -0.14914321899414062, -0.14357566833496094, -0.13800811767578125, -0.13244056701660156, -0.12687301635742188, -0.12130546569824219, -0.1157379150390625, -0.11017036437988281, -0.10460281372070312, -0.09903526306152344, -0.09346771240234375, -0.08790016174316406, -0.08233261108398438, -0.07676506042480469, -0.071197509765625, -0.06562995910644531, -0.060062408447265625, -0.05449485778808594, -0.04892730712890625, -0.04335975646972656, -0.037792205810546875, -0.03222465515136719, -0.0266571044921875, -0.021089553833007812, -0.015522003173828125, -0.009954452514648438, -0.00438690185546875, 0.0011806488037109375, 0.006748199462890625, 0.012315750122070312, 0.01788330078125, 0.023450851440429688, 0.029018402099609375, 0.03458595275878906, 0.04015350341796875, 0.04572105407714844, 0.051288604736328125, 0.05685615539550781, 0.0624237060546875, 0.06799125671386719, 0.07355880737304688, 0.07912635803222656, 0.08469390869140625, 0.09026145935058594, 0.09582901000976562, 0.10139656066894531, 0.106964111328125, 0.11253166198730469, 0.11809921264648438, 0.12366676330566406, 0.12923431396484375, 0.13480186462402344, 0.14036941528320312, 0.1459369659423828, 0.1515045166015625, 0.1570720672607422, 0.16263961791992188, 0.16820716857910156, 0.17377471923828125, 0.17934226989746094, 0.18490982055664062, 0.1904773712158203, 0.196044921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 17.0, 27.0, 31.0, 40.0, 47.0, 92.0, 161.0, 276.0, 560.0, 1135.0, 2895.0, 10171.0, 66972.0, 845876.0, 101087.0, 13074.0, 3431.0, 1265.0, 583.0, 326.0, 167.0, 102.0, 68.0, 39.0, 39.0, 17.0, 18.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.46459197998046875, -0.4511566162109375, -0.43772125244140625, -0.424285888671875, -0.41085052490234375, -0.3974151611328125, -0.38397979736328125, -0.37054443359375, -0.35710906982421875, -0.3436737060546875, -0.33023834228515625, -0.316802978515625, -0.30336761474609375, -0.2899322509765625, -0.27649688720703125, -0.2630615234375, -0.24962615966796875, -0.2361907958984375, -0.22275543212890625, -0.209320068359375, -0.19588470458984375, -0.1824493408203125, -0.16901397705078125, -0.15557861328125, -0.14214324951171875, -0.1287078857421875, -0.11527252197265625, -0.101837158203125, -0.08840179443359375, -0.0749664306640625, -0.06153106689453125, -0.048095703125, -0.03466033935546875, -0.0212249755859375, -0.00778961181640625, 0.005645751953125, 0.01908111572265625, 0.0325164794921875, 0.04595184326171875, 0.05938720703125, 0.07282257080078125, 0.0862579345703125, 0.09969329833984375, 0.113128662109375, 0.12656402587890625, 0.1399993896484375, 0.15343475341796875, 0.1668701171875, 0.18030548095703125, 0.1937408447265625, 0.20717620849609375, 0.220611572265625, 0.23404693603515625, 0.2474822998046875, 0.26091766357421875, 0.27435302734375, 0.28778839111328125, 0.3012237548828125, 0.31465911865234375, 0.328094482421875, 0.34152984619140625, 0.3549652099609375, 0.36840057373046875, 0.3818359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 14.0, 22.0, 14.0, 20.0, 26.0, 30.0, 43.0, 39.0, 40.0, 35.0, 51.0, 56.0, 61.0, 52.0, 54.0, 63.0, 47.0, 47.0, 50.0, 37.0, 30.0, 27.0, 19.0, 19.0, 17.0, 12.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996780395507812, -0.5821685791015625, -0.5646591186523438, -0.547149658203125, -0.5296401977539062, -0.5121307373046875, -0.49462127685546875, -0.47711181640625, -0.45960235595703125, -0.4420928955078125, -0.42458343505859375, -0.407073974609375, -0.38956451416015625, -0.3720550537109375, -0.35454559326171875, -0.3370361328125, -0.31952667236328125, -0.3020172119140625, -0.28450775146484375, -0.266998291015625, -0.24948883056640625, -0.2319793701171875, -0.21446990966796875, -0.19696044921875, -0.17945098876953125, -0.1619415283203125, -0.14443206787109375, -0.126922607421875, -0.10941314697265625, -0.0919036865234375, -0.07439422607421875, -0.056884765625, -0.03937530517578125, -0.0218658447265625, -0.00435638427734375, 0.013153076171875, 0.03066253662109375, 0.0481719970703125, 0.06568145751953125, 0.08319091796875, 0.10070037841796875, 0.1182098388671875, 0.13571929931640625, 0.153228759765625, 0.17073822021484375, 0.1882476806640625, 0.20575714111328125, 0.2232666015625, 0.24077606201171875, 0.2582855224609375, 0.27579498291015625, 0.293304443359375, 0.31081390380859375, 0.3283233642578125, 0.34583282470703125, 0.36334228515625, 0.38085174560546875, 0.3983612060546875, 0.41587066650390625, 0.433380126953125, 0.45088958740234375, 0.4683990478515625, 0.48590850830078125, 0.50341796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 15.0, 15.0, 19.0, 21.0, 31.0, 48.0, 61.0, 90.0, 126.0, 219.0, 361.0, 722.0, 1392.0, 2931.0, 7089.0, 19007.0, 65566.0, 578260.0, 286714.0, 56531.0, 17409.0, 6269.0, 2716.0, 1278.0, 622.0, 356.0, 250.0, 120.0, 92.0, 68.0, 44.0, 28.0, 16.0, 19.0, 15.0, 15.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.07396507263183594, -0.07157516479492188, -0.06918525695800781, -0.06679534912109375, -0.06440544128417969, -0.062015533447265625, -0.05962562561035156, -0.0572357177734375, -0.05484580993652344, -0.052455902099609375, -0.05006599426269531, -0.04767608642578125, -0.04528617858886719, -0.042896270751953125, -0.04050636291503906, -0.038116455078125, -0.03572654724121094, -0.033336639404296875, -0.030946731567382812, -0.02855682373046875, -0.026166915893554688, -0.023777008056640625, -0.021387100219726562, -0.0189971923828125, -0.016607284545898438, -0.014217376708984375, -0.011827468872070312, -0.00943756103515625, -0.0070476531982421875, -0.004657745361328125, -0.0022678375244140625, 0.0001220703125, 0.0025119781494140625, 0.004901885986328125, 0.0072917938232421875, 0.00968170166015625, 0.012071609497070312, 0.014461517333984375, 0.016851425170898438, 0.0192413330078125, 0.021631240844726562, 0.024021148681640625, 0.026411056518554688, 0.02880096435546875, 0.031190872192382812, 0.033580780029296875, 0.03597068786621094, 0.038360595703125, 0.04075050354003906, 0.043140411376953125, 0.04553031921386719, 0.04792022705078125, 0.05031013488769531, 0.052700042724609375, 0.05508995056152344, 0.0574798583984375, 0.05986976623535156, 0.062259674072265625, 0.06464958190917969, 0.06703948974609375, 0.06942939758300781, 0.07181930541992188, 0.07420921325683594, 0.07659912109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 12.0, 16.0, 19.0, 39.0, 50.0, 91.0, 132.0, 164.0, 161.0, 114.0, 80.0, 49.0, 31.0, 17.0, 8.0, 10.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7610530853271484e-05, -3.6094337701797485e-05, -3.4578144550323486e-05, -3.306195139884949e-05, -3.154575824737549e-05, -3.002956509590149e-05, -2.851337194442749e-05, -2.699717879295349e-05, -2.5480985641479492e-05, -2.3964792490005493e-05, -2.2448599338531494e-05, -2.0932406187057495e-05, -1.9416213035583496e-05, -1.7900019884109497e-05, -1.6383826732635498e-05, -1.4867633581161499e-05, -1.33514404296875e-05, -1.1835247278213501e-05, -1.0319054126739502e-05, -8.802860975265503e-06, -7.286667823791504e-06, -5.770474672317505e-06, -4.254281520843506e-06, -2.738088369369507e-06, -1.2218952178955078e-06, 2.942979335784912e-07, 1.8104910850524902e-06, 3.3266842365264893e-06, 4.842877388000488e-06, 6.359070539474487e-06, 7.875263690948486e-06, 9.391456842422485e-06, 1.0907649993896484e-05, 1.2423843145370483e-05, 1.3940036296844482e-05, 1.545622944831848e-05, 1.697242259979248e-05, 1.848861575126648e-05, 2.000480890274048e-05, 2.1521002054214478e-05, 2.3037195205688477e-05, 2.4553388357162476e-05, 2.6069581508636475e-05, 2.7585774660110474e-05, 2.9101967811584473e-05, 3.061816096305847e-05, 3.213435411453247e-05, 3.365054726600647e-05, 3.516674041748047e-05, 3.668293356895447e-05, 3.819912672042847e-05, 3.9715319871902466e-05, 4.1231513023376465e-05, 4.2747706174850464e-05, 4.426389932632446e-05, 4.578009247779846e-05, 4.729628562927246e-05, 4.881247878074646e-05, 5.032867193222046e-05, 5.184486508369446e-05, 5.336105823516846e-05, 5.4877251386642456e-05, 5.6393444538116455e-05, 5.7909637689590454e-05, 5.942583084106445e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 5.0, 22.0, 13.0, 37.0, 46.0, 63.0, 101.0, 136.0, 216.0, 322.0, 567.0, 914.0, 1822.0, 3689.0, 8857.0, 24360.0, 77773.0, 555502.0, 270513.0, 66546.0, 21721.0, 7971.0, 3484.0, 1611.0, 865.0, 474.0, 299.0, 192.0, 140.0, 75.0, 69.0, 33.0, 24.0, 18.0, 12.0, 14.0, 12.0, 5.0, 5.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.058005332946777344, -0.05576896667480469, -0.05353260040283203, -0.051296234130859375, -0.04905986785888672, -0.04682350158691406, -0.044587135314941406, -0.04235076904296875, -0.040114402770996094, -0.03787803649902344, -0.03564167022705078, -0.033405303955078125, -0.03116893768310547, -0.028932571411132812, -0.026696205139160156, -0.0244598388671875, -0.022223472595214844, -0.019987106323242188, -0.01775074005126953, -0.015514373779296875, -0.013278007507324219, -0.011041641235351562, -0.008805274963378906, -0.00656890869140625, -0.004332542419433594, -0.0020961761474609375, 0.00014019012451171875, 0.002376556396484375, 0.004612922668457031, 0.0068492889404296875, 0.009085655212402344, 0.011322021484375, 0.013558387756347656, 0.015794754028320312, 0.01803112030029297, 0.020267486572265625, 0.02250385284423828, 0.024740219116210938, 0.026976585388183594, 0.02921295166015625, 0.031449317932128906, 0.03368568420410156, 0.03592205047607422, 0.038158416748046875, 0.04039478302001953, 0.04263114929199219, 0.044867515563964844, 0.0471038818359375, 0.049340248107910156, 0.05157661437988281, 0.05381298065185547, 0.056049346923828125, 0.05828571319580078, 0.06052207946777344, 0.0627584457397461, 0.06499481201171875, 0.0672311782836914, 0.06946754455566406, 0.07170391082763672, 0.07394027709960938, 0.07617664337158203, 0.07841300964355469, 0.08064937591552734, 0.0828857421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 2.0, 6.0, 5.0, 12.0, 27.0, 24.0, 29.0, 37.0, 58.0, 49.0, 71.0, 99.0, 96.0, 90.0, 85.0, 76.0, 55.0, 44.0, 28.0, 23.0, 20.0, 12.0, 10.0, 14.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10774707794189453, -0.10453224182128906, -0.1013174057006836, -0.09810256958007812, -0.09488773345947266, -0.09167289733886719, -0.08845806121826172, -0.08524322509765625, -0.08202838897705078, -0.07881355285644531, -0.07559871673583984, -0.07238388061523438, -0.0691690444946289, -0.06595420837402344, -0.06273937225341797, -0.0595245361328125, -0.05630970001220703, -0.05309486389160156, -0.049880027770996094, -0.046665191650390625, -0.043450355529785156, -0.04023551940917969, -0.03702068328857422, -0.03380584716796875, -0.03059101104736328, -0.027376174926757812, -0.024161338806152344, -0.020946502685546875, -0.017731666564941406, -0.014516830444335938, -0.011301994323730469, -0.008087158203125, -0.004872322082519531, -0.0016574859619140625, 0.0015573501586914062, 0.004772186279296875, 0.007987022399902344, 0.011201858520507812, 0.014416694641113281, 0.01763153076171875, 0.02084636688232422, 0.024061203002929688, 0.027276039123535156, 0.030490875244140625, 0.033705711364746094, 0.03692054748535156, 0.04013538360595703, 0.0433502197265625, 0.04656505584716797, 0.04977989196777344, 0.052994728088378906, 0.056209564208984375, 0.059424400329589844, 0.06263923645019531, 0.06585407257080078, 0.06906890869140625, 0.07228374481201172, 0.07549858093261719, 0.07871341705322266, 0.08192825317382812, 0.0851430892944336, 0.08835792541503906, 0.09157276153564453, 0.09478759765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 13.0, 30.0, 52.0, 145.0, 395.0, 190.0, 94.0, 38.0, 18.0, 8.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1198501586914062, -3.0021679401397705, -2.8844857215881348, -2.76680326461792, -2.649121046066284, -2.5314388275146484, -2.4137563705444336, -2.296074151992798, -2.178391933441162, -2.0607097148895264, -1.943027377128601, -1.8253450393676758, -1.70766282081604, -1.5899806022644043, -1.472298264503479, -1.3546159267425537, -1.236933708190918, -1.1192514896392822, -1.001569151878357, -0.8838868737220764, -0.7662045955657959, -0.6485223174095154, -0.5308400392532349, -0.41315776109695435, -0.29547548294067383, -0.1777932047843933, -0.06011092662811279, 0.057571351528167725, 0.17525362968444824, 0.29293590784072876, 0.4106181859970093, 0.5283004641532898, 0.6459827423095703, 0.7636650204658508, 0.8813472986221313, 0.9990295767784119, 1.1167118549346924, 1.2343940734863281, 1.3520764112472534, 1.4697587490081787, 1.5874409675598145, 1.7051231861114502, 1.8228055238723755, 1.9404878616333008, 2.0581700801849365, 2.1758522987365723, 2.293534755706787, 2.411216974258423, 2.5288991928100586, 2.6465814113616943, 2.76426362991333, 2.881946086883545, 2.9996283054351807, 3.1173105239868164, 3.2349929809570312, 3.352675199508667, 3.4703574180603027, 3.5880396366119385, 3.705721855163574, 3.823404312133789, 3.941086530685425, 4.0587687492370605, 4.176451206207275, 4.294133186340332, 4.411815643310547]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 1.0, 8.0, 9.0, 8.0, 7.0, 9.0, 13.0, 20.0, 24.0, 21.0, 24.0, 30.0, 33.0, 53.0, 41.0, 95.0, 111.0, 123.0, 78.0, 45.0, 36.0, 23.0, 26.0, 40.0, 24.0, 17.0, 16.0, 16.0, 7.0, 6.0, 9.0, 4.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9430243968963623, -1.8712377548217773, -1.7994511127471924, -1.7276644706726074, -1.6558778285980225, -1.5840911865234375, -1.512304425239563, -1.440517783164978, -1.368731141090393, -1.296944499015808, -1.2251578569412231, -1.1533712148666382, -1.0815844535827637, -1.0097978115081787, -0.9380111694335938, -0.8662245273590088, -0.7944378852844238, -0.7226512432098389, -0.6508646011352539, -0.5790778994560242, -0.5072912573814392, -0.43550461530685425, -0.3637179434299469, -0.29193127155303955, -0.2201446294784546, -0.14835797250270844, -0.07657131552696228, -0.0047846585512161255, 0.06700199842453003, 0.138788640499115, 0.21057531237602234, 0.2823619842529297, 0.35414886474609375, 0.4259355068206787, 0.49772217869758606, 0.5695088505744934, 0.6412954926490784, 0.7130821347236633, 0.7848688364028931, 0.856655478477478, 0.928442120552063, 1.000228762626648, 1.072015404701233, 1.1438020467758179, 1.2155888080596924, 1.2873754501342773, 1.3591620922088623, 1.4309487342834473, 1.5027353763580322, 1.5745220184326172, 1.6463086605072021, 1.718095302581787, 1.789881944656372, 1.861668586730957, 1.9334553480148315, 2.005241870880127, 2.077028751373291, 2.148815393447876, 2.220602035522461, 2.292388677597046, 2.364175319671631, 2.435961961746216, 2.507748603820801, 2.579535484313965, 2.6513218879699707]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 12.0, 18.0, 29.0, 44.0, 69.0, 109.0, 219.0, 326.0, 577.0, 931.0, 1560.0, 2929.0, 5842.0, 11608.0, 25967.0, 67381.0, 209872.0, 718566.0, 1725985.0, 977459.0, 292639.0, 88269.0, 33125.0, 14784.0, 7118.0, 3802.0, 2064.0, 1191.0, 665.0, 391.0, 267.0, 176.0, 103.0, 68.0, 47.0, 19.0, 14.0, 10.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15789222717285156, -0.15196609497070312, -0.1460399627685547, -0.14011383056640625, -0.1341876983642578, -0.12826156616210938, -0.12233543395996094, -0.1164093017578125, -0.11048316955566406, -0.10455703735351562, -0.09863090515136719, -0.09270477294921875, -0.08677864074707031, -0.08085250854492188, -0.07492637634277344, -0.069000244140625, -0.06307411193847656, -0.057147979736328125, -0.05122184753417969, -0.04529571533203125, -0.03936958312988281, -0.033443450927734375, -0.027517318725585938, -0.0215911865234375, -0.015665054321289062, -0.009738922119140625, -0.0038127899169921875, 0.00211334228515625, 0.008039474487304688, 0.013965606689453125, 0.019891738891601562, 0.02581787109375, 0.03174400329589844, 0.037670135498046875, 0.04359626770019531, 0.04952239990234375, 0.05544853210449219, 0.061374664306640625, 0.06730079650878906, 0.0732269287109375, 0.07915306091308594, 0.08507919311523438, 0.09100532531738281, 0.09693145751953125, 0.10285758972167969, 0.10878372192382812, 0.11470985412597656, 0.120635986328125, 0.12656211853027344, 0.13248825073242188, 0.1384143829345703, 0.14434051513671875, 0.1502666473388672, 0.15619277954101562, 0.16211891174316406, 0.1680450439453125, 0.17397117614746094, 0.17989730834960938, 0.1858234405517578, 0.19174957275390625, 0.1976757049560547, 0.20360183715820312, 0.20952796936035156, 0.2154541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 15.0, 27.0, 22.0, 28.0, 37.0, 45.0, 48.0, 51.0, 43.0, 64.0, 49.0, 46.0, 48.0, 54.0, 43.0, 46.0, 43.0, 32.0, 44.0, 30.0, 33.0, 27.0, 13.0, 18.0, 11.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1119384765625, -0.10716056823730469, -0.10238265991210938, -0.09760475158691406, -0.09282684326171875, -0.08804893493652344, -0.08327102661132812, -0.07849311828613281, -0.0737152099609375, -0.06893730163574219, -0.06415939331054688, -0.05938148498535156, -0.05460357666015625, -0.04982566833496094, -0.045047760009765625, -0.04026985168457031, -0.035491943359375, -0.030714035034179688, -0.025936126708984375, -0.021158218383789062, -0.01638031005859375, -0.011602401733398438, -0.006824493408203125, -0.0020465850830078125, 0.0027313232421875, 0.0075092315673828125, 0.012287139892578125, 0.017065048217773438, 0.02184295654296875, 0.026620864868164062, 0.031398773193359375, 0.03617668151855469, 0.04095458984375, 0.04573249816894531, 0.050510406494140625, 0.05528831481933594, 0.06006622314453125, 0.06484413146972656, 0.06962203979492188, 0.07439994812011719, 0.0791778564453125, 0.08395576477050781, 0.08873367309570312, 0.09351158142089844, 0.09828948974609375, 0.10306739807128906, 0.10784530639648438, 0.11262321472167969, 0.117401123046875, 0.12217903137207031, 0.12695693969726562, 0.13173484802246094, 0.13651275634765625, 0.14129066467285156, 0.14606857299804688, 0.1508464813232422, 0.1556243896484375, 0.1604022979736328, 0.16518020629882812, 0.16995811462402344, 0.17473602294921875, 0.17951393127441406, 0.18429183959960938, 0.1890697479248047, 0.19384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 11.0, 18.0, 22.0, 37.0, 63.0, 104.0, 241.0, 506.0, 1368.0, 8017.0, 2181553.0, 1992035.0, 8033.0, 1276.0, 484.0, 221.0, 131.0, 69.0, 37.0, 19.0, 15.0, 1.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8212890625, -1.7789306640625, -1.736572265625, -1.6942138671875, -1.65185546875, -1.6094970703125, -1.567138671875, -1.5247802734375, -1.482421875, -1.4400634765625, -1.397705078125, -1.3553466796875, -1.31298828125, -1.2706298828125, -1.228271484375, -1.1859130859375, -1.1435546875, -1.1011962890625, -1.058837890625, -1.0164794921875, -0.97412109375, -0.9317626953125, -0.889404296875, -0.8470458984375, -0.8046875, -0.7623291015625, -0.719970703125, -0.6776123046875, -0.63525390625, -0.5928955078125, -0.550537109375, -0.5081787109375, -0.4658203125, -0.4234619140625, -0.381103515625, -0.3387451171875, -0.29638671875, -0.2540283203125, -0.211669921875, -0.1693115234375, -0.126953125, -0.0845947265625, -0.042236328125, 0.0001220703125, 0.04248046875, 0.0848388671875, 0.127197265625, 0.1695556640625, 0.2119140625, 0.2542724609375, 0.296630859375, 0.3389892578125, 0.38134765625, 0.4237060546875, 0.466064453125, 0.5084228515625, 0.55078125, 0.5931396484375, 0.635498046875, 0.6778564453125, 0.72021484375, 0.7625732421875, 0.804931640625, 0.8472900390625, 0.8896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 13.0, 9.0, 26.0, 18.0, 33.0, 49.0, 69.0, 94.0, 131.0, 209.0, 313.0, 476.0, 700.0, 601.0, 405.0, 251.0, 200.0, 135.0, 104.0, 74.0, 47.0, 33.0, 26.0, 20.0, 15.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5709953308105469, -0.5550765991210938, -0.5391578674316406, -0.5232391357421875, -0.5073204040527344, -0.49140167236328125, -0.4754829406738281, -0.459564208984375, -0.4436454772949219, -0.42772674560546875, -0.4118080139160156, -0.3958892822265625, -0.3799705505371094, -0.36405181884765625, -0.3481330871582031, -0.33221435546875, -0.3162956237792969, -0.30037689208984375, -0.2844581604003906, -0.2685394287109375, -0.2526206970214844, -0.23670196533203125, -0.22078323364257812, -0.204864501953125, -0.18894577026367188, -0.17302703857421875, -0.15710830688476562, -0.1411895751953125, -0.12527084350585938, -0.10935211181640625, -0.09343338012695312, -0.0775146484375, -0.061595916748046875, -0.04567718505859375, -0.029758453369140625, -0.0138397216796875, 0.002079010009765625, 0.01799774169921875, 0.033916473388671875, 0.049835205078125, 0.06575393676757812, 0.08167266845703125, 0.09759140014648438, 0.1135101318359375, 0.12942886352539062, 0.14534759521484375, 0.16126632690429688, 0.17718505859375, 0.19310379028320312, 0.20902252197265625, 0.22494125366210938, 0.2408599853515625, 0.2567787170410156, 0.27269744873046875, 0.2886161804199219, 0.304534912109375, 0.3204536437988281, 0.33637237548828125, 0.3522911071777344, 0.3682098388671875, 0.3841285705566406, 0.40004730224609375, 0.4159660339355469, 0.431884765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 6.0, 6.0, 19.0, 37.0, 70.0, 166.0, 283.0, 213.0, 99.0, 51.0, 19.0, 14.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.26026725769043, -11.991594314575195, -11.722922325134277, -11.454249382019043, -11.185577392578125, -10.91690444946289, -10.648231506347656, -10.379559516906738, -10.110886573791504, -9.84221363067627, -9.573541641235352, -9.304868698120117, -9.036195755004883, -8.767523765563965, -8.49885082244873, -8.230178833007812, -7.961505889892578, -7.692833423614502, -7.424160957336426, -7.155488014221191, -6.886815547943115, -6.618143081665039, -6.349470138549805, -6.0807976722717285, -5.812125205993652, -5.543452739715576, -5.2747802734375, -5.006107330322266, -4.7374348640441895, -4.468762397766113, -4.200089454650879, -3.9314169883728027, -3.6627445220947266, -3.3940720558166504, -3.125399351119995, -2.85672664642334, -2.5880541801452637, -2.3193817138671875, -2.0507090091705322, -1.7820364236831665, -1.5133638381958008, -1.244691252708435, -0.9760186672210693, -0.7073460817337036, -0.4386734962463379, -0.17000091075897217, 0.09867167472839355, 0.3673442602157593, 0.636016845703125, 0.9046894311904907, 1.1733620166778564, 1.4420346021652222, 1.710707187652588, 1.9793797731399536, 2.2480523586273193, 2.5167250633239746, 2.785397529602051, 3.054069995880127, 3.3227427005767822, 3.5914154052734375, 3.8600878715515137, 4.12876033782959, 4.397433280944824, 4.6661057472229, 4.934778213500977]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 4.0, 8.0, 9.0, 14.0, 16.0, 24.0, 17.0, 23.0, 27.0, 31.0, 38.0, 33.0, 37.0, 62.0, 61.0, 76.0, 70.0, 66.0, 55.0, 45.0, 38.0, 46.0, 32.0, 21.0, 16.0, 19.0, 15.0, 26.0, 17.0, 12.0, 10.0, 11.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.313432455062866, -2.2276346683502197, -2.1418368816375732, -2.0560390949249268, -1.9702411890029907, -1.8844434022903442, -1.7986454963684082, -1.7128477096557617, -1.6270499229431152, -1.5412521362304688, -1.4554543495178223, -1.3696564435958862, -1.2838586568832397, -1.1980608701705933, -1.1122629642486572, -1.0264651775360107, -0.9406673908233643, -0.8548696041107178, -0.7690717577934265, -0.6832739114761353, -0.5974761247634888, -0.5116783380508423, -0.425880491733551, -0.34008264541625977, -0.2542848587036133, -0.1684870421886444, -0.08268922567367554, 0.003108590841293335, 0.08890640735626221, 0.17470422387123108, 0.26050204038619995, 0.3462998867034912, 0.4320974349975586, 0.5178952217102051, 0.6036930680274963, 0.6894909143447876, 0.7752887010574341, 0.8610864877700806, 0.9468843340873718, 1.032682180404663, 1.1184799671173096, 1.204277753829956, 1.2900755405426025, 1.3758734464645386, 1.461671233177185, 1.5474690198898315, 1.6332669258117676, 1.719064712524414, 1.8048624992370605, 1.890660285949707, 1.9764580726623535, 2.062255859375, 2.1480536460876465, 2.233851671218872, 2.3196494579315186, 2.405447244644165, 2.4912450313568115, 2.577042818069458, 2.6628406047821045, 2.748638391494751, 2.8344364166259766, 2.920234203338623, 3.0060319900512695, 3.091829776763916, 3.1776275634765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 18.0, 18.0, 47.0, 64.0, 105.0, 118.0, 228.0, 433.0, 857.0, 2091.0, 5885.0, 18699.0, 84983.0, 676636.0, 208585.0, 34354.0, 9437.0, 3298.0, 1316.0, 538.0, 326.0, 155.0, 98.0, 60.0, 34.0, 36.0, 28.0, 18.0, 12.0, 11.0, 9.0, 10.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33882904052734375, -0.3287811279296875, -0.31873321533203125, -0.308685302734375, -0.29863739013671875, -0.2885894775390625, -0.27854156494140625, -0.26849365234375, -0.25844573974609375, -0.2483978271484375, -0.23834991455078125, -0.228302001953125, -0.21825408935546875, -0.2082061767578125, -0.19815826416015625, -0.1881103515625, -0.17806243896484375, -0.1680145263671875, -0.15796661376953125, -0.147918701171875, -0.13787078857421875, -0.1278228759765625, -0.11777496337890625, -0.10772705078125, -0.09767913818359375, -0.0876312255859375, -0.07758331298828125, -0.067535400390625, -0.05748748779296875, -0.0474395751953125, -0.03739166259765625, -0.02734375, -0.01729583740234375, -0.0072479248046875, 0.00279998779296875, 0.012847900390625, 0.02289581298828125, 0.0329437255859375, 0.04299163818359375, 0.05303955078125, 0.06308746337890625, 0.0731353759765625, 0.08318328857421875, 0.093231201171875, 0.10327911376953125, 0.1133270263671875, 0.12337493896484375, 0.1334228515625, 0.14347076416015625, 0.1535186767578125, 0.16356658935546875, 0.173614501953125, 0.18366241455078125, 0.1937103271484375, 0.20375823974609375, 0.21380615234375, 0.22385406494140625, 0.2339019775390625, 0.24394989013671875, 0.253997802734375, 0.26404571533203125, 0.2740936279296875, 0.28414154052734375, 0.294189453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 10.0, 11.0, 15.0, 20.0, 18.0, 22.0, 38.0, 24.0, 28.0, 44.0, 49.0, 58.0, 67.0, 45.0, 49.0, 44.0, 49.0, 53.0, 47.0, 41.0, 35.0, 39.0, 30.0, 29.0, 25.0, 15.0, 14.0, 7.0, 11.0, 7.0, 12.0, 2.0, 7.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19921875, -0.19310760498046875, -0.1869964599609375, -0.18088531494140625, -0.174774169921875, -0.16866302490234375, -0.1625518798828125, -0.15644073486328125, -0.15032958984375, -0.14421844482421875, -0.1381072998046875, -0.13199615478515625, -0.125885009765625, -0.11977386474609375, -0.1136627197265625, -0.10755157470703125, -0.1014404296875, -0.09532928466796875, -0.0892181396484375, -0.08310699462890625, -0.076995849609375, -0.07088470458984375, -0.0647735595703125, -0.05866241455078125, -0.05255126953125, -0.04644012451171875, -0.0403289794921875, -0.03421783447265625, -0.028106689453125, -0.02199554443359375, -0.0158843994140625, -0.00977325439453125, -0.003662109375, 0.00244903564453125, 0.0085601806640625, 0.01467132568359375, 0.020782470703125, 0.02689361572265625, 0.0330047607421875, 0.03911590576171875, 0.04522705078125, 0.05133819580078125, 0.0574493408203125, 0.06356048583984375, 0.069671630859375, 0.07578277587890625, 0.0818939208984375, 0.08800506591796875, 0.0941162109375, 0.10022735595703125, 0.1063385009765625, 0.11244964599609375, 0.118560791015625, 0.12467193603515625, 0.1307830810546875, 0.13689422607421875, 0.14300537109375, 0.14911651611328125, 0.1552276611328125, 0.16133880615234375, 0.167449951171875, 0.17356109619140625, 0.1796722412109375, 0.18578338623046875, 0.19189453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 15.0, 7.0, 12.0, 22.0, 32.0, 57.0, 72.0, 126.0, 225.0, 483.0, 1171.0, 3884.0, 25038.0, 883539.0, 118919.0, 10877.0, 2361.0, 815.0, 382.0, 203.0, 117.0, 60.0, 37.0, 25.0, 16.0, 18.0, 8.0, 7.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.41927337646484375, -0.4047088623046875, -0.39014434814453125, -0.375579833984375, -0.36101531982421875, -0.3464508056640625, -0.33188629150390625, -0.31732177734375, -0.30275726318359375, -0.2881927490234375, -0.27362823486328125, -0.259063720703125, -0.24449920654296875, -0.2299346923828125, -0.21537017822265625, -0.2008056640625, -0.18624114990234375, -0.1716766357421875, -0.15711212158203125, -0.142547607421875, -0.12798309326171875, -0.1134185791015625, -0.09885406494140625, -0.08428955078125, -0.06972503662109375, -0.0551605224609375, -0.04059600830078125, -0.026031494140625, -0.01146697998046875, 0.0030975341796875, 0.01766204833984375, 0.0322265625, 0.04679107666015625, 0.0613555908203125, 0.07592010498046875, 0.090484619140625, 0.10504913330078125, 0.1196136474609375, 0.13417816162109375, 0.14874267578125, 0.16330718994140625, 0.1778717041015625, 0.19243621826171875, 0.207000732421875, 0.22156524658203125, 0.2361297607421875, 0.25069427490234375, 0.2652587890625, 0.27982330322265625, 0.2943878173828125, 0.30895233154296875, 0.323516845703125, 0.33808135986328125, 0.3526458740234375, 0.36721038818359375, 0.38177490234375, 0.39633941650390625, 0.4109039306640625, 0.42546844482421875, 0.440032958984375, 0.45459747314453125, 0.4691619873046875, 0.48372650146484375, 0.498291015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 10.0, 11.0, 18.0, 12.0, 12.0, 30.0, 25.0, 36.0, 41.0, 58.0, 73.0, 78.0, 97.0, 72.0, 56.0, 50.0, 40.0, 37.0, 35.0, 31.0, 25.0, 23.0, 14.0, 16.0, 18.0, 8.0, 5.0, 13.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7234573364257812, -0.6988677978515625, -0.6742782592773438, -0.649688720703125, -0.6250991821289062, -0.6005096435546875, -0.5759201049804688, -0.55133056640625, -0.5267410278320312, -0.5021514892578125, -0.47756195068359375, -0.452972412109375, -0.42838287353515625, -0.4037933349609375, -0.37920379638671875, -0.3546142578125, -0.33002471923828125, -0.3054351806640625, -0.28084564208984375, -0.256256103515625, -0.23166656494140625, -0.2070770263671875, -0.18248748779296875, -0.15789794921875, -0.13330841064453125, -0.1087188720703125, -0.08412933349609375, -0.059539794921875, -0.03495025634765625, -0.0103607177734375, 0.01422882080078125, 0.038818359375, 0.06340789794921875, 0.0879974365234375, 0.11258697509765625, 0.137176513671875, 0.16176605224609375, 0.1863555908203125, 0.21094512939453125, 0.23553466796875, 0.26012420654296875, 0.2847137451171875, 0.30930328369140625, 0.333892822265625, 0.35848236083984375, 0.3830718994140625, 0.40766143798828125, 0.4322509765625, 0.45684051513671875, 0.4814300537109375, 0.5060195922851562, 0.530609130859375, 0.5551986694335938, 0.5797882080078125, 0.6043777465820312, 0.62896728515625, 0.6535568237304688, 0.6781463623046875, 0.7027359008789062, 0.727325439453125, 0.7519149780273438, 0.7765045166015625, 0.8010940551757812, 0.82568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 3.0, 7.0, 4.0, 11.0, 13.0, 9.0, 15.0, 20.0, 28.0, 39.0, 45.0, 64.0, 83.0, 127.0, 167.0, 316.0, 487.0, 787.0, 1327.0, 2666.0, 5718.0, 13841.0, 42385.0, 233341.0, 673081.0, 46450.0, 14892.0, 6161.0, 2779.0, 1397.0, 832.0, 469.0, 331.0, 187.0, 118.0, 92.0, 62.0, 44.0, 22.0, 22.0, 21.0, 10.0, 12.0, 10.0, 12.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.045866966247558594, -0.04434013366699219, -0.04281330108642578, -0.041286468505859375, -0.03975963592529297, -0.03823280334472656, -0.036705970764160156, -0.03517913818359375, -0.033652305603027344, -0.03212547302246094, -0.03059864044189453, -0.029071807861328125, -0.02754497528076172, -0.026018142700195312, -0.024491310119628906, -0.0229644775390625, -0.021437644958496094, -0.019910812377929688, -0.01838397979736328, -0.016857147216796875, -0.015330314636230469, -0.013803482055664062, -0.012276649475097656, -0.01074981689453125, -0.009222984313964844, -0.0076961517333984375, -0.006169319152832031, -0.004642486572265625, -0.0031156539916992188, -0.0015888214111328125, -6.198883056640625e-05, 0.00146484375, 0.0029916763305664062, 0.0045185089111328125, 0.006045341491699219, 0.007572174072265625, 0.009099006652832031, 0.010625839233398438, 0.012152671813964844, 0.01367950439453125, 0.015206336975097656, 0.016733169555664062, 0.01826000213623047, 0.019786834716796875, 0.02131366729736328, 0.022840499877929688, 0.024367332458496094, 0.0258941650390625, 0.027420997619628906, 0.028947830200195312, 0.03047466278076172, 0.032001495361328125, 0.03352832794189453, 0.03505516052246094, 0.036581993103027344, 0.03810882568359375, 0.039635658264160156, 0.04116249084472656, 0.04268932342529297, 0.044216156005859375, 0.04574298858642578, 0.04726982116699219, 0.048796653747558594, 0.050323486328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 12.0, 14.0, 12.0, 17.0, 19.0, 38.0, 44.0, 96.0, 108.0, 115.0, 117.0, 114.0, 71.0, 55.0, 37.0, 25.0, 24.0, 18.0, 12.0, 17.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.24249267578125e-05, -3.141164779663086e-05, -3.039836883544922e-05, -2.9385089874267578e-05, -2.8371810913085938e-05, -2.7358531951904297e-05, -2.6345252990722656e-05, -2.5331974029541016e-05, -2.4318695068359375e-05, -2.3305416107177734e-05, -2.2292137145996094e-05, -2.1278858184814453e-05, -2.0265579223632812e-05, -1.9252300262451172e-05, -1.823902130126953e-05, -1.722574234008789e-05, -1.621246337890625e-05, -1.519918441772461e-05, -1.4185905456542969e-05, -1.3172626495361328e-05, -1.2159347534179688e-05, -1.1146068572998047e-05, -1.0132789611816406e-05, -9.119510650634766e-06, -8.106231689453125e-06, -7.092952728271484e-06, -6.079673767089844e-06, -5.066394805908203e-06, -4.0531158447265625e-06, -3.039836883544922e-06, -2.0265579223632812e-06, -1.0132789611816406e-06, 0.0, 1.0132789611816406e-06, 2.0265579223632812e-06, 3.039836883544922e-06, 4.0531158447265625e-06, 5.066394805908203e-06, 6.079673767089844e-06, 7.092952728271484e-06, 8.106231689453125e-06, 9.119510650634766e-06, 1.0132789611816406e-05, 1.1146068572998047e-05, 1.2159347534179688e-05, 1.3172626495361328e-05, 1.4185905456542969e-05, 1.519918441772461e-05, 1.621246337890625e-05, 1.722574234008789e-05, 1.823902130126953e-05, 1.9252300262451172e-05, 2.0265579223632812e-05, 2.1278858184814453e-05, 2.2292137145996094e-05, 2.3305416107177734e-05, 2.4318695068359375e-05, 2.5331974029541016e-05, 2.6345252990722656e-05, 2.7358531951904297e-05, 2.8371810913085938e-05, 2.9385089874267578e-05, 3.039836883544922e-05, 3.141164779663086e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 13.0, 16.0, 23.0, 61.0, 75.0, 99.0, 173.0, 277.0, 459.0, 890.0, 1632.0, 3374.0, 7893.0, 21603.0, 80445.0, 781310.0, 107366.0, 25591.0, 9090.0, 3901.0, 1879.0, 963.0, 517.0, 339.0, 177.0, 109.0, 86.0, 57.0, 35.0, 15.0, 13.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05322265625, -0.051482200622558594, -0.04974174499511719, -0.04800128936767578, -0.046260833740234375, -0.04452037811279297, -0.04277992248535156, -0.041039466857910156, -0.03929901123046875, -0.037558555603027344, -0.03581809997558594, -0.03407764434814453, -0.032337188720703125, -0.03059673309326172, -0.028856277465820312, -0.027115821838378906, -0.0253753662109375, -0.023634910583496094, -0.021894454956054688, -0.02015399932861328, -0.018413543701171875, -0.01667308807373047, -0.014932632446289062, -0.013192176818847656, -0.01145172119140625, -0.009711265563964844, -0.007970809936523438, -0.006230354309082031, -0.004489898681640625, -0.0027494430541992188, -0.0010089874267578125, 0.0007314682006835938, 0.002471923828125, 0.004212379455566406, 0.0059528350830078125, 0.007693290710449219, 0.009433746337890625, 0.011174201965332031, 0.012914657592773438, 0.014655113220214844, 0.01639556884765625, 0.018136024475097656, 0.019876480102539062, 0.02161693572998047, 0.023357391357421875, 0.02509784698486328, 0.026838302612304688, 0.028578758239746094, 0.0303192138671875, 0.032059669494628906, 0.03380012512207031, 0.03554058074951172, 0.037281036376953125, 0.03902149200439453, 0.04076194763183594, 0.042502403259277344, 0.04424285888671875, 0.045983314514160156, 0.04772377014160156, 0.04946422576904297, 0.051204681396484375, 0.05294513702392578, 0.05468559265136719, 0.056426048278808594, 0.05816650390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 7.0, 13.0, 12.0, 21.0, 28.0, 34.0, 49.0, 99.0, 169.0, 189.0, 127.0, 72.0, 51.0, 19.0, 17.0, 21.0, 19.0, 9.0, 10.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146484375, -0.14219284057617188, -0.13790130615234375, -0.13360977172851562, -0.1293182373046875, -0.12502670288085938, -0.12073516845703125, -0.11644363403320312, -0.112152099609375, -0.10786056518554688, -0.10356903076171875, -0.09927749633789062, -0.0949859619140625, -0.09069442749023438, -0.08640289306640625, -0.08211135864257812, -0.07781982421875, -0.07352828979492188, -0.06923675537109375, -0.06494522094726562, -0.0606536865234375, -0.056362152099609375, -0.05207061767578125, -0.047779083251953125, -0.043487548828125, -0.039196014404296875, -0.03490447998046875, -0.030612945556640625, -0.0263214111328125, -0.022029876708984375, -0.01773834228515625, -0.013446807861328125, -0.0091552734375, -0.004863739013671875, -0.00057220458984375, 0.003719329833984375, 0.0080108642578125, 0.012302398681640625, 0.01659393310546875, 0.020885467529296875, 0.025177001953125, 0.029468536376953125, 0.03376007080078125, 0.038051605224609375, 0.0423431396484375, 0.046634674072265625, 0.05092620849609375, 0.055217742919921875, 0.05950927734375, 0.06380081176757812, 0.06809234619140625, 0.07238388061523438, 0.0766754150390625, 0.08096694946289062, 0.08525848388671875, 0.08955001831054688, 0.093841552734375, 0.09813308715820312, 0.10242462158203125, 0.10671615600585938, 0.1110076904296875, 0.11529922485351562, 0.11959075927734375, 0.12388229370117188, 0.128173828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 11.0, 10.0, 34.0, 74.0, 316.0, 400.0, 94.0, 37.0, 14.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525306224822998, -2.3678910732269287, -2.2104761600494385, -2.053061008453369, -1.8956459760665894, -1.7382309436798096, -1.5808157920837402, -1.4234007596969604, -1.2659857273101807, -1.1085706949234009, -0.9511556029319763, -0.7937405109405518, -0.636325478553772, -0.4789104461669922, -0.3214953541755676, -0.16408026218414307, -0.006665229797363281, 0.1507498323917389, 0.30816489458084106, 0.46557995676994324, 0.6229950189590454, 0.7804100513458252, 0.9378251433372498, 1.0952402353286743, 1.252655267715454, 1.4100703001022339, 1.5674853324890137, 1.724900484085083, 1.8823155164718628, 2.0397305488586426, 2.197145700454712, 2.3545608520507812, 2.5119762420654297, 2.669391393661499, 2.8268063068389893, 2.9842214584350586, 3.141636371612549, 3.299051523208618, 3.4564666748046875, 3.6138815879821777, 3.771296739578247, 3.9287118911743164, 4.086126804351807, 4.243541717529297, 4.400957107543945, 4.5583720207214355, 4.715786933898926, 4.873202323913574, 5.0306172370910645, 5.188032150268555, 5.345447540283203, 5.502862453460693, 5.660277366638184, 5.817692756652832, 5.975107669830322, 6.1325225830078125, 6.289937973022461, 6.447352886199951, 6.6047682762146, 6.76218318939209, 6.91959810256958, 7.07701301574707, 7.234428405761719, 7.391843318939209, 7.549258232116699]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 10.0, 3.0, 2.0, 6.0, 6.0, 5.0, 12.0, 5.0, 16.0, 12.0, 14.0, 22.0, 27.0, 18.0, 37.0, 58.0, 96.0, 106.0, 97.0, 96.0, 88.0, 51.0, 24.0, 25.0, 19.0, 18.0, 18.0, 20.0, 9.0, 14.0, 6.0, 10.0, 7.0, 7.0, 7.0, 1.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-2.1506664752960205, -2.091336488723755, -2.0320067405700684, -1.9726767539978027, -1.913346767425537, -1.854016900062561, -1.794687032699585, -1.7353570461273193, -1.6760271787643433, -1.6166973114013672, -1.5573673248291016, -1.4980374574661255, -1.4387074708938599, -1.3793776035308838, -1.3200476169586182, -1.260717749595642, -1.201387882232666, -1.14205801486969, -1.0827280282974243, -1.0233981609344482, -0.9640682339668274, -0.9047383069992065, -0.8454083800315857, -0.7860784530639648, -0.7267484664916992, -0.6674185395240784, -0.6080886125564575, -0.5487587451934814, -0.4894288182258606, -0.43009889125823975, -0.3707689642906189, -0.31143906712532043, -0.252109169960022, -0.19277925789356232, -0.13344934582710266, -0.07411941885948181, -0.014789506793022156, 0.0445404052734375, 0.10387033224105835, 0.1632002294063568, 0.22253015637397766, 0.2818600833415985, 0.341189980506897, 0.4005199074745178, 0.45984983444213867, 0.5191797018051147, 0.5785096883773804, 0.6378395557403564, 0.6971694827079773, 0.7564994096755981, 0.815829336643219, 0.8751592636108398, 0.9344891309738159, 0.9938190579414368, 1.0531489849090576, 1.1124788522720337, 1.1718088388442993, 1.2311387062072754, 1.290468692779541, 1.349798560142517, 1.4091285467147827, 1.4684584140777588, 1.5277884006500244, 1.5871182680130005, 1.6464481353759766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 9.0, 9.0, 25.0, 21.0, 24.0, 24.0, 25.0, 35.0, 36.0, 36.0, 43.0, 75.0, 178.0, 122.0, 37.0, 38.0, 28.0, 35.0, 28.0, 14.0, 21.0, 18.0, 14.0, 12.0, 12.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17202186584472656, -0.16643142700195312, -0.1608409881591797, -0.15525054931640625, -0.1496601104736328, -0.14406967163085938, -0.13847923278808594, -0.1328887939453125, -0.12729835510253906, -0.12170791625976562, -0.11611747741699219, -0.11052703857421875, -0.10493659973144531, -0.09934616088867188, -0.09375572204589844, -0.088165283203125, -0.08257484436035156, -0.07698440551757812, -0.07139396667480469, -0.06580352783203125, -0.06021308898925781, -0.054622650146484375, -0.04903221130371094, -0.0434417724609375, -0.03785133361816406, -0.032260894775390625, -0.026670455932617188, -0.02108001708984375, -0.015489578247070312, -0.009899139404296875, -0.0043087005615234375, 0.00128173828125, 0.0068721771240234375, 0.012462615966796875, 0.018053054809570312, 0.02364349365234375, 0.029233932495117188, 0.034824371337890625, 0.04041481018066406, 0.0460052490234375, 0.05159568786621094, 0.057186126708984375, 0.06277656555175781, 0.06836700439453125, 0.07395744323730469, 0.07954788208007812, 0.08513832092285156, 0.090728759765625, 0.09631919860839844, 0.10190963745117188, 0.10750007629394531, 0.11309051513671875, 0.11868095397949219, 0.12427139282226562, 0.12986183166503906, 0.1354522705078125, 0.14104270935058594, 0.14663314819335938, 0.1522235870361328, 0.15781402587890625, 0.1634044647216797, 0.16899490356445312, 0.17458534240722656, 0.18017578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 6.0, 7.0, 4.0, 7.0, 3.0, 2.0, 7.0, 4.0, 9.0, 16.0, 35.0, 44.0, 46.0, 92.0, 125.0, 221.0, 619.0, 1842.0, 7046.0, 775399.0, 7592187.0, 7675.0, 1837.0, 650.0, 255.0, 160.0, 71.0, 53.0, 30.0, 41.0, 19.0, 16.0, 12.0, 10.0, 10.0, 6.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.56608247756958, -1.5213700532913208, -1.476657509803772, -1.4319450855255127, -1.3872326612472534, -1.3425201177597046, -1.2978076934814453, -1.2530951499938965, -1.2083827257156372, -1.163670301437378, -1.118957757949829, -1.0742453336715698, -1.0295329093933105, -0.9848203659057617, -0.9401079416275024, -0.8953954577445984, -0.8506830334663391, -0.8059705495834351, -0.7612581253051758, -0.7165456414222717, -0.6718331575393677, -0.6271207332611084, -0.5824082493782043, -0.5376957654953003, -0.49298331141471863, -0.44827085733413696, -0.4035583734512329, -0.35884591937065125, -0.3141334652900696, -0.2694209814071655, -0.22470852732658386, -0.1799960434436798, -0.13528358936309814, -0.09057112038135529, -0.045858658850193024, -0.0011461973190307617, 0.0435662716627121, 0.08827874064445496, 0.13299119472503662, 0.17770367860794067, 0.22241613268852234, 0.267128586769104, 0.31184107065200806, 0.3565535247325897, 0.4012659788131714, 0.44597846269607544, 0.4906909167766571, 0.5354033708572388, 0.5801158547401428, 0.6248283386230469, 0.6695407629013062, 0.7142532467842102, 0.7589657306671143, 0.8036781549453735, 0.8483906388282776, 0.8931031227111816, 0.9378155469894409, 0.982528030872345, 1.027240514755249, 1.0719529390335083, 1.1166653633117676, 1.1613779067993164, 1.2060903310775757, 1.250802755355835, 1.2955152988433838]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 4.0, 6.0, 9.0, 5.0, 4.0, 3.0, 4.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.898141384124756, -2.814516544342041, -2.730891704559326, -2.6472666263580322, -2.5636417865753174, -2.4800169467926025, -2.3963918685913086, -2.3127670288085938, -2.229142189025879, -2.145517349243164, -2.061892509460449, -1.9782674312591553, -1.8946425914764404, -1.8110177516937256, -1.7273927927017212, -1.6437678337097168, -1.560142993927002, -1.476518154144287, -1.3928931951522827, -1.3092682361602783, -1.2256433963775635, -1.1420185565948486, -1.0583935976028442, -0.9747686982154846, -0.891143798828125, -0.8075188994407654, -0.7238940000534058, -0.6402691006660461, -0.5566442012786865, -0.4730193018913269, -0.3893944025039673, -0.30576950311660767, -0.22214460372924805, -0.13851970434188843, -0.05489480495452881, 0.02873009443283081, 0.11235499382019043, 0.19597989320755005, 0.27960479259490967, 0.3632296919822693, 0.4468545913696289, 0.5304794907569885, 0.6141043901443481, 0.6977292895317078, 0.7813541889190674, 0.864979088306427, 0.9486039876937866, 1.032228946685791, 1.1158537864685059, 1.1994786262512207, 1.283103585243225, 1.3667285442352295, 1.4503533840179443, 1.5339782238006592, 1.6176031827926636, 1.701228141784668, 1.7848529815673828, 1.8684778213500977, 1.952102780342102, 2.0357277393341064, 2.1193525791168213, 2.202977418899536, 2.28660249710083, 2.370227336883545, 2.4538521766662598]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 13.0, 18.0, 14.0, 18.0, 20.0, 27.0, 30.0, 29.0, 35.0, 35.0, 42.0, 45.0, 63.0, 51.0, 59.0, 53.0, 49.0, 48.0, 43.0, 33.0, 30.0, 23.0, 16.0, 36.0, 23.0, 25.0, 18.0, 14.0, 9.0, 10.0, 9.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13158798217773438, -0.12767791748046875, -0.12376785278320312, -0.1198577880859375, -0.11594772338867188, -0.11203765869140625, -0.10812759399414062, -0.104217529296875, -0.10030746459960938, -0.09639739990234375, -0.09248733520507812, -0.0885772705078125, -0.08466720581054688, -0.08075714111328125, -0.07684707641601562, -0.07293701171875, -0.06902694702148438, -0.06511688232421875, -0.061206817626953125, -0.0572967529296875, -0.053386688232421875, -0.04947662353515625, -0.045566558837890625, -0.041656494140625, -0.037746429443359375, -0.03383636474609375, -0.029926300048828125, -0.0260162353515625, -0.022106170654296875, -0.01819610595703125, -0.014286041259765625, -0.0103759765625, -0.006465911865234375, -0.00255584716796875, 0.001354217529296875, 0.0052642822265625, 0.009174346923828125, 0.01308441162109375, 0.016994476318359375, 0.020904541015625, 0.024814605712890625, 0.02872467041015625, 0.032634735107421875, 0.0365447998046875, 0.040454864501953125, 0.04436492919921875, 0.048274993896484375, 0.05218505859375, 0.056095123291015625, 0.06000518798828125, 0.06391525268554688, 0.0678253173828125, 0.07173538208007812, 0.07564544677734375, 0.07955551147460938, 0.083465576171875, 0.08737564086914062, 0.09128570556640625, 0.09519577026367188, 0.0991058349609375, 0.10301589965820312, 0.10692596435546875, 0.11083602905273438, 0.11474609375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 10.0, 6.0, 3.0, 7.0, 4.0, 13.0, 18.0, 15.0, 31.0, 45.0, 74.0, 125.0, 224.0, 380.0, 686.0, 1298.0, 2816.0, 5900.0, 13840.0, 34008.0, 86404.0, 173172.0, 121570.0, 48901.0, 19288.0, 8168.0, 3634.0, 1723.0, 865.0, 418.0, 224.0, 126.0, 97.0, 52.0, 35.0, 24.0, 16.0, 20.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.109375, -1.0774002075195312, -1.0454254150390625, -1.0134506225585938, -0.981475830078125, -0.9495010375976562, -0.9175262451171875, -0.8855514526367188, -0.85357666015625, -0.8216018676757812, -0.7896270751953125, -0.7576522827148438, -0.725677490234375, -0.6937026977539062, -0.6617279052734375, -0.6297531127929688, -0.5977783203125, -0.5658035278320312, -0.5338287353515625, -0.5018539428710938, -0.469879150390625, -0.43790435791015625, -0.4059295654296875, -0.37395477294921875, -0.34197998046875, -0.31000518798828125, -0.2780303955078125, -0.24605560302734375, -0.214080810546875, -0.18210601806640625, -0.1501312255859375, -0.11815643310546875, -0.086181640625, -0.05420684814453125, -0.0222320556640625, 0.00974273681640625, 0.041717529296875, 0.07369232177734375, 0.1056671142578125, 0.13764190673828125, 0.16961669921875, 0.20159149169921875, 0.2335662841796875, 0.26554107666015625, 0.297515869140625, 0.32949066162109375, 0.3614654541015625, 0.39344024658203125, 0.4254150390625, 0.45738983154296875, 0.4893646240234375, 0.5213394165039062, 0.553314208984375, 0.5852890014648438, 0.6172637939453125, 0.6492385864257812, 0.68121337890625, 0.7131881713867188, 0.7451629638671875, 0.7771377563476562, 0.809112548828125, 0.8410873413085938, 0.8730621337890625, 0.9050369262695312, 0.93701171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 14.0, 16.0, 22.0, 30.0, 21.0, 32.0, 29.0, 33.0, 57.0, 44.0, 67.0, 52.0, 60.0, 52.0, 65.0, 46.0, 39.0, 32.0, 43.0, 32.0, 25.0, 22.0, 25.0, 19.0, 9.0, 12.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.182769775390625, -0.17779541015625, -0.172821044921875, -0.1678466796875, -0.162872314453125, -0.15789794921875, -0.152923583984375, -0.14794921875, -0.142974853515625, -0.13800048828125, -0.133026123046875, -0.1280517578125, -0.123077392578125, -0.11810302734375, -0.113128662109375, -0.108154296875, -0.103179931640625, -0.09820556640625, -0.093231201171875, -0.0882568359375, -0.083282470703125, -0.07830810546875, -0.073333740234375, -0.068359375, -0.063385009765625, -0.05841064453125, -0.053436279296875, -0.0484619140625, -0.043487548828125, -0.03851318359375, -0.033538818359375, -0.028564453125, -0.023590087890625, -0.01861572265625, -0.013641357421875, -0.0086669921875, -0.003692626953125, 0.00128173828125, 0.006256103515625, 0.01123046875, 0.016204833984375, 0.02117919921875, 0.026153564453125, 0.0311279296875, 0.036102294921875, 0.04107666015625, 0.046051025390625, 0.051025390625, 0.055999755859375, 0.06097412109375, 0.065948486328125, 0.0709228515625, 0.075897216796875, 0.08087158203125, 0.085845947265625, 0.0908203125, 0.095794677734375, 0.10076904296875, 0.105743408203125, 0.1107177734375, 0.115692138671875, 0.12066650390625, 0.125640869140625, 0.130615234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 6.0, 8.0, 13.0, 25.0, 53.0, 96.0, 90.0, 69.0, 49.0, 18.0, 8.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.331541895866394, -1.2872164249420166, -1.2428910732269287, -1.1985657215118408, -1.1542402505874634, -1.109914779663086, -1.065589427947998, -1.0212640762329102, -0.9769386053085327, -0.9326131939888, -0.8882877826690674, -0.8439623713493347, -0.799636960029602, -0.7553115487098694, -0.7109861373901367, -0.666660726070404, -0.6223353147506714, -0.5780099034309387, -0.533684492111206, -0.4893590807914734, -0.4450336694717407, -0.40070825815200806, -0.3563828468322754, -0.3120574355125427, -0.26773202419281006, -0.2234066128730774, -0.17908120155334473, -0.13475579023361206, -0.0904303789138794, -0.04610496759414673, -0.0017795562744140625, 0.042545855045318604, 0.08687114715576172, 0.13119655847549438, 0.17552196979522705, 0.21984738111495972, 0.2641727924346924, 0.30849820375442505, 0.3528236150741577, 0.3971490263938904, 0.44147443771362305, 0.4857998490333557, 0.5301252603530884, 0.574450671672821, 0.6187760829925537, 0.6631014943122864, 0.707426905632019, 0.7517523169517517, 0.7960777282714844, 0.840403139591217, 0.8847285509109497, 0.9290539622306824, 0.973379373550415, 1.017704725265503, 1.0620301961898804, 1.1063556671142578, 1.1506810188293457, 1.1950063705444336, 1.239331841468811, 1.2836573123931885, 1.3279826641082764, 1.3723080158233643, 1.4166334867477417, 1.4609589576721191, 1.505284309387207]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 7.0, 17.0, 22.0, 57.0, 71.0, 94.0, 70.0, 42.0, 19.0, 14.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1043403148651123, -1.0688014030456543, -1.0332624912261963, -0.9977235794067383, -0.9621846675872803, -0.9266457557678223, -0.8911067843437195, -0.8555678725242615, -0.8200289607048035, -0.7844900488853455, -0.7489511370658875, -0.7134122252464294, -0.6778732538223267, -0.6423343420028687, -0.6067954301834106, -0.5712565183639526, -0.5357176065444946, -0.5001786947250366, -0.4646397829055786, -0.4291008412837982, -0.3935619294643402, -0.3580230176448822, -0.3224840760231018, -0.2869451642036438, -0.2514062523841858, -0.21586734056472778, -0.18032841384410858, -0.14478948712348938, -0.10925057530403137, -0.07371166348457336, -0.03817273676395416, -0.002633810043334961, 0.03290510177612305, 0.06844402104616165, 0.10398294031620026, 0.13952186703681946, 0.17506077885627747, 0.21059969067573547, 0.24613861739635468, 0.2816775441169739, 0.3172164559364319, 0.3527553677558899, 0.3882942795753479, 0.4238332211971283, 0.4593721330165863, 0.4949110448360443, 0.5304499864578247, 0.5659888982772827, 0.6015278100967407, 0.6370667219161987, 0.6726056337356567, 0.7081445455551147, 0.7436834573745728, 0.7792223691940308, 0.8147613406181335, 0.8503002524375916, 0.8858391642570496, 0.9213780760765076, 0.9569169878959656, 0.9924558997154236, 1.0279948711395264, 1.0635337829589844, 1.0990726947784424, 1.1346116065979004, 1.1701505184173584]}, "eval/loss": 0.34626105427742004, "eval/wer": 0.10119000396667989, "eval/runtime": 713.9632, "eval/samples_per_second": 3.7, "eval/steps_per_second": 0.464, "train/train_runtime": 25980.5507, "train/train_samples_per_second": 5.492, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 2.498668275362574} \ No newline at end of file +{"train/loss": 0.2069, "train/learning_rate": 1.9512195121951218e-06, "train/epoch": 5.0, "train/global_step": 1115, "_runtime": 26937, "_timestamp": 1648264065, "_step": 1118, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 13.0, 18.0, 25.0, 50.0, 74.0, 109.0, 157.0, 160.0, 161.0, 89.0, 56.0, 41.0, 23.0, 17.0, 7.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.614524245262146, -0.5559785962104797, -0.4974329471588135, -0.4388873279094696, -0.38034167885780334, -0.3217960298061371, -0.2632504105567932, -0.20470476150512695, -0.1461591124534607, -0.08761347085237503, -0.029067829251289368, 0.029477804899215698, 0.08802345395088196, 0.14656910300254822, 0.2051147222518921, 0.26366037130355835, 0.3222060203552246, 0.38075166940689087, 0.43929731845855713, 0.497842937707901, 0.5563886165618896, 0.6149342060089111, 0.6734798550605774, 0.7320255041122437, 0.7905711531639099, 0.8491168022155762, 0.9076624512672424, 0.9662081003189087, 1.0247536897659302, 1.0832993984222412, 1.1418449878692627, 1.2003905773162842, 1.2589364051818848, 1.3174819946289062, 1.3760277032852173, 1.4345732927322388, 1.4931190013885498, 1.5516645908355713, 1.6102101802825928, 1.6687558889389038, 1.7273015975952148, 1.7858471870422363, 1.8443928956985474, 1.9029384851455688, 1.9614841938018799, 2.0200297832489014, 2.078575372695923, 2.1371212005615234, 2.195666790008545, 2.2542123794555664, 2.312757968902588, 2.3713037967681885, 2.42984938621521, 2.4883949756622314, 2.546940565109253, 2.6054863929748535, 2.664031744003296, 2.7225773334503174, 2.781122922897339, 2.8396687507629395, 2.898214340209961, 2.9567599296569824, 3.015305519104004, 3.0738511085510254, 3.132396936416626]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 8.0, 16.0, 17.0, 13.0, 14.0, 24.0, 20.0, 25.0, 31.0, 27.0, 24.0, 39.0, 29.0, 38.0, 51.0, 40.0, 46.0, 41.0, 32.0, 36.0, 41.0, 34.0, 39.0, 27.0, 32.0, 14.0, 23.0, 25.0, 27.0, 19.0, 19.0, 13.0, 9.0, 15.0, 14.0, 10.0, 5.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0], "bins": [-0.7400795221328735, -0.7190272808074951, -0.6979750990867615, -0.6769228577613831, -0.6558706760406494, -0.634818434715271, -0.6137662529945374, -0.5927140116691589, -0.5716618299484253, -0.5506095886230469, -0.5295574069023132, -0.5085051655769348, -0.48745298385620117, -0.46640077233314514, -0.4453485608100891, -0.4242963194847107, -0.40324410796165466, -0.38219189643859863, -0.3611396849155426, -0.3400874733924866, -0.31903526186943054, -0.2979830503463745, -0.2769308090209961, -0.25587862730026245, -0.23482640087604523, -0.2137741893529892, -0.19272197782993317, -0.17166975140571594, -0.1506175398826599, -0.12956532835960388, -0.10851311683654785, -0.08746090531349182, -0.06640869379043579, -0.04535648226737976, -0.024304267019033432, -0.0032520517706871033, 0.017800159752368927, 0.03885237127542496, 0.059904590249061584, 0.08095680177211761, 0.10200901329517365, 0.12306122481822968, 0.1441134363412857, 0.16516566276550293, 0.18621787428855896, 0.207270085811615, 0.22832229733467102, 0.24937450885772705, 0.2704267203807831, 0.2914789319038391, 0.31253114342689514, 0.33358335494995117, 0.3546355664730072, 0.37568777799606323, 0.39674001932144165, 0.4177922010421753, 0.4388444423675537, 0.45989665389060974, 0.48094886541366577, 0.5020011067390442, 0.5230532884597778, 0.5441055297851562, 0.5651577115058899, 0.5862099528312683, 0.607262134552002]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 17.0, 15.0, 26.0, 30.0, 35.0, 63.0, 97.0, 128.0, 188.0, 280.0, 440.0, 788.0, 1307.0, 2487.0, 5555.0, 14801.0, 99328.0, 1248391.0, 2544552.0, 235525.0, 25350.0, 7514.0, 3245.0, 1628.0, 850.0, 515.0, 345.0, 222.0, 156.0, 135.0, 69.0, 52.0, 37.0, 32.0, 17.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0], "bins": [-3.935546875, -3.829681396484375, -3.72381591796875, -3.617950439453125, -3.5120849609375, -3.406219482421875, -3.30035400390625, -3.194488525390625, -3.088623046875, -2.982757568359375, -2.87689208984375, -2.771026611328125, -2.6651611328125, -2.559295654296875, -2.45343017578125, -2.347564697265625, -2.24169921875, -2.135833740234375, -2.02996826171875, -1.924102783203125, -1.8182373046875, -1.712371826171875, -1.60650634765625, -1.500640869140625, -1.394775390625, -1.288909912109375, -1.18304443359375, -1.077178955078125, -0.9713134765625, -0.865447998046875, -0.75958251953125, -0.653717041015625, -0.5478515625, -0.441986083984375, -0.33612060546875, -0.230255126953125, -0.1243896484375, -0.018524169921875, 0.08734130859375, 0.193206787109375, 0.299072265625, 0.404937744140625, 0.51080322265625, 0.616668701171875, 0.7225341796875, 0.828399658203125, 0.93426513671875, 1.040130615234375, 1.14599609375, 1.251861572265625, 1.35772705078125, 1.463592529296875, 1.5694580078125, 1.675323486328125, 1.78118896484375, 1.887054443359375, 1.992919921875, 2.098785400390625, 2.20465087890625, 2.310516357421875, 2.4163818359375, 2.522247314453125, 2.62811279296875, 2.733978271484375, 2.83984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 9.0, 10.0, 8.0, 20.0, 18.0, 26.0, 21.0, 22.0, 34.0, 32.0, 29.0, 33.0, 45.0, 34.0, 57.0, 56.0, 54.0, 32.0, 41.0, 46.0, 38.0, 50.0, 33.0, 23.0, 30.0, 22.0, 29.0, 18.0, 22.0, 15.0, 10.0, 8.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.7158203125, -1.6680145263671875, -1.620208740234375, -1.5724029541015625, -1.52459716796875, -1.4767913818359375, -1.428985595703125, -1.3811798095703125, -1.3333740234375, -1.2855682373046875, -1.237762451171875, -1.1899566650390625, -1.14215087890625, -1.0943450927734375, -1.046539306640625, -0.9987335205078125, -0.950927734375, -0.9031219482421875, -0.855316162109375, -0.8075103759765625, -0.75970458984375, -0.7118988037109375, -0.664093017578125, -0.6162872314453125, -0.5684814453125, -0.5206756591796875, -0.472869873046875, -0.4250640869140625, -0.37725830078125, -0.3294525146484375, -0.281646728515625, -0.2338409423828125, -0.18603515625, -0.1382293701171875, -0.090423583984375, -0.0426177978515625, 0.00518798828125, 0.0529937744140625, 0.100799560546875, 0.1486053466796875, 0.1964111328125, 0.2442169189453125, 0.292022705078125, 0.3398284912109375, 0.38763427734375, 0.4354400634765625, 0.483245849609375, 0.5310516357421875, 0.578857421875, 0.6266632080078125, 0.674468994140625, 0.7222747802734375, 0.77008056640625, 0.8178863525390625, 0.865692138671875, 0.9134979248046875, 0.9613037109375, 1.0091094970703125, 1.056915283203125, 1.1047210693359375, 1.15252685546875, 1.2003326416015625, 1.248138427734375, 1.2959442138671875, 1.34375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 13.0, 22.0, 17.0, 39.0, 74.0, 132.0, 333.0, 1811.0, 55303.0, 4126606.0, 8398.0, 912.0, 313.0, 113.0, 58.0, 41.0, 24.0, 17.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.533203125, -12.10546875, -11.677734375, -11.25, -10.822265625, -10.39453125, -9.966796875, -9.5390625, -9.111328125, -8.68359375, -8.255859375, -7.828125, -7.400390625, -6.97265625, -6.544921875, -6.1171875, -5.689453125, -5.26171875, -4.833984375, -4.40625, -3.978515625, -3.55078125, -3.123046875, -2.6953125, -2.267578125, -1.83984375, -1.412109375, -0.984375, -0.556640625, -0.12890625, 0.298828125, 0.7265625, 1.154296875, 1.58203125, 2.009765625, 2.4375, 2.865234375, 3.29296875, 3.720703125, 4.1484375, 4.576171875, 5.00390625, 5.431640625, 5.859375, 6.287109375, 6.71484375, 7.142578125, 7.5703125, 7.998046875, 8.42578125, 8.853515625, 9.28125, 9.708984375, 10.13671875, 10.564453125, 10.9921875, 11.419921875, 11.84765625, 12.275390625, 12.703125, 13.130859375, 13.55859375, 13.986328125, 14.4140625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 10.0, 24.0, 21.0, 44.0, 79.0, 118.0, 221.0, 658.0, 1295.0, 822.0, 338.0, 165.0, 90.0, 63.0, 32.0, 25.0, 15.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8875885009765625, -0.854278564453125, -0.8209686279296875, -0.78765869140625, -0.7543487548828125, -0.721038818359375, -0.6877288818359375, -0.6544189453125, -0.6211090087890625, -0.587799072265625, -0.5544891357421875, -0.52117919921875, -0.4878692626953125, -0.454559326171875, -0.4212493896484375, -0.387939453125, -0.3546295166015625, -0.321319580078125, -0.2880096435546875, -0.25469970703125, -0.2213897705078125, -0.188079833984375, -0.1547698974609375, -0.1214599609375, -0.0881500244140625, -0.054840087890625, -0.0215301513671875, 0.01177978515625, 0.0450897216796875, 0.078399658203125, 0.1117095947265625, 0.14501953125, 0.1783294677734375, 0.211639404296875, 0.2449493408203125, 0.27825927734375, 0.3115692138671875, 0.344879150390625, 0.3781890869140625, 0.4114990234375, 0.4448089599609375, 0.478118896484375, 0.5114288330078125, 0.54473876953125, 0.5780487060546875, 0.611358642578125, 0.6446685791015625, 0.677978515625, 0.7112884521484375, 0.744598388671875, 0.7779083251953125, 0.81121826171875, 0.8445281982421875, 0.877838134765625, 0.9111480712890625, 0.9444580078125, 0.9777679443359375, 1.011077880859375, 1.0443878173828125, 1.07769775390625, 1.1110076904296875, 1.144317626953125, 1.1776275634765625, 1.2109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 11.0, 17.0, 15.0, 18.0, 14.0, 20.0, 32.0, 35.0, 61.0, 62.0, 76.0, 86.0, 81.0, 95.0, 81.0, 64.0, 50.0, 33.0, 34.0, 23.0, 23.0, 12.0, 14.0, 11.0, 7.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.188549280166626, -2.1190285682678223, -2.0495080947875977, -1.979987382888794, -1.9104666709899902, -1.840946078300476, -1.771425485610962, -1.7019047737121582, -1.632384181022644, -1.5628635883331299, -1.4933428764343262, -1.423822283744812, -1.3543016910552979, -1.2847809791564941, -1.21526038646698, -1.1457397937774658, -1.076219081878662, -1.006698489189148, -0.9371777772903442, -0.8676571846008301, -0.7981365323066711, -0.7286158800125122, -0.659095287322998, -0.5895746350288391, -0.5200539827346802, -0.45053333044052124, -0.3810127079486847, -0.31149208545684814, -0.2419714331626892, -0.17245078086853027, -0.10293015837669373, -0.03340953588485718, 0.03611111640930176, 0.1056317538022995, 0.17515239119529724, 0.24467302858829498, 0.3141936659812927, 0.38371431827545166, 0.4532349407672882, 0.5227555632591248, 0.5922762155532837, 0.6617968678474426, 0.7313175201416016, 0.8008381128311157, 0.8703587651252747, 0.9398794174194336, 1.0094000101089478, 1.078920602798462, 1.1484413146972656, 1.2179619073867798, 1.2874826192855835, 1.3570032119750977, 1.4265239238739014, 1.4960445165634155, 1.5655651092529297, 1.6350858211517334, 1.7046064138412476, 1.7741270065307617, 1.8436477184295654, 1.9131683111190796, 1.9826889038085938, 2.0522096157073975, 2.121730327606201, 2.191250801086426, 2.2607715129852295]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 5.0, 14.0, 12.0, 11.0, 14.0, 19.0, 16.0, 28.0, 35.0, 36.0, 40.0, 39.0, 38.0, 44.0, 50.0, 42.0, 38.0, 56.0, 36.0, 38.0, 51.0, 35.0, 32.0, 40.0, 25.0, 32.0, 25.0, 25.0, 22.0, 16.0, 18.0, 9.0, 15.0, 8.0, 8.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7684389352798462, -1.720792293548584, -1.6731456518173218, -1.6254990100860596, -1.5778523683547974, -1.5302057266235352, -1.482559084892273, -1.4349124431610107, -1.3872658014297485, -1.3396191596984863, -1.2919725179672241, -1.244325876235962, -1.1966792345046997, -1.1490325927734375, -1.1013859510421753, -1.053739309310913, -1.0060926675796509, -0.9584460258483887, -0.9107993841171265, -0.8631527423858643, -0.815506100654602, -0.7678594589233398, -0.7202128171920776, -0.6725661754608154, -0.6249195337295532, -0.577272891998291, -0.5296262502670288, -0.4819796085357666, -0.4343329668045044, -0.3866863250732422, -0.33903968334198, -0.2913930416107178, -0.24374651908874512, -0.1960998773574829, -0.1484532356262207, -0.1008065938949585, -0.05315995216369629, -0.005513310432434082, 0.042133331298828125, 0.08977997303009033, 0.13742661476135254, 0.18507325649261475, 0.23271989822387695, 0.28036653995513916, 0.32801318168640137, 0.3756598234176636, 0.4233064651489258, 0.470953106880188, 0.5185997486114502, 0.5662463903427124, 0.6138930320739746, 0.6615396738052368, 0.709186315536499, 0.7568329572677612, 0.8044795989990234, 0.8521262407302856, 0.8997728824615479, 0.9474195241928101, 0.9950661659240723, 1.0427128076553345, 1.0903594493865967, 1.1380060911178589, 1.185652732849121, 1.2332993745803833, 1.2809460163116455]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 6.0, 12.0, 14.0, 30.0, 32.0, 40.0, 67.0, 108.0, 162.0, 249.0, 372.0, 607.0, 898.0, 1588.0, 2695.0, 5145.0, 9935.0, 21051.0, 46848.0, 108909.0, 254478.0, 324257.0, 151142.0, 64048.0, 27879.0, 13056.0, 6534.0, 3393.0, 1934.0, 1120.0, 672.0, 438.0, 292.0, 169.0, 120.0, 70.0, 46.0, 38.0, 32.0, 26.0, 17.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.755859375, -0.7308197021484375, -0.705780029296875, -0.6807403564453125, -0.65570068359375, -0.6306610107421875, -0.605621337890625, -0.5805816650390625, -0.5555419921875, -0.5305023193359375, -0.505462646484375, -0.4804229736328125, -0.45538330078125, -0.4303436279296875, -0.405303955078125, -0.3802642822265625, -0.355224609375, -0.3301849365234375, -0.305145263671875, -0.2801055908203125, -0.25506591796875, -0.2300262451171875, -0.204986572265625, -0.1799468994140625, -0.1549072265625, -0.1298675537109375, -0.104827880859375, -0.0797882080078125, -0.05474853515625, -0.0297088623046875, -0.004669189453125, 0.0203704833984375, 0.04541015625, 0.0704498291015625, 0.095489501953125, 0.1205291748046875, 0.14556884765625, 0.1706085205078125, 0.195648193359375, 0.2206878662109375, 0.2457275390625, 0.2707672119140625, 0.295806884765625, 0.3208465576171875, 0.34588623046875, 0.3709259033203125, 0.395965576171875, 0.4210052490234375, 0.446044921875, 0.4710845947265625, 0.496124267578125, 0.5211639404296875, 0.54620361328125, 0.5712432861328125, 0.596282958984375, 0.6213226318359375, 0.6463623046875, 0.6714019775390625, 0.696441650390625, 0.7214813232421875, 0.74652099609375, 0.7715606689453125, 0.796600341796875, 0.8216400146484375, 0.8466796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 23.0, 10.0, 16.0, 19.0, 30.0, 30.0, 38.0, 42.0, 45.0, 43.0, 32.0, 37.0, 54.0, 42.0, 37.0, 43.0, 49.0, 38.0, 43.0, 39.0, 39.0, 27.0, 31.0, 26.0, 19.0, 21.0, 17.0, 9.0, 12.0, 9.0, 12.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.998291015625, -0.96826171875, -0.938232421875, -0.908203125, -0.878173828125, -0.84814453125, -0.818115234375, -0.7880859375, -0.758056640625, -0.72802734375, -0.697998046875, -0.66796875, -0.637939453125, -0.60791015625, -0.577880859375, -0.5478515625, -0.517822265625, -0.48779296875, -0.457763671875, -0.427734375, -0.397705078125, -0.36767578125, -0.337646484375, -0.3076171875, -0.277587890625, -0.24755859375, -0.217529296875, -0.1875, -0.157470703125, -0.12744140625, -0.097412109375, -0.0673828125, -0.037353515625, -0.00732421875, 0.022705078125, 0.052734375, 0.082763671875, 0.11279296875, 0.142822265625, 0.1728515625, 0.202880859375, 0.23291015625, 0.262939453125, 0.29296875, 0.322998046875, 0.35302734375, 0.383056640625, 0.4130859375, 0.443115234375, 0.47314453125, 0.503173828125, 0.533203125, 0.563232421875, 0.59326171875, 0.623291015625, 0.6533203125, 0.683349609375, 0.71337890625, 0.743408203125, 0.7734375, 0.803466796875, 0.83349609375, 0.863525390625, 0.8935546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 13.0, 17.0, 28.0, 52.0, 85.0, 107.0, 175.0, 312.0, 434.0, 930.0, 1738.0, 3460.0, 8021.0, 20772.0, 64294.0, 239131.0, 472048.0, 163144.0, 45991.0, 15690.0, 6183.0, 2696.0, 1385.0, 761.0, 396.0, 246.0, 149.0, 87.0, 65.0, 33.0, 31.0, 19.0, 15.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8739700317382812, -0.8431549072265625, -0.8123397827148438, -0.781524658203125, -0.7507095336914062, -0.7198944091796875, -0.6890792846679688, -0.65826416015625, -0.6274490356445312, -0.5966339111328125, -0.5658187866210938, -0.535003662109375, -0.5041885375976562, -0.4733734130859375, -0.44255828857421875, -0.4117431640625, -0.38092803955078125, -0.3501129150390625, -0.31929779052734375, -0.288482666015625, -0.25766754150390625, -0.2268524169921875, -0.19603729248046875, -0.16522216796875, -0.13440704345703125, -0.1035919189453125, -0.07277679443359375, -0.041961669921875, -0.01114654541015625, 0.0196685791015625, 0.05048370361328125, 0.081298828125, 0.11211395263671875, 0.1429290771484375, 0.17374420166015625, 0.204559326171875, 0.23537445068359375, 0.2661895751953125, 0.29700469970703125, 0.32781982421875, 0.35863494873046875, 0.3894500732421875, 0.42026519775390625, 0.451080322265625, 0.48189544677734375, 0.5127105712890625, 0.5435256958007812, 0.5743408203125, 0.6051559448242188, 0.6359710693359375, 0.6667861938476562, 0.697601318359375, 0.7284164428710938, 0.7592315673828125, 0.7900466918945312, 0.82086181640625, 0.8516769409179688, 0.8824920654296875, 0.9133071899414062, 0.944122314453125, 0.9749374389648438, 1.0057525634765625, 1.0365676879882812, 1.0673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 16.0, 15.0, 13.0, 10.0, 22.0, 20.0, 16.0, 32.0, 44.0, 43.0, 35.0, 49.0, 47.0, 51.0, 32.0, 48.0, 46.0, 51.0, 33.0, 51.0, 42.0, 29.0, 29.0, 25.0, 22.0, 16.0, 18.0, 19.0, 11.0, 9.0, 11.0, 14.0, 6.0, 8.0, 7.0, 4.0, 3.0, 8.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9306640625, -1.8682098388671875, -1.805755615234375, -1.7433013916015625, -1.68084716796875, -1.6183929443359375, -1.555938720703125, -1.4934844970703125, -1.4310302734375, -1.3685760498046875, -1.306121826171875, -1.2436676025390625, -1.18121337890625, -1.1187591552734375, -1.056304931640625, -0.9938507080078125, -0.931396484375, -0.8689422607421875, -0.806488037109375, -0.7440338134765625, -0.68157958984375, -0.6191253662109375, -0.556671142578125, -0.4942169189453125, -0.4317626953125, -0.3693084716796875, -0.306854248046875, -0.2444000244140625, -0.18194580078125, -0.1194915771484375, -0.057037353515625, 0.0054168701171875, 0.06787109375, 0.1303253173828125, 0.192779541015625, 0.2552337646484375, 0.31768798828125, 0.3801422119140625, 0.442596435546875, 0.5050506591796875, 0.5675048828125, 0.6299591064453125, 0.692413330078125, 0.7548675537109375, 0.81732177734375, 0.8797760009765625, 0.942230224609375, 1.0046844482421875, 1.067138671875, 1.1295928955078125, 1.192047119140625, 1.2545013427734375, 1.31695556640625, 1.3794097900390625, 1.441864013671875, 1.5043182373046875, 1.5667724609375, 1.6292266845703125, 1.691680908203125, 1.7541351318359375, 1.81658935546875, 1.8790435791015625, 1.941497802734375, 2.0039520263671875, 2.06640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 15.0, 35.0, 54.0, 45.0, 76.0, 145.0, 205.0, 311.0, 530.0, 876.0, 1483.0, 2792.0, 5473.0, 12108.0, 30805.0, 131137.0, 624842.0, 174003.0, 36964.0, 13422.0, 6118.0, 2921.0, 1680.0, 1002.0, 531.0, 346.0, 207.0, 121.0, 92.0, 54.0, 37.0, 25.0, 25.0, 12.0, 12.0, 10.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2384033203125, -0.23130226135253906, -0.22420120239257812, -0.2171001434326172, -0.20999908447265625, -0.2028980255126953, -0.19579696655273438, -0.18869590759277344, -0.1815948486328125, -0.17449378967285156, -0.16739273071289062, -0.1602916717529297, -0.15319061279296875, -0.1460895538330078, -0.13898849487304688, -0.13188743591308594, -0.124786376953125, -0.11768531799316406, -0.11058425903320312, -0.10348320007324219, -0.09638214111328125, -0.08928108215332031, -0.08218002319335938, -0.07507896423339844, -0.0679779052734375, -0.06087684631347656, -0.053775787353515625, -0.04667472839355469, -0.03957366943359375, -0.03247261047363281, -0.025371551513671875, -0.018270492553710938, -0.01116943359375, -0.0040683746337890625, 0.003032684326171875, 0.010133743286132812, 0.01723480224609375, 0.024335861206054688, 0.031436920166015625, 0.03853797912597656, 0.0456390380859375, 0.05274009704589844, 0.059841156005859375, 0.06694221496582031, 0.07404327392578125, 0.08114433288574219, 0.08824539184570312, 0.09534645080566406, 0.102447509765625, 0.10954856872558594, 0.11664962768554688, 0.12375068664550781, 0.13085174560546875, 0.1379528045654297, 0.14505386352539062, 0.15215492248535156, 0.1592559814453125, 0.16635704040527344, 0.17345809936523438, 0.1805591583251953, 0.18766021728515625, 0.1947612762451172, 0.20186233520507812, 0.20896339416503906, 0.216064453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 6.0, 10.0, 18.0, 15.0, 39.0, 41.0, 103.0, 150.0, 203.0, 140.0, 85.0, 47.0, 30.0, 23.0, 21.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020241737365722656, -0.0001963600516319275, -0.00019030272960662842, -0.00018424540758132935, -0.00017818808555603027, -0.0001721307635307312, -0.00016607344150543213, -0.00016001611948013306, -0.00015395879745483398, -0.0001479014754295349, -0.00014184415340423584, -0.00013578683137893677, -0.0001297295093536377, -0.00012367218732833862, -0.00011761486530303955, -0.00011155754327774048, -0.0001055002212524414, -9.944289922714233e-05, -9.338557720184326e-05, -8.732825517654419e-05, -8.127093315124512e-05, -7.521361112594604e-05, -6.915628910064697e-05, -6.30989670753479e-05, -5.704164505004883e-05, -5.0984323024749756e-05, -4.4927000999450684e-05, -3.886967897415161e-05, -3.281235694885254e-05, -2.6755034923553467e-05, -2.0697712898254395e-05, -1.4640390872955322e-05, -8.58306884765625e-06, -2.5257468223571777e-06, 3.5315752029418945e-06, 9.588897228240967e-06, 1.564621925354004e-05, 2.170354127883911e-05, 2.7760863304138184e-05, 3.3818185329437256e-05, 3.987550735473633e-05, 4.59328293800354e-05, 5.199015140533447e-05, 5.8047473430633545e-05, 6.410479545593262e-05, 7.016211748123169e-05, 7.621943950653076e-05, 8.227676153182983e-05, 8.83340835571289e-05, 9.439140558242798e-05, 0.00010044872760772705, 0.00010650604963302612, 0.0001125633716583252, 0.00011862069368362427, 0.00012467801570892334, 0.0001307353377342224, 0.00013679265975952148, 0.00014284998178482056, 0.00014890730381011963, 0.0001549646258354187, 0.00016102194786071777, 0.00016707926988601685, 0.00017313659191131592, 0.000179193913936615, 0.00018525123596191406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 13.0, 14.0, 24.0, 28.0, 41.0, 96.0, 135.0, 308.0, 653.0, 1396.0, 3181.0, 8031.0, 24139.0, 112015.0, 642628.0, 202067.0, 35427.0, 10828.0, 4172.0, 1705.0, 808.0, 386.0, 180.0, 86.0, 48.0, 37.0, 25.0, 12.0, 15.0, 6.0, 10.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.287109375, -0.2785758972167969, -0.27004241943359375, -0.2615089416503906, -0.2529754638671875, -0.24444198608398438, -0.23590850830078125, -0.22737503051757812, -0.218841552734375, -0.21030807495117188, -0.20177459716796875, -0.19324111938476562, -0.1847076416015625, -0.17617416381835938, -0.16764068603515625, -0.15910720825195312, -0.15057373046875, -0.14204025268554688, -0.13350677490234375, -0.12497329711914062, -0.1164398193359375, -0.10790634155273438, -0.09937286376953125, -0.09083938598632812, -0.082305908203125, -0.07377243041992188, -0.06523895263671875, -0.056705474853515625, -0.0481719970703125, -0.039638519287109375, -0.03110504150390625, -0.022571563720703125, -0.0140380859375, -0.005504608154296875, 0.00302886962890625, 0.011562347412109375, 0.0200958251953125, 0.028629302978515625, 0.03716278076171875, 0.045696258544921875, 0.054229736328125, 0.06276321411132812, 0.07129669189453125, 0.07983016967773438, 0.0883636474609375, 0.09689712524414062, 0.10543060302734375, 0.11396408081054688, 0.12249755859375, 0.13103103637695312, 0.13956451416015625, 0.14809799194335938, 0.1566314697265625, 0.16516494750976562, 0.17369842529296875, 0.18223190307617188, 0.190765380859375, 0.19929885864257812, 0.20783233642578125, 0.21636581420898438, 0.2248992919921875, 0.23343276977539062, 0.24196624755859375, 0.2504997253417969, 0.259033203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 10.0, 8.0, 15.0, 15.0, 18.0, 27.0, 44.0, 43.0, 61.0, 75.0, 82.0, 101.0, 95.0, 86.0, 59.0, 53.0, 30.0, 36.0, 27.0, 23.0, 7.0, 10.0, 13.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0701904296875, -0.0681161880493164, -0.06604194641113281, -0.06396770477294922, -0.061893463134765625, -0.05981922149658203, -0.05774497985839844, -0.055670738220214844, -0.05359649658203125, -0.051522254943847656, -0.04944801330566406, -0.04737377166748047, -0.045299530029296875, -0.04322528839111328, -0.04115104675292969, -0.039076805114746094, -0.0370025634765625, -0.034928321838378906, -0.03285408020019531, -0.03077983856201172, -0.028705596923828125, -0.02663135528564453, -0.024557113647460938, -0.022482872009277344, -0.02040863037109375, -0.018334388732910156, -0.016260147094726562, -0.014185905456542969, -0.012111663818359375, -0.010037422180175781, -0.007963180541992188, -0.005888938903808594, -0.003814697265625, -0.0017404556274414062, 0.0003337860107421875, 0.0024080276489257812, 0.004482269287109375, 0.006556510925292969, 0.008630752563476562, 0.010704994201660156, 0.01277923583984375, 0.014853477478027344, 0.016927719116210938, 0.01900196075439453, 0.021076202392578125, 0.02315044403076172, 0.025224685668945312, 0.027298927307128906, 0.0293731689453125, 0.031447410583496094, 0.03352165222167969, 0.03559589385986328, 0.037670135498046875, 0.03974437713623047, 0.04181861877441406, 0.043892860412597656, 0.04596710205078125, 0.048041343688964844, 0.05011558532714844, 0.05218982696533203, 0.054264068603515625, 0.05633831024169922, 0.05841255187988281, 0.060486793518066406, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 13.0, 33.0, 42.0, 62.0, 98.0, 145.0, 196.0, 152.0, 105.0, 47.0, 40.0, 29.0, 10.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.620237350463867, -2.541998863220215, -2.4637603759765625, -2.385521650314331, -2.3072831630706787, -2.2290446758270264, -2.150806188583374, -2.0725677013397217, -1.9943290948867798, -1.9160906076431274, -1.8378520011901855, -1.7596135139465332, -1.6813750267028809, -1.603136420249939, -1.5248979330062866, -1.4466593265533447, -1.3684208393096924, -1.29018235206604, -1.2119437456130981, -1.1337052583694458, -1.055466651916504, -0.9772281646728516, -0.8989896774291992, -0.8207511305809021, -0.742512583732605, -0.6642740368843079, -0.5860354900360107, -0.5077970027923584, -0.4295584559440613, -0.35131990909576416, -0.27308139204978943, -0.1948428750038147, -0.11660432815551758, -0.03836579620838165, 0.03987273573875427, 0.1181112676858902, 0.19634979963302612, 0.27458834648132324, 0.352826863527298, 0.4310653805732727, 0.5093039274215698, 0.5875424742698669, 0.6657810211181641, 0.7440195083618164, 0.8222580552101135, 0.9004966020584106, 0.978735089302063, 1.0569736957550049, 1.1352121829986572, 1.2134506702423096, 1.2916892766952515, 1.3699277639389038, 1.4481663703918457, 1.526404857635498, 1.6046433448791504, 1.6828818321228027, 1.7611204385757446, 1.839358925819397, 1.9175975322723389, 1.9958360195159912, 2.0740745067596436, 2.152313232421875, 2.2305517196655273, 2.3087902069091797, 2.387028694152832]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 3.0, 7.0, 12.0, 21.0, 21.0, 18.0, 17.0, 27.0, 28.0, 34.0, 37.0, 38.0, 35.0, 38.0, 47.0, 43.0, 41.0, 41.0, 27.0, 46.0, 40.0, 49.0, 34.0, 33.0, 30.0, 30.0, 31.0, 27.0, 21.0, 20.0, 9.0, 7.0, 20.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9393354058265686, -0.9121330976486206, -0.8849307894706726, -0.8577284812927246, -0.8305262327194214, -0.8033239245414734, -0.7761216163635254, -0.7489193081855774, -0.7217170000076294, -0.6945146918296814, -0.6673123836517334, -0.6401101350784302, -0.6129078269004822, -0.5857055187225342, -0.5585032105445862, -0.5313009023666382, -0.504098653793335, -0.47689634561538696, -0.44969406723976135, -0.42249175906181335, -0.39528948068618774, -0.36808717250823975, -0.34088486433029175, -0.31368255615234375, -0.28648027777671814, -0.25927796959877014, -0.23207569122314453, -0.20487338304519653, -0.17767108976840973, -0.15046879649162292, -0.12326648831367493, -0.09606419503688812, -0.06886190176010132, -0.041659604758024216, -0.014457307755947113, 0.012744992971420288, 0.03994728624820709, 0.0671495795249939, 0.0943518877029419, 0.1215541809797287, 0.1487564742565155, 0.1759587675333023, 0.2031610608100891, 0.2303633689880371, 0.2575656771659851, 0.2847679555416107, 0.3119702637195587, 0.3391725420951843, 0.3663748502731323, 0.3935771584510803, 0.42077943682670593, 0.44798174500465393, 0.47518402338027954, 0.5023863315582275, 0.5295886397361755, 0.5567909479141235, 0.5839931964874268, 0.6111955046653748, 0.6383978128433228, 0.665600061416626, 0.692802369594574, 0.720004677772522, 0.74720698595047, 0.774409294128418, 0.801611602306366]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 7.0, 16.0, 12.0, 33.0, 37.0, 41.0, 50.0, 69.0, 115.0, 182.0, 279.0, 471.0, 820.0, 1381.0, 2596.0, 5119.0, 10773.0, 24766.0, 60498.0, 157344.0, 343180.0, 261970.0, 104436.0, 40859.0, 17267.0, 7853.0, 3695.0, 1915.0, 1006.0, 600.0, 358.0, 242.0, 179.0, 122.0, 76.0, 58.0, 33.0, 22.0, 21.0, 14.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3674583435058594, -0.35552215576171875, -0.3435859680175781, -0.3316497802734375, -0.3197135925292969, -0.30777740478515625, -0.2958412170410156, -0.283905029296875, -0.2719688415527344, -0.26003265380859375, -0.24809646606445312, -0.2361602783203125, -0.22422409057617188, -0.21228790283203125, -0.20035171508789062, -0.18841552734375, -0.17647933959960938, -0.16454315185546875, -0.15260696411132812, -0.1406707763671875, -0.12873458862304688, -0.11679840087890625, -0.10486221313476562, -0.092926025390625, -0.08098983764648438, -0.06905364990234375, -0.057117462158203125, -0.0451812744140625, -0.033245086669921875, -0.02130889892578125, -0.009372711181640625, 0.0025634765625, 0.014499664306640625, 0.02643585205078125, 0.038372039794921875, 0.0503082275390625, 0.062244415283203125, 0.07418060302734375, 0.08611679077148438, 0.098052978515625, 0.10998916625976562, 0.12192535400390625, 0.13386154174804688, 0.1457977294921875, 0.15773391723632812, 0.16967010498046875, 0.18160629272460938, 0.19354248046875, 0.20547866821289062, 0.21741485595703125, 0.22935104370117188, 0.2412872314453125, 0.2532234191894531, 0.26515960693359375, 0.2770957946777344, 0.289031982421875, 0.3009681701660156, 0.31290435791015625, 0.3248405456542969, 0.3367767333984375, 0.3487129211425781, 0.36064910888671875, 0.3725852966308594, 0.384521484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 11.0, 12.0, 11.0, 20.0, 15.0, 14.0, 23.0, 19.0, 30.0, 37.0, 36.0, 36.0, 40.0, 29.0, 44.0, 36.0, 39.0, 54.0, 48.0, 47.0, 31.0, 45.0, 42.0, 37.0, 37.0, 29.0, 31.0, 19.0, 16.0, 16.0, 14.0, 11.0, 13.0, 6.0, 8.0, 5.0, 4.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.45703125, -5.3033447265625, -5.149658203125, -4.9959716796875, -4.84228515625, -4.6885986328125, -4.534912109375, -4.3812255859375, -4.2275390625, -4.0738525390625, -3.920166015625, -3.7664794921875, -3.61279296875, -3.4591064453125, -3.305419921875, -3.1517333984375, -2.998046875, -2.8443603515625, -2.690673828125, -2.5369873046875, -2.38330078125, -2.2296142578125, -2.075927734375, -1.9222412109375, -1.7685546875, -1.6148681640625, -1.461181640625, -1.3074951171875, -1.15380859375, -1.0001220703125, -0.846435546875, -0.6927490234375, -0.5390625, -0.3853759765625, -0.231689453125, -0.0780029296875, 0.07568359375, 0.2293701171875, 0.383056640625, 0.5367431640625, 0.6904296875, 0.8441162109375, 0.997802734375, 1.1514892578125, 1.30517578125, 1.4588623046875, 1.612548828125, 1.7662353515625, 1.919921875, 2.0736083984375, 2.227294921875, 2.3809814453125, 2.53466796875, 2.6883544921875, 2.842041015625, 2.9957275390625, 3.1494140625, 3.3031005859375, 3.456787109375, 3.6104736328125, 3.76416015625, 3.9178466796875, 4.071533203125, 4.2252197265625, 4.37890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 10.0, 6.0, 9.0, 22.0, 13.0, 21.0, 29.0, 31.0, 41.0, 52.0, 58.0, 85.0, 124.0, 210.0, 385.0, 1213.0, 10878.0, 1012088.0, 20779.0, 1371.0, 450.0, 189.0, 108.0, 70.0, 62.0, 47.0, 42.0, 37.0, 22.0, 15.0, 14.0, 12.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.157867431640625, -3.06378173828125, -2.969696044921875, -2.8756103515625, -2.781524658203125, -2.68743896484375, -2.593353271484375, -2.499267578125, -2.405181884765625, -2.31109619140625, -2.217010498046875, -2.1229248046875, -2.028839111328125, -1.93475341796875, -1.840667724609375, -1.74658203125, -1.652496337890625, -1.55841064453125, -1.464324951171875, -1.3702392578125, -1.276153564453125, -1.18206787109375, -1.087982177734375, -0.993896484375, -0.899810791015625, -0.80572509765625, -0.711639404296875, -0.6175537109375, -0.523468017578125, -0.42938232421875, -0.335296630859375, -0.2412109375, -0.147125244140625, -0.05303955078125, 0.041046142578125, 0.1351318359375, 0.229217529296875, 0.32330322265625, 0.417388916015625, 0.511474609375, 0.605560302734375, 0.69964599609375, 0.793731689453125, 0.8878173828125, 0.981903076171875, 1.07598876953125, 1.170074462890625, 1.26416015625, 1.358245849609375, 1.45233154296875, 1.546417236328125, 1.6405029296875, 1.734588623046875, 1.82867431640625, 1.922760009765625, 2.016845703125, 2.110931396484375, 2.20501708984375, 2.299102783203125, 2.3931884765625, 2.487274169921875, 2.58135986328125, 2.675445556640625, 2.76953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 11.0, 5.0, 7.0, 20.0, 11.0, 18.0, 25.0, 26.0, 34.0, 34.0, 35.0, 33.0, 52.0, 40.0, 36.0, 46.0, 51.0, 51.0, 49.0, 43.0, 35.0, 34.0, 35.0, 35.0, 34.0, 24.0, 31.0, 29.0, 16.0, 16.0, 13.0, 10.0, 11.0, 10.0, 12.0, 5.0, 2.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99945068359375, -4.8504638671875, -4.70147705078125, -4.552490234375, -4.40350341796875, -4.2545166015625, -4.10552978515625, -3.95654296875, -3.80755615234375, -3.6585693359375, -3.50958251953125, -3.360595703125, -3.21160888671875, -3.0626220703125, -2.91363525390625, -2.7646484375, -2.61566162109375, -2.4666748046875, -2.31768798828125, -2.168701171875, -2.01971435546875, -1.8707275390625, -1.72174072265625, -1.57275390625, -1.42376708984375, -1.2747802734375, -1.12579345703125, -0.976806640625, -0.82781982421875, -0.6788330078125, -0.52984619140625, -0.380859375, -0.23187255859375, -0.0828857421875, 0.06610107421875, 0.215087890625, 0.36407470703125, 0.5130615234375, 0.66204833984375, 0.81103515625, 0.96002197265625, 1.1090087890625, 1.25799560546875, 1.406982421875, 1.55596923828125, 1.7049560546875, 1.85394287109375, 2.0029296875, 2.15191650390625, 2.3009033203125, 2.44989013671875, 2.598876953125, 2.74786376953125, 2.8968505859375, 3.04583740234375, 3.19482421875, 3.34381103515625, 3.4927978515625, 3.64178466796875, 3.790771484375, 3.93975830078125, 4.0887451171875, 4.23773193359375, 4.38671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 8.0, 13.0, 9.0, 17.0, 14.0, 33.0, 31.0, 56.0, 62.0, 98.0, 164.0, 239.0, 396.0, 774.0, 1334.0, 2655.0, 5988.0, 16645.0, 92354.0, 818880.0, 81647.0, 15690.0, 5710.0, 2542.0, 1323.0, 694.0, 411.0, 244.0, 146.0, 118.0, 74.0, 46.0, 37.0, 26.0, 15.0, 16.0, 10.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.14990234375, -0.1451396942138672, -0.14037704467773438, -0.13561439514160156, -0.13085174560546875, -0.12608909606933594, -0.12132644653320312, -0.11656379699707031, -0.1118011474609375, -0.10703849792480469, -0.10227584838867188, -0.09751319885253906, -0.09275054931640625, -0.08798789978027344, -0.08322525024414062, -0.07846260070800781, -0.073699951171875, -0.06893730163574219, -0.06417465209960938, -0.05941200256347656, -0.05464935302734375, -0.04988670349121094, -0.045124053955078125, -0.04036140441894531, -0.0355987548828125, -0.030836105346679688, -0.026073455810546875, -0.021310806274414062, -0.01654815673828125, -0.011785507202148438, -0.007022857666015625, -0.0022602081298828125, 0.00250244140625, 0.0072650909423828125, 0.012027740478515625, 0.016790390014648438, 0.02155303955078125, 0.026315689086914062, 0.031078338623046875, 0.03584098815917969, 0.0406036376953125, 0.04536628723144531, 0.050128936767578125, 0.05489158630371094, 0.05965423583984375, 0.06441688537597656, 0.06917953491210938, 0.07394218444824219, 0.078704833984375, 0.08346748352050781, 0.08823013305664062, 0.09299278259277344, 0.09775543212890625, 0.10251808166503906, 0.10728073120117188, 0.11204338073730469, 0.1168060302734375, 0.12156867980957031, 0.12633132934570312, 0.13109397888183594, 0.13585662841796875, 0.14061927795410156, 0.14538192749023438, 0.1501445770263672, 0.1549072265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 29.0, 115.0, 453.0, 266.0, 61.0, 21.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.128715515136719e-05, -6.92959874868393e-05, -6.73048198223114e-05, -6.531365215778351e-05, -6.332248449325562e-05, -6.133131682872772e-05, -5.934014916419983e-05, -5.7348981499671936e-05, -5.535781383514404e-05, -5.336664617061615e-05, -5.137547850608826e-05, -4.9384310841560364e-05, -4.739314317703247e-05, -4.540197551250458e-05, -4.3410807847976685e-05, -4.141964018344879e-05, -3.94284725189209e-05, -3.7437304854393005e-05, -3.544613718986511e-05, -3.345496952533722e-05, -3.1463801860809326e-05, -2.9472634196281433e-05, -2.748146653175354e-05, -2.5490298867225647e-05, -2.3499131202697754e-05, -2.150796353816986e-05, -1.9516795873641968e-05, -1.7525628209114075e-05, -1.553446054458618e-05, -1.3543292880058289e-05, -1.1552125215530396e-05, -9.560957551002502e-06, -7.569789886474609e-06, -5.578622221946716e-06, -3.5874545574188232e-06, -1.5962868928909302e-06, 3.948807716369629e-07, 2.386048436164856e-06, 4.377216100692749e-06, 6.368383765220642e-06, 8.359551429748535e-06, 1.0350719094276428e-05, 1.2341886758804321e-05, 1.4333054423332214e-05, 1.6324222087860107e-05, 1.8315389752388e-05, 2.0306557416915894e-05, 2.2297725081443787e-05, 2.428889274597168e-05, 2.6280060410499573e-05, 2.8271228075027466e-05, 3.026239573955536e-05, 3.225356340408325e-05, 3.4244731068611145e-05, 3.623589873313904e-05, 3.822706639766693e-05, 4.0218234062194824e-05, 4.220940172672272e-05, 4.420056939125061e-05, 4.6191737055778503e-05, 4.8182904720306396e-05, 5.017407238483429e-05, 5.216524004936218e-05, 5.4156407713890076e-05, 5.614757537841797e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 5.0, 10.0, 10.0, 31.0, 40.0, 55.0, 91.0, 161.0, 300.0, 612.0, 1469.0, 4791.0, 21665.0, 666509.0, 329105.0, 17157.0, 3995.0, 1339.0, 558.0, 259.0, 163.0, 84.0, 52.0, 27.0, 20.0, 17.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17557525634765625, -0.1685333251953125, -0.16149139404296875, -0.154449462890625, -0.14740753173828125, -0.1403656005859375, -0.13332366943359375, -0.12628173828125, -0.11923980712890625, -0.1121978759765625, -0.10515594482421875, -0.098114013671875, -0.09107208251953125, -0.0840301513671875, -0.07698822021484375, -0.0699462890625, -0.06290435791015625, -0.0558624267578125, -0.04882049560546875, -0.041778564453125, -0.03473663330078125, -0.0276947021484375, -0.02065277099609375, -0.01361083984375, -0.00656890869140625, 0.0004730224609375, 0.00751495361328125, 0.014556884765625, 0.02159881591796875, 0.0286407470703125, 0.03568267822265625, 0.042724609375, 0.04976654052734375, 0.0568084716796875, 0.06385040283203125, 0.070892333984375, 0.07793426513671875, 0.0849761962890625, 0.09201812744140625, 0.09906005859375, 0.10610198974609375, 0.1131439208984375, 0.12018585205078125, 0.127227783203125, 0.13426971435546875, 0.1413116455078125, 0.14835357666015625, 0.1553955078125, 0.16243743896484375, 0.1694793701171875, 0.17652130126953125, 0.183563232421875, 0.19060516357421875, 0.1976470947265625, 0.20468902587890625, 0.21173095703125, 0.21877288818359375, 0.2258148193359375, 0.23285675048828125, 0.239898681640625, 0.24694061279296875, 0.2539825439453125, 0.26102447509765625, 0.26806640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 9.0, 15.0, 29.0, 43.0, 90.0, 198.0, 237.0, 145.0, 87.0, 43.0, 29.0, 23.0, 13.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1058349609375, -0.10308170318603516, -0.10032844543457031, -0.09757518768310547, -0.09482192993164062, -0.09206867218017578, -0.08931541442871094, -0.0865621566772461, -0.08380889892578125, -0.0810556411743164, -0.07830238342285156, -0.07554912567138672, -0.07279586791992188, -0.07004261016845703, -0.06728935241699219, -0.06453609466552734, -0.0617828369140625, -0.059029579162597656, -0.05627632141113281, -0.05352306365966797, -0.050769805908203125, -0.04801654815673828, -0.04526329040527344, -0.042510032653808594, -0.03975677490234375, -0.037003517150878906, -0.03425025939941406, -0.03149700164794922, -0.028743743896484375, -0.02599048614501953, -0.023237228393554688, -0.020483970642089844, -0.017730712890625, -0.014977455139160156, -0.012224197387695312, -0.009470939636230469, -0.006717681884765625, -0.003964424133300781, -0.0012111663818359375, 0.0015420913696289062, 0.00429534912109375, 0.007048606872558594, 0.009801864624023438, 0.012555122375488281, 0.015308380126953125, 0.01806163787841797, 0.020814895629882812, 0.023568153381347656, 0.0263214111328125, 0.029074668884277344, 0.03182792663574219, 0.03458118438720703, 0.037334442138671875, 0.04008769989013672, 0.04284095764160156, 0.045594215393066406, 0.04834747314453125, 0.051100730895996094, 0.05385398864746094, 0.05660724639892578, 0.059360504150390625, 0.06211376190185547, 0.06486701965332031, 0.06762027740478516, 0.07037353515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 19.0, 17.0, 16.0, 34.0, 53.0, 49.0, 66.0, 102.0, 119.0, 116.0, 97.0, 82.0, 57.0, 44.0, 28.0, 26.0, 21.0, 13.0, 6.0, 10.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.479384660720825, -2.399658441543579, -2.319932460784912, -2.240206241607666, -2.16048002243042, -2.080754041671753, -2.001027822494507, -1.9213017225265503, -1.8415756225585938, -1.7618495225906372, -1.6821233034133911, -1.6023972034454346, -1.522671103477478, -1.4429450035095215, -1.3632187843322754, -1.2834926843643188, -1.2037664651870728, -1.1240403652191162, -1.0443141460418701, -0.9645880460739136, -0.884861946105957, -0.8051357865333557, -0.7254096269607544, -0.6456835269927979, -0.5659573674201965, -0.4862312376499176, -0.40650510787963867, -0.32677894830703735, -0.24705281853675842, -0.1673266887664795, -0.08760052919387817, -0.00787442922592163, 0.07185173034667969, 0.15157786011695862, 0.23130400478839874, 0.31103014945983887, 0.3907562792301178, 0.47048240900039673, 0.550208568572998, 0.6299346685409546, 0.7096608281135559, 0.7893869876861572, 0.8691130876541138, 0.9488392472267151, 1.0285654067993164, 1.108291506767273, 1.1880176067352295, 1.2677438259124756, 1.3474699258804321, 1.4271960258483887, 1.5069222450256348, 1.5866483449935913, 1.6663744449615479, 1.746100664138794, 1.8258267641067505, 1.905552864074707, 1.9852790832519531, 2.065005302429199, 2.144731283187866, 2.2244575023651123, 2.3041837215423584, 2.3839097023010254, 2.4636359214782715, 2.5433621406555176, 2.6230881214141846]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 11.0, 6.0, 6.0, 9.0, 13.0, 9.0, 9.0, 22.0, 21.0, 28.0, 28.0, 25.0, 28.0, 37.0, 26.0, 38.0, 31.0, 35.0, 27.0, 53.0, 40.0, 33.0, 34.0, 36.0, 43.0, 39.0, 29.0, 34.0, 28.0, 25.0, 29.0, 25.0, 24.0, 13.0, 21.0, 21.0, 11.0, 9.0, 9.0, 13.0, 3.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.507295608520508, -6.283201217651367, -6.059106349945068, -5.8350114822387695, -5.610917091369629, -5.386822700500488, -5.1627278327941895, -4.938632965087891, -4.71453857421875, -4.490444183349609, -4.2663493156433105, -4.042254447937012, -3.818160057067871, -3.5940654277801514, -3.3699707984924316, -3.145876169204712, -2.921781539916992, -2.6976869106292725, -2.4735922813415527, -2.249497652053833, -2.0254030227661133, -1.8013083934783936, -1.5772137641906738, -1.353119134902954, -1.1290245056152344, -0.9049298763275146, -0.6808352470397949, -0.4567406177520752, -0.23264598846435547, -0.008551359176635742, 0.21554327011108398, 0.4396378993988037, 0.6637330055236816, 0.8878276348114014, 1.111922264099121, 1.3360168933868408, 1.5601115226745605, 1.7842061519622803, 2.00830078125, 2.2323954105377197, 2.4564900398254395, 2.680584669113159, 2.904679298400879, 3.1287739276885986, 3.3528685569763184, 3.576963186264038, 3.801057815551758, 4.025152206420898, 4.249247074127197, 4.473341941833496, 4.697436332702637, 4.921530723571777, 5.145625591278076, 5.369720458984375, 5.593814849853516, 5.817909240722656, 6.042004108428955, 6.266098976135254, 6.4901933670043945, 6.714287757873535, 6.938382625579834, 7.162477493286133, 7.386571884155273, 7.610666275024414, 7.834761142730713]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 12.0, 9.0, 8.0, 21.0, 22.0, 26.0, 48.0, 99.0, 156.0, 277.0, 616.0, 1469.0, 3742.0, 10691.0, 59128.0, 2125065.0, 1921191.0, 54649.0, 10837.0, 3561.0, 1409.0, 583.0, 268.0, 130.0, 69.0, 59.0, 16.0, 20.0, 13.0, 11.0, 13.0, 18.0, 7.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.009429931640625, -2.91534423828125, -2.821258544921875, -2.7271728515625, -2.633087158203125, -2.53900146484375, -2.444915771484375, -2.350830078125, -2.256744384765625, -2.16265869140625, -2.068572998046875, -1.9744873046875, -1.880401611328125, -1.78631591796875, -1.692230224609375, -1.59814453125, -1.504058837890625, -1.40997314453125, -1.315887451171875, -1.2218017578125, -1.127716064453125, -1.03363037109375, -0.939544677734375, -0.845458984375, -0.751373291015625, -0.65728759765625, -0.563201904296875, -0.4691162109375, -0.375030517578125, -0.28094482421875, -0.186859130859375, -0.0927734375, 0.001312255859375, 0.09539794921875, 0.189483642578125, 0.2835693359375, 0.377655029296875, 0.47174072265625, 0.565826416015625, 0.659912109375, 0.753997802734375, 0.84808349609375, 0.942169189453125, 1.0362548828125, 1.130340576171875, 1.22442626953125, 1.318511962890625, 1.41259765625, 1.506683349609375, 1.60076904296875, 1.694854736328125, 1.7889404296875, 1.883026123046875, 1.97711181640625, 2.071197509765625, 2.165283203125, 2.259368896484375, 2.35345458984375, 2.447540283203125, 2.5416259765625, 2.635711669921875, 2.72979736328125, 2.823883056640625, 2.91796875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 7.0, 19.0, 9.0, 15.0, 23.0, 23.0, 28.0, 26.0, 37.0, 36.0, 37.0, 32.0, 39.0, 43.0, 48.0, 50.0, 44.0, 49.0, 42.0, 55.0, 44.0, 31.0, 33.0, 29.0, 32.0, 28.0, 25.0, 20.0, 19.0, 13.0, 9.0, 6.0, 7.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.2216796875, -1.1895370483398438, -1.1573944091796875, -1.1252517700195312, -1.093109130859375, -1.0609664916992188, -1.0288238525390625, -0.9966812133789062, -0.96453857421875, -0.9323959350585938, -0.9002532958984375, -0.8681106567382812, -0.835968017578125, -0.8038253784179688, -0.7716827392578125, -0.7395401000976562, -0.7073974609375, -0.6752548217773438, -0.6431121826171875, -0.6109695434570312, -0.578826904296875, -0.5466842651367188, -0.5145416259765625, -0.48239898681640625, -0.45025634765625, -0.41811370849609375, -0.3859710693359375, -0.35382843017578125, -0.321685791015625, -0.28954315185546875, -0.2574005126953125, -0.22525787353515625, -0.193115234375, -0.16097259521484375, -0.1288299560546875, -0.09668731689453125, -0.064544677734375, -0.03240203857421875, -0.0002593994140625, 0.03188323974609375, 0.06402587890625, 0.09616851806640625, 0.1283111572265625, 0.16045379638671875, 0.192596435546875, 0.22473907470703125, 0.2568817138671875, 0.28902435302734375, 0.3211669921875, 0.35330963134765625, 0.3854522705078125, 0.41759490966796875, 0.449737548828125, 0.48188018798828125, 0.5140228271484375, 0.5461654663085938, 0.57830810546875, 0.6104507446289062, 0.6425933837890625, 0.6747360229492188, 0.706878662109375, 0.7390213012695312, 0.7711639404296875, 0.8033065795898438, 0.83544921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 20.0, 37.0, 114.0, 1006.0, 4192238.0, 634.0, 114.0, 40.0, 27.0, 8.0, 14.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -21.9296875, -20.953125, -19.9765625, -19.0, -18.0234375, -17.046875, -16.0703125, -15.09375, -14.1171875, -13.140625, -12.1640625, -11.1875, -10.2109375, -9.234375, -8.2578125, -7.28125, -6.3046875, -5.328125, -4.3515625, -3.375, -2.3984375, -1.421875, -0.4453125, 0.53125, 1.5078125, 2.484375, 3.4609375, 4.4375, 5.4140625, 6.390625, 7.3671875, 8.34375, 9.3203125, 10.296875, 11.2734375, 12.25, 13.2265625, 14.203125, 15.1796875, 16.15625, 17.1328125, 18.109375, 19.0859375, 20.0625, 21.0390625, 22.015625, 22.9921875, 23.96875, 24.9453125, 25.921875, 26.8984375, 27.875, 28.8515625, 29.828125, 30.8046875, 31.78125, 32.7578125, 33.734375, 34.7109375, 35.6875, 36.6640625, 37.640625, 38.6171875, 39.59375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 5.0, 15.0, 15.0, 37.0, 27.0, 49.0, 65.0, 106.0, 157.0, 351.0, 758.0, 1122.0, 624.0, 294.0, 138.0, 85.0, 54.0, 45.0, 29.0, 23.0, 21.0, 9.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71826171875, -0.6973495483398438, -0.6764373779296875, -0.6555252075195312, -0.634613037109375, -0.6137008666992188, -0.5927886962890625, -0.5718765258789062, -0.55096435546875, -0.5300521850585938, -0.5091400146484375, -0.48822784423828125, -0.467315673828125, -0.44640350341796875, -0.4254913330078125, -0.40457916259765625, -0.3836669921875, -0.36275482177734375, -0.3418426513671875, -0.32093048095703125, -0.300018310546875, -0.27910614013671875, -0.2581939697265625, -0.23728179931640625, -0.21636962890625, -0.19545745849609375, -0.1745452880859375, -0.15363311767578125, -0.132720947265625, -0.11180877685546875, -0.0908966064453125, -0.06998443603515625, -0.049072265625, -0.02816009521484375, -0.0072479248046875, 0.01366424560546875, 0.034576416015625, 0.05548858642578125, 0.0764007568359375, 0.09731292724609375, 0.11822509765625, 0.13913726806640625, 0.1600494384765625, 0.18096160888671875, 0.201873779296875, 0.22278594970703125, 0.2436981201171875, 0.26461029052734375, 0.2855224609375, 0.30643463134765625, 0.3273468017578125, 0.34825897216796875, 0.369171142578125, 0.39008331298828125, 0.4109954833984375, 0.43190765380859375, 0.45281982421875, 0.47373199462890625, 0.4946441650390625, 0.5155563354492188, 0.536468505859375, 0.5573806762695312, 0.5782928466796875, 0.5992050170898438, 0.6201171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 18.0, 18.0, 28.0, 27.0, 32.0, 61.0, 96.0, 105.0, 97.0, 135.0, 85.0, 73.0, 53.0, 37.0, 34.0, 19.0, 16.0, 11.0, 9.0, 6.0, 8.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5102577209472656, -2.450434684753418, -2.3906118869781494, -2.3307888507843018, -2.270966053009033, -2.2111430168151855, -2.151320219039917, -2.0914971828460693, -2.031674385070801, -1.9718514680862427, -1.9120285511016846, -1.8522056341171265, -1.7923827171325684, -1.7325596809387207, -1.6727367639541626, -1.6129138469696045, -1.5530908107757568, -1.4932678937911987, -1.4334449768066406, -1.3736220598220825, -1.3137991428375244, -1.2539761066436768, -1.1941531896591187, -1.1343302726745605, -1.0745073556900024, -1.0146844387054443, -0.9548615217208862, -0.8950385451316833, -0.8352156281471252, -0.7753927111625671, -0.7155697345733643, -0.6557468175888062, -0.5959240198135376, -0.5361011028289795, -0.476278156042099, -0.4164552092552185, -0.3566322922706604, -0.2968093752861023, -0.2369864284992218, -0.1771634817123413, -0.1173405647277832, -0.057517632842063904, 0.0023052990436553955, 0.062128230929374695, 0.121951162815094, 0.1817740797996521, 0.2415970265865326, 0.3014199733734131, 0.3612428903579712, 0.4210658073425293, 0.4808887541294098, 0.5407117009162903, 0.6005346179008484, 0.6603575348854065, 0.7201805114746094, 0.7800034284591675, 0.8398263454437256, 0.8996492624282837, 0.9594721794128418, 1.0192950963974, 1.079118013381958, 1.1389410495758057, 1.1987639665603638, 1.2585868835449219, 1.31840980052948]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 15.0, 13.0, 14.0, 19.0, 28.0, 32.0, 31.0, 35.0, 33.0, 27.0, 25.0, 27.0, 33.0, 45.0, 51.0, 53.0, 46.0, 39.0, 42.0, 42.0, 32.0, 33.0, 37.0, 29.0, 23.0, 30.0, 26.0, 26.0, 11.0, 15.0, 7.0, 12.0, 6.0, 6.0, 4.0, 8.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1077584028244019, -1.0767717361450195, -1.0457850694656372, -1.0147982835769653, -0.983811616897583, -0.9528249502182007, -0.9218382835388184, -0.8908515572547913, -0.8598648309707642, -0.8288781642913818, -0.7978914380073547, -0.7669047713279724, -0.7359180450439453, -0.704931378364563, -0.6739447116851807, -0.6429579854011536, -0.6119713187217712, -0.5809846520423889, -0.5499979257583618, -0.5190112590789795, -0.4880245327949524, -0.45703786611557007, -0.42605116963386536, -0.39506447315216064, -0.36407777667045593, -0.3330910801887512, -0.3021043837070465, -0.2711176872253418, -0.24013100564479828, -0.20914430916309357, -0.17815762758255005, -0.14717093110084534, -0.11618417501449585, -0.08519747853279114, -0.05421078950166702, -0.023224100470542908, 0.007762596011161804, 0.038749292492866516, 0.06973597407341003, 0.10072267055511475, 0.13170936703681946, 0.16269606351852417, 0.19368276000022888, 0.2246694415807724, 0.2556561231613159, 0.286642849445343, 0.31762951612472534, 0.34861621260643005, 0.37960290908813477, 0.4105896055698395, 0.4415763020515442, 0.4725629687309265, 0.5035496950149536, 0.5345363616943359, 0.5655230283737183, 0.5965097546577454, 0.6274964809417725, 0.6584831476211548, 0.6894698739051819, 0.7204565405845642, 0.7514432668685913, 0.7824299335479736, 0.813416600227356, 0.8444033265113831, 0.8753899931907654]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 45.0, 82.0, 82.0, 114.0, 158.0, 217.0, 304.0, 486.0, 743.0, 1149.0, 1955.0, 3142.0, 5618.0, 10458.0, 22197.0, 51631.0, 140810.0, 387232.0, 264109.0, 87930.0, 35092.0, 15674.0, 7851.0, 4342.0, 2573.0, 1562.0, 984.0, 584.0, 417.0, 260.0, 188.0, 149.0, 102.0, 70.0, 50.0, 22.0, 28.0, 16.0, 17.0, 11.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.488037109375, -0.4731483459472656, -0.45825958251953125, -0.4433708190917969, -0.4284820556640625, -0.4135932922363281, -0.39870452880859375, -0.3838157653808594, -0.368927001953125, -0.3540382385253906, -0.33914947509765625, -0.3242607116699219, -0.3093719482421875, -0.2944831848144531, -0.27959442138671875, -0.2647056579589844, -0.24981689453125, -0.23492813110351562, -0.22003936767578125, -0.20515060424804688, -0.1902618408203125, -0.17537307739257812, -0.16048431396484375, -0.14559555053710938, -0.130706787109375, -0.11581802368164062, -0.10092926025390625, -0.08604049682617188, -0.0711517333984375, -0.056262969970703125, -0.04137420654296875, -0.026485443115234375, -0.0115966796875, 0.003292083740234375, 0.01818084716796875, 0.033069610595703125, 0.0479583740234375, 0.06284713745117188, 0.07773590087890625, 0.09262466430664062, 0.107513427734375, 0.12240219116210938, 0.13729095458984375, 0.15217971801757812, 0.1670684814453125, 0.18195724487304688, 0.19684600830078125, 0.21173477172851562, 0.22662353515625, 0.24151229858398438, 0.25640106201171875, 0.2712898254394531, 0.2861785888671875, 0.3010673522949219, 0.31595611572265625, 0.3308448791503906, 0.345733642578125, 0.3606224060058594, 0.37551116943359375, 0.3903999328613281, 0.4052886962890625, 0.4201774597167969, 0.43506622314453125, 0.4499549865722656, 0.46484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 6.0, 10.0, 11.0, 5.0, 10.0, 14.0, 23.0, 35.0, 33.0, 22.0, 43.0, 37.0, 34.0, 27.0, 39.0, 37.0, 57.0, 47.0, 45.0, 51.0, 49.0, 39.0, 46.0, 29.0, 33.0, 23.0, 26.0, 29.0, 24.0, 21.0, 12.0, 16.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 9.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.796875, -0.774658203125, -0.75244140625, -0.730224609375, -0.7080078125, -0.685791015625, -0.66357421875, -0.641357421875, -0.619140625, -0.596923828125, -0.57470703125, -0.552490234375, -0.5302734375, -0.508056640625, -0.48583984375, -0.463623046875, -0.44140625, -0.419189453125, -0.39697265625, -0.374755859375, -0.3525390625, -0.330322265625, -0.30810546875, -0.285888671875, -0.263671875, -0.241455078125, -0.21923828125, -0.197021484375, -0.1748046875, -0.152587890625, -0.13037109375, -0.108154296875, -0.0859375, -0.063720703125, -0.04150390625, -0.019287109375, 0.0029296875, 0.025146484375, 0.04736328125, 0.069580078125, 0.091796875, 0.114013671875, 0.13623046875, 0.158447265625, 0.1806640625, 0.202880859375, 0.22509765625, 0.247314453125, 0.26953125, 0.291748046875, 0.31396484375, 0.336181640625, 0.3583984375, 0.380615234375, 0.40283203125, 0.425048828125, 0.447265625, 0.469482421875, 0.49169921875, 0.513916015625, 0.5361328125, 0.558349609375, 0.58056640625, 0.602783203125, 0.625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 8.0, 10.0, 13.0, 19.0, 19.0, 24.0, 50.0, 72.0, 74.0, 136.0, 177.0, 270.0, 450.0, 604.0, 1059.0, 1822.0, 3393.0, 6704.0, 14834.0, 38305.0, 115876.0, 385495.0, 326855.0, 93807.0, 31969.0, 12940.0, 5936.0, 3014.0, 1744.0, 1015.0, 614.0, 361.0, 275.0, 168.0, 127.0, 86.0, 67.0, 48.0, 34.0, 17.0, 18.0, 13.0, 6.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.487060546875, -0.4722633361816406, -0.45746612548828125, -0.4426689147949219, -0.4278717041015625, -0.4130744934082031, -0.39827728271484375, -0.3834800720214844, -0.368682861328125, -0.3538856506347656, -0.33908843994140625, -0.3242912292480469, -0.3094940185546875, -0.2946968078613281, -0.27989959716796875, -0.2651023864746094, -0.25030517578125, -0.23550796508789062, -0.22071075439453125, -0.20591354370117188, -0.1911163330078125, -0.17631912231445312, -0.16152191162109375, -0.14672470092773438, -0.131927490234375, -0.11713027954101562, -0.10233306884765625, -0.08753585815429688, -0.0727386474609375, -0.057941436767578125, -0.04314422607421875, -0.028347015380859375, -0.0135498046875, 0.001247406005859375, 0.01604461669921875, 0.030841827392578125, 0.0456390380859375, 0.060436248779296875, 0.07523345947265625, 0.09003067016601562, 0.104827880859375, 0.11962509155273438, 0.13442230224609375, 0.14921951293945312, 0.1640167236328125, 0.17881393432617188, 0.19361114501953125, 0.20840835571289062, 0.22320556640625, 0.23800277709960938, 0.25279998779296875, 0.2675971984863281, 0.2823944091796875, 0.2971916198730469, 0.31198883056640625, 0.3267860412597656, 0.341583251953125, 0.3563804626464844, 0.37117767333984375, 0.3859748840332031, 0.4007720947265625, 0.4155693054199219, 0.43036651611328125, 0.4451637268066406, 0.4599609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 16.0, 12.0, 22.0, 23.0, 22.0, 37.0, 29.0, 47.0, 42.0, 42.0, 63.0, 55.0, 64.0, 60.0, 68.0, 62.0, 57.0, 34.0, 45.0, 40.0, 41.0, 28.0, 13.0, 18.0, 19.0, 7.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9990234375, -1.9416961669921875, -1.884368896484375, -1.8270416259765625, -1.76971435546875, -1.7123870849609375, -1.655059814453125, -1.5977325439453125, -1.5404052734375, -1.4830780029296875, -1.425750732421875, -1.3684234619140625, -1.31109619140625, -1.2537689208984375, -1.196441650390625, -1.1391143798828125, -1.081787109375, -1.0244598388671875, -0.967132568359375, -0.9098052978515625, -0.85247802734375, -0.7951507568359375, -0.737823486328125, -0.6804962158203125, -0.6231689453125, -0.5658416748046875, -0.508514404296875, -0.4511871337890625, -0.39385986328125, -0.3365325927734375, -0.279205322265625, -0.2218780517578125, -0.16455078125, -0.1072235107421875, -0.049896240234375, 0.0074310302734375, 0.06475830078125, 0.1220855712890625, 0.179412841796875, 0.2367401123046875, 0.2940673828125, 0.3513946533203125, 0.408721923828125, 0.4660491943359375, 0.52337646484375, 0.5807037353515625, 0.638031005859375, 0.6953582763671875, 0.752685546875, 0.8100128173828125, 0.867340087890625, 0.9246673583984375, 0.98199462890625, 1.0393218994140625, 1.096649169921875, 1.1539764404296875, 1.2113037109375, 1.2686309814453125, 1.325958251953125, 1.3832855224609375, 1.44061279296875, 1.4979400634765625, 1.555267333984375, 1.6125946044921875, 1.669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 16.0, 18.0, 27.0, 33.0, 70.0, 124.0, 163.0, 284.0, 531.0, 960.0, 2233.0, 5241.0, 16280.0, 63873.0, 369235.0, 476382.0, 81931.0, 20028.0, 6236.0, 2441.0, 1108.0, 590.0, 315.0, 168.0, 94.0, 49.0, 42.0, 19.0, 12.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12181282043457031, -0.11789321899414062, -0.11397361755371094, -0.11005401611328125, -0.10613441467285156, -0.10221481323242188, -0.09829521179199219, -0.0943756103515625, -0.09045600891113281, -0.08653640747070312, -0.08261680603027344, -0.07869720458984375, -0.07477760314941406, -0.07085800170898438, -0.06693840026855469, -0.063018798828125, -0.05909919738769531, -0.055179595947265625, -0.05125999450683594, -0.04734039306640625, -0.04342079162597656, -0.039501190185546875, -0.03558158874511719, -0.0316619873046875, -0.027742385864257812, -0.023822784423828125, -0.019903182983398438, -0.01598358154296875, -0.012063980102539062, -0.008144378662109375, -0.0042247772216796875, -0.00030517578125, 0.0036144256591796875, 0.007534027099609375, 0.011453628540039062, 0.01537322998046875, 0.019292831420898438, 0.023212432861328125, 0.027132034301757812, 0.0310516357421875, 0.03497123718261719, 0.038890838623046875, 0.04281044006347656, 0.04673004150390625, 0.05064964294433594, 0.054569244384765625, 0.05848884582519531, 0.062408447265625, 0.06632804870605469, 0.07024765014648438, 0.07416725158691406, 0.07808685302734375, 0.08200645446777344, 0.08592605590820312, 0.08984565734863281, 0.0937652587890625, 0.09768486022949219, 0.10160446166992188, 0.10552406311035156, 0.10944366455078125, 0.11336326599121094, 0.11728286743164062, 0.12120246887207031, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 10.0, 12.0, 16.0, 19.0, 27.0, 32.0, 44.0, 58.0, 63.0, 77.0, 122.0, 100.0, 97.0, 79.0, 57.0, 39.0, 30.0, 28.0, 16.0, 15.0, 9.0, 8.0, 12.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.975101470947266e-05, -7.766392081975937e-05, -7.557682693004608e-05, -7.34897330403328e-05, -7.140263915061951e-05, -6.931554526090622e-05, -6.722845137119293e-05, -6.514135748147964e-05, -6.305426359176636e-05, -6.096716970205307e-05, -5.888007581233978e-05, -5.6792981922626495e-05, -5.470588803291321e-05, -5.261879414319992e-05, -5.053170025348663e-05, -4.8444606363773346e-05, -4.635751247406006e-05, -4.427041858434677e-05, -4.2183324694633484e-05, -4.0096230804920197e-05, -3.800913691520691e-05, -3.592204302549362e-05, -3.3834949135780334e-05, -3.174785524606705e-05, -2.966076135635376e-05, -2.7573667466640472e-05, -2.5486573576927185e-05, -2.3399479687213898e-05, -2.131238579750061e-05, -1.9225291907787323e-05, -1.7138198018074036e-05, -1.5051104128360748e-05, -1.2964010238647461e-05, -1.0876916348934174e-05, -8.789822459220886e-06, -6.702728569507599e-06, -4.6156346797943115e-06, -2.528540790081024e-06, -4.414469003677368e-07, 1.6456469893455505e-06, 3.732740879058838e-06, 5.819834768772125e-06, 7.906928658485413e-06, 9.9940225481987e-06, 1.2081116437911987e-05, 1.4168210327625275e-05, 1.6255304217338562e-05, 1.834239810705185e-05, 2.0429491996765137e-05, 2.2516585886478424e-05, 2.460367977619171e-05, 2.6690773665905e-05, 2.8777867555618286e-05, 3.0864961445331573e-05, 3.295205533504486e-05, 3.503914922475815e-05, 3.7126243114471436e-05, 3.921333700418472e-05, 4.130043089389801e-05, 4.33875247836113e-05, 4.5474618673324585e-05, 4.756171256303787e-05, 4.964880645275116e-05, 5.173590034246445e-05, 5.3822994232177734e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 9.0, 13.0, 5.0, 17.0, 25.0, 29.0, 36.0, 55.0, 128.0, 328.0, 835.0, 2394.0, 7607.0, 30121.0, 180654.0, 665984.0, 127269.0, 23585.0, 6176.0, 1971.0, 700.0, 278.0, 120.0, 81.0, 39.0, 23.0, 21.0, 10.0, 6.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13149642944335938, -0.12651824951171875, -0.12154006958007812, -0.1165618896484375, -0.11158370971679688, -0.10660552978515625, -0.10162734985351562, -0.096649169921875, -0.09167098999023438, -0.08669281005859375, -0.08171463012695312, -0.0767364501953125, -0.07175827026367188, -0.06678009033203125, -0.061801910400390625, -0.05682373046875, -0.051845550537109375, -0.04686737060546875, -0.041889190673828125, -0.0369110107421875, -0.031932830810546875, -0.02695465087890625, -0.021976470947265625, -0.016998291015625, -0.012020111083984375, -0.00704193115234375, -0.002063751220703125, 0.0029144287109375, 0.007892608642578125, 0.01287078857421875, 0.017848968505859375, 0.0228271484375, 0.027805328369140625, 0.03278350830078125, 0.037761688232421875, 0.0427398681640625, 0.047718048095703125, 0.05269622802734375, 0.057674407958984375, 0.062652587890625, 0.06763076782226562, 0.07260894775390625, 0.07758712768554688, 0.0825653076171875, 0.08754348754882812, 0.09252166748046875, 0.09749984741210938, 0.10247802734375, 0.10745620727539062, 0.11243438720703125, 0.11741256713867188, 0.1223907470703125, 0.12736892700195312, 0.13234710693359375, 0.13732528686523438, 0.142303466796875, 0.14728164672851562, 0.15225982666015625, 0.15723800659179688, 0.1622161865234375, 0.16719436645507812, 0.17217254638671875, 0.17715072631835938, 0.18212890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 0.0, 5.0, 7.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 27.0, 28.0, 39.0, 56.0, 55.0, 55.0, 62.0, 71.0, 83.0, 92.0, 68.0, 63.0, 28.0, 35.0, 27.0, 28.0, 29.0, 7.0, 12.0, 10.0, 13.0, 7.0, 8.0, 6.0, 7.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032318115234375, -0.031420230865478516, -0.03052234649658203, -0.029624462127685547, -0.028726577758789062, -0.027828693389892578, -0.026930809020996094, -0.02603292465209961, -0.025135040283203125, -0.02423715591430664, -0.023339271545410156, -0.022441387176513672, -0.021543502807617188, -0.020645618438720703, -0.01974773406982422, -0.018849849700927734, -0.01795196533203125, -0.017054080963134766, -0.01615619659423828, -0.015258312225341797, -0.014360427856445312, -0.013462543487548828, -0.012564659118652344, -0.01166677474975586, -0.010768890380859375, -0.00987100601196289, -0.008973121643066406, -0.008075237274169922, -0.0071773529052734375, -0.006279468536376953, -0.005381584167480469, -0.004483699798583984, -0.0035858154296875, -0.0026879310607910156, -0.0017900466918945312, -0.0008921623229980469, 5.7220458984375e-06, 0.0009036064147949219, 0.0018014907836914062, 0.0026993751525878906, 0.003597259521484375, 0.004495143890380859, 0.005393028259277344, 0.006290912628173828, 0.0071887969970703125, 0.008086681365966797, 0.008984565734863281, 0.009882450103759766, 0.01078033447265625, 0.011678218841552734, 0.012576103210449219, 0.013473987579345703, 0.014371871948242188, 0.015269756317138672, 0.016167640686035156, 0.01706552505493164, 0.017963409423828125, 0.01886129379272461, 0.019759178161621094, 0.020657062530517578, 0.021554946899414062, 0.022452831268310547, 0.02335071563720703, 0.024248600006103516, 0.025146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 23.0, 37.0, 29.0, 68.0, 137.0, 200.0, 207.0, 105.0, 73.0, 37.0, 26.0, 17.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.530160665512085, -2.473973512649536, -2.4177865982055664, -2.3615994453430176, -2.305412530899048, -2.249225378036499, -2.1930384635925293, -2.1368513107299805, -2.0806641578674316, -2.024477005004883, -1.968290090560913, -1.9121030569076538, -1.8559160232543945, -1.7997288703918457, -1.7435418367385864, -1.6873548030853271, -1.6311678886413574, -1.5749808549880981, -1.5187938213348389, -1.4626067876815796, -1.4064197540283203, -1.3502326011657715, -1.2940455675125122, -1.237858533859253, -1.1816715002059937, -1.1254844665527344, -1.069297432899475, -1.0131103992462158, -0.9569233059883118, -0.9007362723350525, -0.8445491790771484, -0.7883621454238892, -0.7321751117706299, -0.6759880781173706, -0.6198010444641113, -0.5636139512062073, -0.507426917552948, -0.4512398838996887, -0.39505282044410706, -0.3388657569885254, -0.2826787233352661, -0.22649167478084564, -0.17030462622642517, -0.1141175776720047, -0.05793052911758423, -0.0017434954643249512, 0.054443567991256714, 0.11063063144683838, 0.16681766510009766, 0.22300471365451813, 0.2791917622089386, 0.33537882566452026, 0.39156585931777954, 0.4477528929710388, 0.5039399862289429, 0.5601270198822021, 0.6163140535354614, 0.6725010871887207, 0.72868812084198, 0.784875214099884, 0.8410622477531433, 0.8972492814064026, 0.9534363746643066, 1.009623408317566, 1.0658104419708252]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 5.0, 6.0, 18.0, 9.0, 15.0, 20.0, 27.0, 30.0, 32.0, 38.0, 33.0, 29.0, 18.0, 36.0, 53.0, 33.0, 49.0, 47.0, 31.0, 63.0, 37.0, 36.0, 41.0, 34.0, 40.0, 25.0, 31.0, 22.0, 27.0, 20.0, 12.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 9.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7298775911331177, -0.708768367767334, -0.6876590847969055, -0.666549801826477, -0.6454405784606934, -0.6243313550949097, -0.6032220721244812, -0.5821127891540527, -0.561003565788269, -0.5398943424224854, -0.5187850594520569, -0.4976758062839508, -0.4765665531158447, -0.45545729994773865, -0.43434804677963257, -0.4132387936115265, -0.3921295404434204, -0.37102028727531433, -0.34991103410720825, -0.3288017809391022, -0.3076925277709961, -0.28658327460289, -0.26547402143478394, -0.24436476826667786, -0.22325551509857178, -0.2021462619304657, -0.18103700876235962, -0.15992775559425354, -0.13881850242614746, -0.11770924925804138, -0.0965999960899353, -0.07549074292182922, -0.054381489753723145, -0.033272236585617065, -0.012162983417510986, 0.008946269750595093, 0.030055522918701172, 0.05116477608680725, 0.07227402925491333, 0.09338328242301941, 0.11449253559112549, 0.13560178875923157, 0.15671104192733765, 0.17782029509544373, 0.1989295482635498, 0.22003880143165588, 0.24114805459976196, 0.26225730776786804, 0.2833665609359741, 0.3044758141040802, 0.3255850672721863, 0.34669432044029236, 0.36780357360839844, 0.3889128267765045, 0.4100220799446106, 0.4311313331127167, 0.45224058628082275, 0.47334983944892883, 0.4944590926170349, 0.5155683755874634, 0.5366775989532471, 0.5577868223190308, 0.5788961052894592, 0.6000053882598877, 0.6211146116256714]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 12.0, 19.0, 23.0, 34.0, 45.0, 68.0, 107.0, 118.0, 188.0, 259.0, 394.0, 541.0, 890.0, 1363.0, 2385.0, 5039.0, 12823.0, 47464.0, 290005.0, 557730.0, 92988.0, 20907.0, 7014.0, 3245.0, 1678.0, 1074.0, 622.0, 440.0, 308.0, 205.0, 148.0, 105.0, 69.0, 62.0, 46.0, 39.0, 23.0, 15.0, 9.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.491943359375, -0.47509765625, -0.458251953125, -0.44140625, -0.424560546875, -0.40771484375, -0.390869140625, -0.3740234375, -0.357177734375, -0.34033203125, -0.323486328125, -0.306640625, -0.289794921875, -0.27294921875, -0.256103515625, -0.2392578125, -0.222412109375, -0.20556640625, -0.188720703125, -0.171875, -0.155029296875, -0.13818359375, -0.121337890625, -0.1044921875, -0.087646484375, -0.07080078125, -0.053955078125, -0.037109375, -0.020263671875, -0.00341796875, 0.013427734375, 0.0302734375, 0.047119140625, 0.06396484375, 0.080810546875, 0.09765625, 0.114501953125, 0.13134765625, 0.148193359375, 0.1650390625, 0.181884765625, 0.19873046875, 0.215576171875, 0.232421875, 0.249267578125, 0.26611328125, 0.282958984375, 0.2998046875, 0.316650390625, 0.33349609375, 0.350341796875, 0.3671875, 0.384033203125, 0.40087890625, 0.417724609375, 0.4345703125, 0.451416015625, 0.46826171875, 0.485107421875, 0.501953125, 0.518798828125, 0.53564453125, 0.552490234375, 0.5693359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 6.0, 4.0, 11.0, 8.0, 14.0, 8.0, 12.0, 19.0, 23.0, 31.0, 26.0, 35.0, 35.0, 28.0, 42.0, 36.0, 43.0, 44.0, 48.0, 43.0, 46.0, 56.0, 44.0, 43.0, 42.0, 25.0, 28.0, 24.0, 31.0, 28.0, 24.0, 22.0, 18.0, 17.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.01220703125, -1.9541015625, -1.89599609375, -1.837890625, -1.77978515625, -1.7216796875, -1.66357421875, -1.60546875, -1.54736328125, -1.4892578125, -1.43115234375, -1.373046875, -1.31494140625, -1.2568359375, -1.19873046875, -1.140625, -1.08251953125, -1.0244140625, -0.96630859375, -0.908203125, -0.85009765625, -0.7919921875, -0.73388671875, -0.67578125, -0.61767578125, -0.5595703125, -0.50146484375, -0.443359375, -0.38525390625, -0.3271484375, -0.26904296875, -0.2109375, -0.15283203125, -0.0947265625, -0.03662109375, 0.021484375, 0.07958984375, 0.1376953125, 0.19580078125, 0.25390625, 0.31201171875, 0.3701171875, 0.42822265625, 0.486328125, 0.54443359375, 0.6025390625, 0.66064453125, 0.71875, 0.77685546875, 0.8349609375, 0.89306640625, 0.951171875, 1.00927734375, 1.0673828125, 1.12548828125, 1.18359375, 1.24169921875, 1.2998046875, 1.35791015625, 1.416015625, 1.47412109375, 1.5322265625, 1.59033203125, 1.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 12.0, 15.0, 25.0, 24.0, 22.0, 30.0, 36.0, 47.0, 68.0, 122.0, 487.0, 989194.0, 57705.0, 306.0, 98.0, 60.0, 46.0, 50.0, 32.0, 39.0, 29.0, 22.0, 20.0, 14.0, 15.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.5701904296875, -5.355224609375, -5.1402587890625, -4.92529296875, -4.7103271484375, -4.495361328125, -4.2803955078125, -4.0654296875, -3.8504638671875, -3.635498046875, -3.4205322265625, -3.20556640625, -2.9906005859375, -2.775634765625, -2.5606689453125, -2.345703125, -2.1307373046875, -1.915771484375, -1.7008056640625, -1.48583984375, -1.2708740234375, -1.055908203125, -0.8409423828125, -0.6259765625, -0.4110107421875, -0.196044921875, 0.0189208984375, 0.23388671875, 0.4488525390625, 0.663818359375, 0.8787841796875, 1.09375, 1.3087158203125, 1.523681640625, 1.7386474609375, 1.95361328125, 2.1685791015625, 2.383544921875, 2.5985107421875, 2.8134765625, 3.0284423828125, 3.243408203125, 3.4583740234375, 3.67333984375, 3.8883056640625, 4.103271484375, 4.3182373046875, 4.533203125, 4.7481689453125, 4.963134765625, 5.1781005859375, 5.39306640625, 5.6080322265625, 5.822998046875, 6.0379638671875, 6.2529296875, 6.4678955078125, 6.682861328125, 6.8978271484375, 7.11279296875, 7.3277587890625, 7.542724609375, 7.7576904296875, 7.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 9.0, 11.0, 15.0, 28.0, 24.0, 23.0, 30.0, 38.0, 37.0, 63.0, 68.0, 62.0, 84.0, 58.0, 54.0, 56.0, 47.0, 43.0, 51.0, 39.0, 30.0, 30.0, 23.0, 24.0, 8.0, 17.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.218841552734375, -2.13299560546875, -2.047149658203125, -1.9613037109375, -1.875457763671875, -1.78961181640625, -1.703765869140625, -1.617919921875, -1.532073974609375, -1.44622802734375, -1.360382080078125, -1.2745361328125, -1.188690185546875, -1.10284423828125, -1.016998291015625, -0.93115234375, -0.845306396484375, -0.75946044921875, -0.673614501953125, -0.5877685546875, -0.501922607421875, -0.41607666015625, -0.330230712890625, -0.244384765625, -0.158538818359375, -0.07269287109375, 0.013153076171875, 0.0989990234375, 0.184844970703125, 0.27069091796875, 0.356536865234375, 0.4423828125, 0.528228759765625, 0.61407470703125, 0.699920654296875, 0.7857666015625, 0.871612548828125, 0.95745849609375, 1.043304443359375, 1.129150390625, 1.214996337890625, 1.30084228515625, 1.386688232421875, 1.4725341796875, 1.558380126953125, 1.64422607421875, 1.730072021484375, 1.81591796875, 1.901763916015625, 1.98760986328125, 2.073455810546875, 2.1593017578125, 2.245147705078125, 2.33099365234375, 2.416839599609375, 2.502685546875, 2.588531494140625, 2.67437744140625, 2.760223388671875, 2.8460693359375, 2.931915283203125, 3.01776123046875, 3.103607177734375, 3.189453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 10.0, 21.0, 38.0, 145.0, 925.0, 151996.0, 893694.0, 1468.0, 156.0, 47.0, 16.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6500625610351562, -0.6140899658203125, -0.5781173706054688, -0.542144775390625, -0.5061721801757812, -0.4701995849609375, -0.43422698974609375, -0.39825439453125, -0.36228179931640625, -0.3263092041015625, -0.29033660888671875, -0.254364013671875, -0.21839141845703125, -0.1824188232421875, -0.14644622802734375, -0.1104736328125, -0.07450103759765625, -0.0385284423828125, -0.00255584716796875, 0.033416748046875, 0.06938934326171875, 0.1053619384765625, 0.14133453369140625, 0.17730712890625, 0.21327972412109375, 0.2492523193359375, 0.28522491455078125, 0.321197509765625, 0.35717010498046875, 0.3931427001953125, 0.42911529541015625, 0.465087890625, 0.5010604858398438, 0.5370330810546875, 0.5730056762695312, 0.608978271484375, 0.6449508666992188, 0.6809234619140625, 0.7168960571289062, 0.75286865234375, 0.7888412475585938, 0.8248138427734375, 0.8607864379882812, 0.896759033203125, 0.9327316284179688, 0.9687042236328125, 1.0046768188476562, 1.0406494140625, 1.0766220092773438, 1.1125946044921875, 1.1485671997070312, 1.184539794921875, 1.2205123901367188, 1.2564849853515625, 1.2924575805664062, 1.32843017578125, 1.3644027709960938, 1.4003753662109375, 1.4363479614257812, 1.472320556640625, 1.5082931518554688, 1.5442657470703125, 1.5802383422851562, 1.6162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 2.0, 12.0, 14.0, 7.0, 10.0, 19.0, 18.0, 36.0, 43.0, 82.0, 124.0, 213.0, 145.0, 102.0, 49.0, 22.0, 30.0, 17.0, 8.0, 16.0, 2.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.637932240962982e-05, -3.526732325553894e-05, -3.415532410144806e-05, -3.304332494735718e-05, -3.1931325793266296e-05, -3.0819326639175415e-05, -2.9707327485084534e-05, -2.8595328330993652e-05, -2.748332917690277e-05, -2.637133002281189e-05, -2.5259330868721008e-05, -2.4147331714630127e-05, -2.3035332560539246e-05, -2.1923333406448364e-05, -2.0811334252357483e-05, -1.96993350982666e-05, -1.858733594417572e-05, -1.747533679008484e-05, -1.6363337635993958e-05, -1.5251338481903076e-05, -1.4139339327812195e-05, -1.3027340173721313e-05, -1.1915341019630432e-05, -1.080334186553955e-05, -9.69134271144867e-06, -8.579343557357788e-06, -7.467344403266907e-06, -6.355345249176025e-06, -5.243346095085144e-06, -4.131346940994263e-06, -3.0193477869033813e-06, -1.9073486328125e-06, -7.953494787216187e-07, 3.166496753692627e-07, 1.428648829460144e-06, 2.5406479835510254e-06, 3.6526471376419067e-06, 4.764646291732788e-06, 5.8766454458236694e-06, 6.988644599914551e-06, 8.100643754005432e-06, 9.212642908096313e-06, 1.0324642062187195e-05, 1.1436641216278076e-05, 1.2548640370368958e-05, 1.3660639524459839e-05, 1.477263867855072e-05, 1.58846378326416e-05, 1.6996636986732483e-05, 1.8108636140823364e-05, 1.9220635294914246e-05, 2.0332634449005127e-05, 2.1444633603096008e-05, 2.255663275718689e-05, 2.366863191127777e-05, 2.4780631065368652e-05, 2.5892630219459534e-05, 2.7004629373550415e-05, 2.8116628527641296e-05, 2.9228627681732178e-05, 3.034062683582306e-05, 3.145262598991394e-05, 3.256462514400482e-05, 3.36766242980957e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 17.0, 18.0, 52.0, 203.0, 1307.0, 34506.0, 1005344.0, 6271.0, 600.0, 121.0, 41.0, 19.0, 14.0, 6.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0888671875, -1.0625, -1.0361328125, -1.009765625, -0.9833984375, -0.95703125, -0.9306640625, -0.904296875, -0.8779296875, -0.8515625, -0.8251953125, -0.798828125, -0.7724609375, -0.74609375, -0.7197265625, -0.693359375, -0.6669921875, -0.640625, -0.6142578125, -0.587890625, -0.5615234375, -0.53515625, -0.5087890625, -0.482421875, -0.4560546875, -0.4296875, -0.4033203125, -0.376953125, -0.3505859375, -0.32421875, -0.2978515625, -0.271484375, -0.2451171875, -0.21875, -0.1923828125, -0.166015625, -0.1396484375, -0.11328125, -0.0869140625, -0.060546875, -0.0341796875, -0.0078125, 0.0185546875, 0.044921875, 0.0712890625, 0.09765625, 0.1240234375, 0.150390625, 0.1767578125, 0.203125, 0.2294921875, 0.255859375, 0.2822265625, 0.30859375, 0.3349609375, 0.361328125, 0.3876953125, 0.4140625, 0.4404296875, 0.466796875, 0.4931640625, 0.51953125, 0.5458984375, 0.572265625, 0.5986328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 18.0, 32.0, 46.0, 69.0, 128.0, 232.0, 189.0, 111.0, 57.0, 36.0, 25.0, 11.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.0897207260131836, -0.08624076843261719, -0.08276081085205078, -0.07928085327148438, -0.07580089569091797, -0.07232093811035156, -0.06884098052978516, -0.06536102294921875, -0.061881065368652344, -0.05840110778808594, -0.05492115020751953, -0.051441192626953125, -0.04796123504638672, -0.04448127746582031, -0.041001319885253906, -0.0375213623046875, -0.034041404724121094, -0.030561447143554688, -0.02708148956298828, -0.023601531982421875, -0.02012157440185547, -0.016641616821289062, -0.013161659240722656, -0.00968170166015625, -0.006201744079589844, -0.0027217864990234375, 0.0007581710815429688, 0.004238128662109375, 0.007718086242675781, 0.011198043823242188, 0.014678001403808594, 0.018157958984375, 0.021637916564941406, 0.025117874145507812, 0.02859783172607422, 0.032077789306640625, 0.03555774688720703, 0.03903770446777344, 0.042517662048339844, 0.04599761962890625, 0.049477577209472656, 0.05295753479003906, 0.05643749237060547, 0.059917449951171875, 0.06339740753173828, 0.06687736511230469, 0.0703573226928711, 0.0738372802734375, 0.0773172378540039, 0.08079719543457031, 0.08427715301513672, 0.08775711059570312, 0.09123706817626953, 0.09471702575683594, 0.09819698333740234, 0.10167694091796875, 0.10515689849853516, 0.10863685607910156, 0.11211681365966797, 0.11559677124023438, 0.11907672882080078, 0.12255668640136719, 0.1260366439819336, 0.1295166015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 11.0, 23.0, 27.0, 48.0, 63.0, 116.0, 168.0, 193.0, 128.0, 74.0, 48.0, 28.0, 26.0, 11.0, 12.0, 4.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.985243320465088, -2.889725923538208, -2.7942087650299072, -2.6986913681030273, -2.6031739711761475, -2.5076565742492676, -2.412139415740967, -2.316622018814087, -2.221104621887207, -2.125587224960327, -2.0300700664520264, -1.9345526695251465, -1.8390352725982666, -1.7435179948806763, -1.648000717163086, -1.552483320236206, -1.4569661617279053, -1.361448884010315, -1.265931487083435, -1.1704142093658447, -1.0748968124389648, -0.9793795347213745, -0.8838622570037842, -0.7883449196815491, -0.692827582359314, -0.5973102450370789, -0.5017929077148438, -0.4062756299972534, -0.3107582926750183, -0.2152409553527832, -0.11972367763519287, -0.024206340312957764, 0.07131099700927734, 0.16682831943035126, 0.26234564185142517, 0.3578629493713379, 0.453380286693573, 0.5488976240158081, 0.6444149017333984, 0.7399322390556335, 0.8354495763778687, 0.9309669137001038, 1.0264842510223389, 1.1220015287399292, 1.2175188064575195, 1.3130362033843994, 1.4085534811019897, 1.50407075881958, 1.59958815574646, 1.6951054334640503, 1.7906228303909302, 1.8861401081085205, 1.9816575050354004, 2.077174663543701, 2.172692060470581, 2.268209457397461, 2.3637266159057617, 2.4592440128326416, 2.5547611713409424, 2.6502785682678223, 2.745795965194702, 2.841313362121582, 2.936830520629883, 3.0323479175567627, 3.1278653144836426]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 14.0, 21.0, 24.0, 36.0, 22.0, 26.0, 34.0, 21.0, 39.0, 50.0, 45.0, 47.0, 39.0, 36.0, 46.0, 49.0, 42.0, 40.0, 37.0, 33.0, 33.0, 31.0, 28.0, 21.0, 20.0, 19.0, 12.0, 11.0, 14.0, 14.0, 10.0, 9.0, 5.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6409285068511963, -2.5557265281677246, -2.470524311065674, -2.385322332382202, -2.3001201152801514, -2.2149181365966797, -2.129715919494629, -2.0445139408111572, -1.959311842918396, -1.8741097450256348, -1.7889076471328735, -1.7037055492401123, -1.6185035705566406, -1.5333013534545898, -1.4480993747711182, -1.362897276878357, -1.2776951789855957, -1.1924930810928345, -1.1072909832000732, -1.0220890045166016, -0.9368868470191956, -0.8516847491264343, -0.7664827108383179, -0.6812806129455566, -0.5960785150527954, -0.5108764171600342, -0.42567434906959534, -0.3404722809791565, -0.25527018308639526, -0.17006808519363403, -0.08486604690551758, 0.00033605098724365234, 0.08553814888000488, 0.17074023187160492, 0.25594231486320496, 0.3411443829536438, 0.42634648084640503, 0.5115485787391663, 0.5967506170272827, 0.681952714920044, 0.7671548128128052, 0.8523569107055664, 0.9375590085983276, 1.0227611064910889, 1.1079630851745605, 1.1931653022766113, 1.278367280960083, 1.3635693788528442, 1.4487714767456055, 1.5339735746383667, 1.619175672531128, 1.7043776512145996, 1.7895798683166504, 1.874781847000122, 1.9599839448928833, 2.0451860427856445, 2.1303882598876953, 2.215590238571167, 2.3007924556732178, 2.3859944343566895, 2.4711966514587402, 2.556398630142212, 2.6416006088256836, 2.7268028259277344, 2.812004804611206]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 8.0, 10.0, 10.0, 18.0, 13.0, 20.0, 15.0, 25.0, 34.0, 53.0, 58.0, 93.0, 131.0, 242.0, 390.0, 740.0, 1479.0, 3821.0, 12624.0, 107838.0, 3489281.0, 544494.0, 22975.0, 5720.0, 2053.0, 895.0, 439.0, 246.0, 159.0, 112.0, 77.0, 55.0, 28.0, 28.0, 23.0, 17.0, 21.0, 8.0, 9.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.671722412109375, -2.58172607421875, -2.491729736328125, -2.4017333984375, -2.311737060546875, -2.22174072265625, -2.131744384765625, -2.041748046875, -1.951751708984375, -1.86175537109375, -1.771759033203125, -1.6817626953125, -1.591766357421875, -1.50177001953125, -1.411773681640625, -1.32177734375, -1.231781005859375, -1.14178466796875, -1.051788330078125, -0.9617919921875, -0.871795654296875, -0.78179931640625, -0.691802978515625, -0.601806640625, -0.511810302734375, -0.42181396484375, -0.331817626953125, -0.2418212890625, -0.151824951171875, -0.06182861328125, 0.028167724609375, 0.1181640625, 0.208160400390625, 0.29815673828125, 0.388153076171875, 0.4781494140625, 0.568145751953125, 0.65814208984375, 0.748138427734375, 0.838134765625, 0.928131103515625, 1.01812744140625, 1.108123779296875, 1.1981201171875, 1.288116455078125, 1.37811279296875, 1.468109130859375, 1.55810546875, 1.648101806640625, 1.73809814453125, 1.828094482421875, 1.9180908203125, 2.008087158203125, 2.09808349609375, 2.188079833984375, 2.278076171875, 2.368072509765625, 2.45806884765625, 2.548065185546875, 2.6380615234375, 2.728057861328125, 2.81805419921875, 2.908050537109375, 2.998046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 12.0, 24.0, 17.0, 16.0, 34.0, 24.0, 29.0, 41.0, 34.0, 31.0, 39.0, 41.0, 50.0, 52.0, 58.0, 49.0, 58.0, 49.0, 34.0, 38.0, 33.0, 21.0, 29.0, 27.0, 20.0, 19.0, 25.0, 10.0, 10.0, 8.0, 11.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.800506591796875, -0.77630615234375, -0.752105712890625, -0.7279052734375, -0.703704833984375, -0.67950439453125, -0.655303955078125, -0.631103515625, -0.606903076171875, -0.58270263671875, -0.558502197265625, -0.5343017578125, -0.510101318359375, -0.48590087890625, -0.461700439453125, -0.4375, -0.413299560546875, -0.38909912109375, -0.364898681640625, -0.3406982421875, -0.316497802734375, -0.29229736328125, -0.268096923828125, -0.243896484375, -0.219696044921875, -0.19549560546875, -0.171295166015625, -0.1470947265625, -0.122894287109375, -0.09869384765625, -0.074493408203125, -0.05029296875, -0.026092529296875, -0.00189208984375, 0.022308349609375, 0.0465087890625, 0.070709228515625, 0.09490966796875, 0.119110107421875, 0.143310546875, 0.167510986328125, 0.19171142578125, 0.215911865234375, 0.2401123046875, 0.264312744140625, 0.28851318359375, 0.312713623046875, 0.3369140625, 0.361114501953125, 0.38531494140625, 0.409515380859375, 0.4337158203125, 0.457916259765625, 0.48211669921875, 0.506317138671875, 0.530517578125, 0.554718017578125, 0.57891845703125, 0.603118896484375, 0.6273193359375, 0.651519775390625, 0.67572021484375, 0.699920654296875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 16.0, 14.0, 30.0, 63.0, 95.0, 248.0, 669.0, 14865.0, 4169179.0, 8108.0, 550.0, 201.0, 93.0, 50.0, 34.0, 16.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.605224609375, -7.28076171875, -6.956298828125, -6.6318359375, -6.307373046875, -5.98291015625, -5.658447265625, -5.333984375, -5.009521484375, -4.68505859375, -4.360595703125, -4.0361328125, -3.711669921875, -3.38720703125, -3.062744140625, -2.73828125, -2.413818359375, -2.08935546875, -1.764892578125, -1.4404296875, -1.115966796875, -0.79150390625, -0.467041015625, -0.142578125, 0.181884765625, 0.50634765625, 0.830810546875, 1.1552734375, 1.479736328125, 1.80419921875, 2.128662109375, 2.453125, 2.777587890625, 3.10205078125, 3.426513671875, 3.7509765625, 4.075439453125, 4.39990234375, 4.724365234375, 5.048828125, 5.373291015625, 5.69775390625, 6.022216796875, 6.3466796875, 6.671142578125, 6.99560546875, 7.320068359375, 7.64453125, 7.968994140625, 8.29345703125, 8.617919921875, 8.9423828125, 9.266845703125, 9.59130859375, 9.915771484375, 10.240234375, 10.564697265625, 10.88916015625, 11.213623046875, 11.5380859375, 11.862548828125, 12.18701171875, 12.511474609375, 12.8359375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 9.0, 14.0, 14.0, 15.0, 20.0, 31.0, 44.0, 57.0, 87.0, 147.0, 216.0, 438.0, 737.0, 772.0, 573.0, 288.0, 166.0, 98.0, 85.0, 57.0, 36.0, 30.0, 23.0, 15.0, 20.0, 12.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49462890625, -0.48095703125, -0.46728515625, -0.45361328125, -0.43994140625, -0.42626953125, -0.41259765625, -0.39892578125, -0.38525390625, -0.37158203125, -0.35791015625, -0.34423828125, -0.33056640625, -0.31689453125, -0.30322265625, -0.28955078125, -0.27587890625, -0.26220703125, -0.24853515625, -0.23486328125, -0.22119140625, -0.20751953125, -0.19384765625, -0.18017578125, -0.16650390625, -0.15283203125, -0.13916015625, -0.12548828125, -0.11181640625, -0.09814453125, -0.08447265625, -0.07080078125, -0.05712890625, -0.04345703125, -0.02978515625, -0.01611328125, -0.00244140625, 0.01123046875, 0.02490234375, 0.03857421875, 0.05224609375, 0.06591796875, 0.07958984375, 0.09326171875, 0.10693359375, 0.12060546875, 0.13427734375, 0.14794921875, 0.16162109375, 0.17529296875, 0.18896484375, 0.20263671875, 0.21630859375, 0.22998046875, 0.24365234375, 0.25732421875, 0.27099609375, 0.28466796875, 0.29833984375, 0.31201171875, 0.32568359375, 0.33935546875, 0.35302734375, 0.36669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 2.0, 12.0, 13.0, 20.0, 30.0, 57.0, 69.0, 76.0, 91.0, 112.0, 134.0, 100.0, 75.0, 61.0, 38.0, 24.0, 14.0, 12.0, 8.0, 11.0, 8.0, 4.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296356439590454, -1.8824702501296997, -1.835304856300354, -1.7881394624710083, -1.7409741878509521, -1.6938087940216064, -1.6466434001922607, -1.599478006362915, -1.5523126125335693, -1.5051472187042236, -1.457981824874878, -1.4108164310455322, -1.3636510372161865, -1.3164857625961304, -1.2693203687667847, -1.222154974937439, -1.1749895811080933, -1.1278241872787476, -1.0806587934494019, -1.0334933996200562, -0.9863280653953552, -0.9391626715660095, -0.8919973373413086, -0.8448319435119629, -0.7976665496826172, -0.7505011558532715, -0.7033357620239258, -0.6561704277992249, -0.6090050339698792, -0.5618396401405334, -0.5146743059158325, -0.4675089120864868, -0.42034363746643066, -0.37317824363708496, -0.32601287961006165, -0.27884751558303833, -0.23168212175369263, -0.18451674282550812, -0.1373513638973236, -0.09018599987030029, -0.04302060604095459, 0.004144772887229919, 0.05131015181541443, 0.09847553074359894, 0.14564090967178345, 0.19280628859996796, 0.23997166752815247, 0.2871370315551758, 0.3343024253845215, 0.3814678192138672, 0.4286331832408905, 0.4757985472679138, 0.5229639410972595, 0.5701293349266052, 0.6172946691513062, 0.6644600629806519, 0.7116254568099976, 0.7587908506393433, 0.805956244468689, 0.8531215786933899, 0.9002869725227356, 0.9474523663520813, 0.9946177005767822, 1.041783094406128, 1.0889484882354736]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 5.0, 6.0, 8.0, 6.0, 13.0, 12.0, 17.0, 16.0, 26.0, 24.0, 30.0, 20.0, 30.0, 22.0, 28.0, 26.0, 40.0, 44.0, 38.0, 38.0, 46.0, 31.0, 36.0, 40.0, 38.0, 28.0, 24.0, 25.0, 35.0, 24.0, 28.0, 25.0, 19.0, 15.0, 12.0, 17.0, 16.0, 13.0, 11.0, 7.0, 8.0, 14.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0], "bins": [-0.7717801332473755, -0.7501706480979919, -0.7285611629486084, -0.7069516181945801, -0.6853421330451965, -0.663732647895813, -0.6421231031417847, -0.6205136179924011, -0.5989041328430176, -0.577294647693634, -0.5556851625442505, -0.5340756177902222, -0.5124661326408386, -0.4908566474914551, -0.46924713253974915, -0.4476376175880432, -0.42602813243865967, -0.4044186472892761, -0.3828091323375702, -0.36119961738586426, -0.3395901322364807, -0.31798064708709717, -0.29637113213539124, -0.2747616171836853, -0.25315213203430176, -0.23154263198375702, -0.20993313193321228, -0.18832363188266754, -0.1667141318321228, -0.14510463178157806, -0.12349513173103333, -0.10188563168048859, -0.08027607202529907, -0.058666571974754333, -0.037057071924209595, -0.015447571873664856, 0.006161928176879883, 0.02777142822742462, 0.04938092827796936, 0.0709904283285141, 0.09259992837905884, 0.11420942842960358, 0.13581892848014832, 0.15742842853069305, 0.1790379285812378, 0.20064742863178253, 0.22225692868232727, 0.243866428732872, 0.26547592878341675, 0.2870854139328003, 0.3086949288845062, 0.33030444383621216, 0.3519139289855957, 0.37352341413497925, 0.3951329290866852, 0.4167424440383911, 0.43835192918777466, 0.4599614143371582, 0.48157092928886414, 0.5031804442405701, 0.5247899293899536, 0.5463994145393372, 0.5680088996887207, 0.589618444442749, 0.6112279295921326]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 11.0, 9.0, 25.0, 36.0, 33.0, 51.0, 73.0, 120.0, 190.0, 230.0, 336.0, 505.0, 803.0, 1343.0, 1999.0, 3467.0, 6014.0, 11069.0, 21877.0, 49651.0, 155043.0, 503256.0, 184399.0, 56062.0, 23777.0, 11867.0, 6509.0, 3623.0, 2182.0, 1281.0, 881.0, 584.0, 408.0, 258.0, 173.0, 128.0, 80.0, 55.0, 38.0, 31.0, 22.0, 17.0, 11.0, 3.0, 2.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.36767578125, -0.356719970703125, -0.34576416015625, -0.334808349609375, -0.3238525390625, -0.312896728515625, -0.30194091796875, -0.290985107421875, -0.280029296875, -0.269073486328125, -0.25811767578125, -0.247161865234375, -0.2362060546875, -0.225250244140625, -0.21429443359375, -0.203338623046875, -0.1923828125, -0.181427001953125, -0.17047119140625, -0.159515380859375, -0.1485595703125, -0.137603759765625, -0.12664794921875, -0.115692138671875, -0.104736328125, -0.093780517578125, -0.08282470703125, -0.071868896484375, -0.0609130859375, -0.049957275390625, -0.03900146484375, -0.028045654296875, -0.01708984375, -0.006134033203125, 0.00482177734375, 0.015777587890625, 0.0267333984375, 0.037689208984375, 0.04864501953125, 0.059600830078125, 0.070556640625, 0.081512451171875, 0.09246826171875, 0.103424072265625, 0.1143798828125, 0.125335693359375, 0.13629150390625, 0.147247314453125, 0.158203125, 0.169158935546875, 0.18011474609375, 0.191070556640625, 0.2020263671875, 0.212982177734375, 0.22393798828125, 0.234893798828125, 0.245849609375, 0.256805419921875, 0.26776123046875, 0.278717041015625, 0.2896728515625, 0.300628662109375, 0.31158447265625, 0.322540283203125, 0.33349609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 8.0, 14.0, 10.0, 13.0, 9.0, 17.0, 22.0, 25.0, 25.0, 22.0, 28.0, 27.0, 36.0, 35.0, 46.0, 53.0, 46.0, 41.0, 35.0, 46.0, 49.0, 36.0, 39.0, 21.0, 38.0, 29.0, 40.0, 25.0, 26.0, 18.0, 12.0, 14.0, 11.0, 13.0, 10.0, 6.0, 7.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.51904296875, -0.5046348571777344, -0.49022674560546875, -0.4758186340332031, -0.4614105224609375, -0.4470024108886719, -0.43259429931640625, -0.4181861877441406, -0.403778076171875, -0.3893699645996094, -0.37496185302734375, -0.3605537414550781, -0.3461456298828125, -0.3317375183105469, -0.31732940673828125, -0.3029212951660156, -0.28851318359375, -0.2741050720214844, -0.25969696044921875, -0.24528884887695312, -0.2308807373046875, -0.21647262573242188, -0.20206451416015625, -0.18765640258789062, -0.173248291015625, -0.15884017944335938, -0.14443206787109375, -0.13002395629882812, -0.1156158447265625, -0.10120773315429688, -0.08679962158203125, -0.07239151000976562, -0.0579833984375, -0.043575286865234375, -0.02916717529296875, -0.014759063720703125, -0.0003509521484375, 0.014057159423828125, 0.02846527099609375, 0.042873382568359375, 0.057281494140625, 0.07168960571289062, 0.08609771728515625, 0.10050582885742188, 0.1149139404296875, 0.12932205200195312, 0.14373016357421875, 0.15813827514648438, 0.17254638671875, 0.18695449829101562, 0.20136260986328125, 0.21577072143554688, 0.2301788330078125, 0.24458694458007812, 0.25899505615234375, 0.2734031677246094, 0.287811279296875, 0.3022193908691406, 0.31662750244140625, 0.3310356140136719, 0.3454437255859375, 0.3598518371582031, 0.37425994873046875, 0.3886680603027344, 0.403076171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 12.0, 11.0, 16.0, 32.0, 56.0, 62.0, 89.0, 162.0, 219.0, 400.0, 698.0, 1205.0, 2160.0, 4256.0, 9319.0, 22358.0, 66622.0, 278490.0, 482237.0, 118759.0, 35235.0, 13476.0, 6018.0, 3011.0, 1536.0, 816.0, 491.0, 307.0, 165.0, 96.0, 80.0, 43.0, 27.0, 24.0, 12.0, 12.0, 12.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2923927307128906, -0.28302764892578125, -0.2736625671386719, -0.2642974853515625, -0.2549324035644531, -0.24556732177734375, -0.23620223999023438, -0.226837158203125, -0.21747207641601562, -0.20810699462890625, -0.19874191284179688, -0.1893768310546875, -0.18001174926757812, -0.17064666748046875, -0.16128158569335938, -0.15191650390625, -0.14255142211914062, -0.13318634033203125, -0.12382125854492188, -0.1144561767578125, -0.10509109497070312, -0.09572601318359375, -0.08636093139648438, -0.076995849609375, -0.06763076782226562, -0.05826568603515625, -0.048900604248046875, -0.0395355224609375, -0.030170440673828125, -0.02080535888671875, -0.011440277099609375, -0.0020751953125, 0.007289886474609375, 0.01665496826171875, 0.026020050048828125, 0.0353851318359375, 0.044750213623046875, 0.05411529541015625, 0.06348037719726562, 0.072845458984375, 0.08221054077148438, 0.09157562255859375, 0.10094070434570312, 0.1103057861328125, 0.11967086791992188, 0.12903594970703125, 0.13840103149414062, 0.14776611328125, 0.15713119506835938, 0.16649627685546875, 0.17586135864257812, 0.1852264404296875, 0.19459152221679688, 0.20395660400390625, 0.21332168579101562, 0.222686767578125, 0.23205184936523438, 0.24141693115234375, 0.2507820129394531, 0.2601470947265625, 0.2695121765136719, 0.27887725830078125, 0.2882423400878906, 0.297607421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 10.0, 6.0, 7.0, 10.0, 16.0, 9.0, 29.0, 21.0, 25.0, 23.0, 28.0, 24.0, 43.0, 29.0, 38.0, 47.0, 35.0, 50.0, 32.0, 41.0, 37.0, 50.0, 40.0, 44.0, 38.0, 31.0, 33.0, 28.0, 21.0, 22.0, 13.0, 17.0, 17.0, 16.0, 11.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.89453125, -0.868927001953125, -0.84332275390625, -0.817718505859375, -0.7921142578125, -0.766510009765625, -0.74090576171875, -0.715301513671875, -0.689697265625, -0.664093017578125, -0.63848876953125, -0.612884521484375, -0.5872802734375, -0.561676025390625, -0.53607177734375, -0.510467529296875, -0.48486328125, -0.459259033203125, -0.43365478515625, -0.408050537109375, -0.3824462890625, -0.356842041015625, -0.33123779296875, -0.305633544921875, -0.280029296875, -0.254425048828125, -0.22882080078125, -0.203216552734375, -0.1776123046875, -0.152008056640625, -0.12640380859375, -0.100799560546875, -0.0751953125, -0.049591064453125, -0.02398681640625, 0.001617431640625, 0.0272216796875, 0.052825927734375, 0.07843017578125, 0.104034423828125, 0.129638671875, 0.155242919921875, 0.18084716796875, 0.206451416015625, 0.2320556640625, 0.257659912109375, 0.28326416015625, 0.308868408203125, 0.33447265625, 0.360076904296875, 0.38568115234375, 0.411285400390625, 0.4368896484375, 0.462493896484375, 0.48809814453125, 0.513702392578125, 0.539306640625, 0.564910888671875, 0.59051513671875, 0.616119384765625, 0.6417236328125, 0.667327880859375, 0.69293212890625, 0.718536376953125, 0.744140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 10.0, 17.0, 22.0, 41.0, 70.0, 91.0, 129.0, 175.0, 254.0, 393.0, 643.0, 1107.0, 1989.0, 3899.0, 8491.0, 20573.0, 60794.0, 221003.0, 469716.0, 175889.0, 50035.0, 17564.0, 7359.0, 3583.0, 1833.0, 1042.0, 646.0, 389.0, 233.0, 158.0, 123.0, 82.0, 53.0, 32.0, 31.0, 16.0, 20.0, 12.0, 3.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.05379343032836914, -0.05183124542236328, -0.04986906051635742, -0.04790687561035156, -0.0459446907043457, -0.043982505798339844, -0.042020320892333984, -0.040058135986328125, -0.038095951080322266, -0.036133766174316406, -0.03417158126831055, -0.03220939636230469, -0.030247211456298828, -0.02828502655029297, -0.02632284164428711, -0.02436065673828125, -0.02239847183227539, -0.02043628692626953, -0.018474102020263672, -0.016511917114257812, -0.014549732208251953, -0.012587547302246094, -0.010625362396240234, -0.008663177490234375, -0.006700992584228516, -0.004738807678222656, -0.002776622772216797, -0.0008144378662109375, 0.0011477470397949219, 0.0031099319458007812, 0.005072116851806641, 0.0070343017578125, 0.00899648666381836, 0.010958671569824219, 0.012920856475830078, 0.014883041381835938, 0.016845226287841797, 0.018807411193847656, 0.020769596099853516, 0.022731781005859375, 0.024693965911865234, 0.026656150817871094, 0.028618335723876953, 0.030580520629882812, 0.03254270553588867, 0.03450489044189453, 0.03646707534790039, 0.03842926025390625, 0.04039144515991211, 0.04235363006591797, 0.04431581497192383, 0.04627799987792969, 0.04824018478393555, 0.050202369689941406, 0.052164554595947266, 0.054126739501953125, 0.056088924407958984, 0.058051109313964844, 0.0600132942199707, 0.06197547912597656, 0.06393766403198242, 0.06589984893798828, 0.06786203384399414, 0.06982421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 12.0, 14.0, 26.0, 42.0, 65.0, 120.0, 170.0, 193.0, 116.0, 76.0, 54.0, 32.0, 20.0, 10.0, 10.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.347056478261948e-05, -6.083957850933075e-05, -5.820859223604202e-05, -5.5577605962753296e-05, -5.294661968946457e-05, -5.031563341617584e-05, -4.7684647142887115e-05, -4.505366086959839e-05, -4.242267459630966e-05, -3.9791688323020935e-05, -3.716070204973221e-05, -3.452971577644348e-05, -3.1898729503154755e-05, -2.9267743229866028e-05, -2.66367569565773e-05, -2.4005770683288574e-05, -2.1374784409999847e-05, -1.874379813671112e-05, -1.6112811863422394e-05, -1.3481825590133667e-05, -1.085083931684494e-05, -8.219853043556213e-06, -5.5888667702674866e-06, -2.9578804969787598e-06, -3.2689422369003296e-07, 2.304092049598694e-06, 4.935078322887421e-06, 7.5660645961761475e-06, 1.0197050869464874e-05, 1.2828037142753601e-05, 1.5459023416042328e-05, 1.8090009689331055e-05, 2.072099596261978e-05, 2.3351982235908508e-05, 2.5982968509197235e-05, 2.8613954782485962e-05, 3.124494105577469e-05, 3.3875927329063416e-05, 3.650691360235214e-05, 3.913789987564087e-05, 4.1768886148929596e-05, 4.439987242221832e-05, 4.703085869550705e-05, 4.9661844968795776e-05, 5.22928312420845e-05, 5.492381751537323e-05, 5.755480378866196e-05, 6.0185790061950684e-05, 6.281677633523941e-05, 6.544776260852814e-05, 6.807874888181686e-05, 7.070973515510559e-05, 7.334072142839432e-05, 7.597170770168304e-05, 7.860269397497177e-05, 8.12336802482605e-05, 8.386466652154922e-05, 8.649565279483795e-05, 8.912663906812668e-05, 9.17576253414154e-05, 9.438861161470413e-05, 9.701959788799286e-05, 9.965058416128159e-05, 0.00010228157043457031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 16.0, 18.0, 18.0, 40.0, 91.0, 179.0, 369.0, 1203.0, 4064.0, 19456.0, 188405.0, 739131.0, 80440.0, 10998.0, 2724.0, 803.0, 291.0, 129.0, 60.0, 28.0, 20.0, 16.0, 4.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.12993621826171875, -0.1253509521484375, -0.12076568603515625, -0.116180419921875, -0.11159515380859375, -0.1070098876953125, -0.10242462158203125, -0.09783935546875, -0.09325408935546875, -0.0886688232421875, -0.08408355712890625, -0.079498291015625, -0.07491302490234375, -0.0703277587890625, -0.06574249267578125, -0.0611572265625, -0.05657196044921875, -0.0519866943359375, -0.04740142822265625, -0.042816162109375, -0.03823089599609375, -0.0336456298828125, -0.02906036376953125, -0.02447509765625, -0.01988983154296875, -0.0153045654296875, -0.01071929931640625, -0.006134033203125, -0.00154876708984375, 0.0030364990234375, 0.00762176513671875, 0.01220703125, 0.01679229736328125, 0.0213775634765625, 0.02596282958984375, 0.030548095703125, 0.03513336181640625, 0.0397186279296875, 0.04430389404296875, 0.04888916015625, 0.05347442626953125, 0.0580596923828125, 0.06264495849609375, 0.067230224609375, 0.07181549072265625, 0.0764007568359375, 0.08098602294921875, 0.0855712890625, 0.09015655517578125, 0.0947418212890625, 0.09932708740234375, 0.103912353515625, 0.10849761962890625, 0.1130828857421875, 0.11766815185546875, 0.12225341796875, 0.12683868408203125, 0.1314239501953125, 0.13600921630859375, 0.140594482421875, 0.14517974853515625, 0.1497650146484375, 0.15435028076171875, 0.158935546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 8.0, 12.0, 9.0, 10.0, 17.0, 22.0, 33.0, 37.0, 56.0, 63.0, 70.0, 65.0, 76.0, 74.0, 80.0, 52.0, 60.0, 64.0, 49.0, 28.0, 25.0, 23.0, 8.0, 11.0, 12.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0187530517578125, -0.01811075210571289, -0.01746845245361328, -0.016826152801513672, -0.016183853149414062, -0.015541553497314453, -0.014899253845214844, -0.014256954193115234, -0.013614654541015625, -0.012972354888916016, -0.012330055236816406, -0.011687755584716797, -0.011045455932617188, -0.010403156280517578, -0.009760856628417969, -0.00911855697631836, -0.00847625732421875, -0.00783395767211914, -0.007191658020019531, -0.006549358367919922, -0.0059070587158203125, -0.005264759063720703, -0.004622459411621094, -0.003980159759521484, -0.003337860107421875, -0.0026955604553222656, -0.0020532608032226562, -0.0014109611511230469, -0.0007686614990234375, -0.00012636184692382812, 0.0005159378051757812, 0.0011582374572753906, 0.001800537109375, 0.0024428367614746094, 0.0030851364135742188, 0.003727436065673828, 0.0043697357177734375, 0.005012035369873047, 0.005654335021972656, 0.006296634674072266, 0.006938934326171875, 0.007581233978271484, 0.008223533630371094, 0.008865833282470703, 0.009508132934570312, 0.010150432586669922, 0.010792732238769531, 0.01143503189086914, 0.01207733154296875, 0.01271963119506836, 0.013361930847167969, 0.014004230499267578, 0.014646530151367188, 0.015288829803466797, 0.015931129455566406, 0.016573429107666016, 0.017215728759765625, 0.017858028411865234, 0.018500328063964844, 0.019142627716064453, 0.019784927368164062, 0.020427227020263672, 0.02106952667236328, 0.02171182632446289, 0.0223541259765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 6.0, 7.0, 13.0, 15.0, 42.0, 38.0, 86.0, 109.0, 127.0, 181.0, 139.0, 76.0, 56.0, 32.0, 21.0, 17.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0980820655822754, -1.062807559967041, -1.027532935142517, -0.9922583699226379, -0.9569838047027588, -0.9217092990875244, -0.8864347338676453, -0.8511601686477661, -0.815885603427887, -0.7806110382080078, -0.7453364729881287, -0.7100619077682495, -0.6747874021530151, -0.6395127773284912, -0.6042382717132568, -0.5689637064933777, -0.5336891412734985, -0.4984145760536194, -0.46314001083374023, -0.42786547541618347, -0.3925909101963043, -0.35731634497642517, -0.3220418095588684, -0.28676724433898926, -0.2514926791191101, -0.21621811389923096, -0.180943563580513, -0.14566901326179504, -0.1103944480419159, -0.07511988282203674, -0.03984533250331879, -0.00457078218460083, 0.03070366382598877, 0.06597822159528732, 0.10125277936458588, 0.13652732968330383, 0.17180189490318298, 0.20707646012306213, 0.2423510104417801, 0.27762556076049805, 0.3129001259803772, 0.34817469120025635, 0.3834492564201355, 0.41872379183769226, 0.4539983570575714, 0.48927292227745056, 0.5245474576950073, 0.5598220229148865, 0.5950965881347656, 0.6303711533546448, 0.6656457185745239, 0.7009202837944031, 0.7361948490142822, 0.7714693546295166, 0.8067439198493958, 0.8420184850692749, 0.877293050289154, 0.9125676155090332, 0.9478421807289124, 0.9831167459487915, 1.0183912515640259, 1.0536658763885498, 1.0889403820037842, 1.1242148876190186, 1.1594895124435425]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 6.0, 7.0, 11.0, 17.0, 21.0, 11.0, 19.0, 21.0, 28.0, 29.0, 24.0, 19.0, 37.0, 26.0, 31.0, 34.0, 40.0, 51.0, 37.0, 51.0, 26.0, 38.0, 34.0, 25.0, 31.0, 30.0, 27.0, 35.0, 40.0, 17.0, 17.0, 19.0, 12.0, 18.0, 12.0, 9.0, 9.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0], "bins": [-0.449985146522522, -0.43745124340057373, -0.4249173402786255, -0.41238343715667725, -0.399849534034729, -0.38731563091278076, -0.37478169798851013, -0.3622477948665619, -0.34971389174461365, -0.3371799886226654, -0.32464608550071716, -0.3121121823787689, -0.2995782494544983, -0.28704434633255005, -0.2745104432106018, -0.26197654008865356, -0.24944263696670532, -0.23690873384475708, -0.22437483072280884, -0.2118409126996994, -0.19930700957775116, -0.18677310645580292, -0.17423918843269348, -0.16170528531074524, -0.149171382188797, -0.13663747906684875, -0.12410356849431992, -0.11156965792179108, -0.09903575479984283, -0.08650185167789459, -0.07396794110536575, -0.061434030532836914, -0.04890015721321106, -0.03636625036597252, -0.02383234351873398, -0.011298436671495438, 0.001235470175743103, 0.013769373297691345, 0.026303283870220184, 0.03883719444274902, 0.051371097564697266, 0.06390500068664551, 0.07643891125917435, 0.08897282183170319, 0.10150672495365143, 0.11404062807559967, 0.1265745460987091, 0.13910844922065735, 0.1516423523426056, 0.16417625546455383, 0.17671015858650208, 0.1892440766096115, 0.20177797973155975, 0.214311882853508, 0.22684580087661743, 0.23937970399856567, 0.2519136071205139, 0.26444751024246216, 0.2769814133644104, 0.28951531648635864, 0.3020492196083069, 0.3145831227302551, 0.32711705565452576, 0.339650958776474, 0.35218486189842224]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 13.0, 7.0, 13.0, 18.0, 21.0, 41.0, 62.0, 84.0, 155.0, 225.0, 370.0, 610.0, 1039.0, 1703.0, 2921.0, 5265.0, 10224.0, 21580.0, 59373.0, 283376.0, 500742.0, 100783.0, 31189.0, 13224.0, 6711.0, 3583.0, 2081.0, 1248.0, 662.0, 430.0, 275.0, 208.0, 100.0, 73.0, 52.0, 30.0, 23.0, 15.0, 5.0, 3.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2526664733886719, -0.24263763427734375, -0.23260879516601562, -0.2225799560546875, -0.21255111694335938, -0.20252227783203125, -0.19249343872070312, -0.182464599609375, -0.17243576049804688, -0.16240692138671875, -0.15237808227539062, -0.1423492431640625, -0.13232040405273438, -0.12229156494140625, -0.11226272583007812, -0.10223388671875, -0.09220504760742188, -0.08217620849609375, -0.07214736938476562, -0.0621185302734375, -0.052089691162109375, -0.04206085205078125, -0.032032012939453125, -0.022003173828125, -0.011974334716796875, -0.00194549560546875, 0.008083343505859375, 0.0181121826171875, 0.028141021728515625, 0.03816986083984375, 0.048198699951171875, 0.0582275390625, 0.06825637817382812, 0.07828521728515625, 0.08831405639648438, 0.0983428955078125, 0.10837173461914062, 0.11840057373046875, 0.12842941284179688, 0.138458251953125, 0.14848709106445312, 0.15851593017578125, 0.16854476928710938, 0.1785736083984375, 0.18860244750976562, 0.19863128662109375, 0.20866012573242188, 0.21868896484375, 0.22871780395507812, 0.23874664306640625, 0.24877548217773438, 0.2588043212890625, 0.2688331604003906, 0.27886199951171875, 0.2888908386230469, 0.298919677734375, 0.3089485168457031, 0.31897735595703125, 0.3290061950683594, 0.3390350341796875, 0.3490638732910156, 0.35909271240234375, 0.3691215515136719, 0.379150390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 5.0, 17.0, 20.0, 12.0, 15.0, 24.0, 17.0, 43.0, 30.0, 19.0, 32.0, 41.0, 39.0, 40.0, 48.0, 46.0, 50.0, 43.0, 40.0, 37.0, 44.0, 32.0, 35.0, 30.0, 29.0, 29.0, 31.0, 21.0, 22.0, 11.0, 12.0, 14.0, 13.0, 8.0, 5.0, 7.0, 4.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0517578125, -1.0185546875, -0.9853515625, -0.9521484375, -0.9189453125, -0.8857421875, -0.8525390625, -0.8193359375, -0.7861328125, -0.7529296875, -0.7197265625, -0.6865234375, -0.6533203125, -0.6201171875, -0.5869140625, -0.5537109375, -0.5205078125, -0.4873046875, -0.4541015625, -0.4208984375, -0.3876953125, -0.3544921875, -0.3212890625, -0.2880859375, -0.2548828125, -0.2216796875, -0.1884765625, -0.1552734375, -0.1220703125, -0.0888671875, -0.0556640625, -0.0224609375, 0.0107421875, 0.0439453125, 0.0771484375, 0.1103515625, 0.1435546875, 0.1767578125, 0.2099609375, 0.2431640625, 0.2763671875, 0.3095703125, 0.3427734375, 0.3759765625, 0.4091796875, 0.4423828125, 0.4755859375, 0.5087890625, 0.5419921875, 0.5751953125, 0.6083984375, 0.6416015625, 0.6748046875, 0.7080078125, 0.7412109375, 0.7744140625, 0.8076171875, 0.8408203125, 0.8740234375, 0.9072265625, 0.9404296875, 0.9736328125, 1.0068359375, 1.0400390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 4.0, 10.0, 10.0, 9.0, 17.0, 20.0, 17.0, 20.0, 30.0, 22.0, 33.0, 53.0, 41.0, 35.0, 55.0, 131.0, 844078.0, 203443.0, 124.0, 47.0, 44.0, 46.0, 34.0, 36.0, 27.0, 27.0, 22.0, 18.0, 17.0, 12.0, 12.0, 6.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.29296875, -5.1416015625, -4.990234375, -4.8388671875, -4.6875, -4.5361328125, -4.384765625, -4.2333984375, -4.08203125, -3.9306640625, -3.779296875, -3.6279296875, -3.4765625, -3.3251953125, -3.173828125, -3.0224609375, -2.87109375, -2.7197265625, -2.568359375, -2.4169921875, -2.265625, -2.1142578125, -1.962890625, -1.8115234375, -1.66015625, -1.5087890625, -1.357421875, -1.2060546875, -1.0546875, -0.9033203125, -0.751953125, -0.6005859375, -0.44921875, -0.2978515625, -0.146484375, 0.0048828125, 0.15625, 0.3076171875, 0.458984375, 0.6103515625, 0.76171875, 0.9130859375, 1.064453125, 1.2158203125, 1.3671875, 1.5185546875, 1.669921875, 1.8212890625, 1.97265625, 2.1240234375, 2.275390625, 2.4267578125, 2.578125, 2.7294921875, 2.880859375, 3.0322265625, 3.18359375, 3.3349609375, 3.486328125, 3.6376953125, 3.7890625, 3.9404296875, 4.091796875, 4.2431640625, 4.39453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 16.0, 19.0, 19.0, 20.0, 18.0, 29.0, 29.0, 32.0, 46.0, 46.0, 28.0, 54.0, 37.0, 62.0, 49.0, 55.0, 49.0, 42.0, 39.0, 38.0, 32.0, 26.0, 31.0, 22.0, 28.0, 14.0, 15.0, 10.0, 10.0, 8.0, 8.0, 4.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1552734375, -1.1223373413085938, -1.0894012451171875, -1.0564651489257812, -1.023529052734375, -0.9905929565429688, -0.9576568603515625, -0.9247207641601562, -0.89178466796875, -0.8588485717773438, -0.8259124755859375, -0.7929763793945312, -0.760040283203125, -0.7271041870117188, -0.6941680908203125, -0.6612319946289062, -0.6282958984375, -0.5953598022460938, -0.5624237060546875, -0.5294876098632812, -0.496551513671875, -0.46361541748046875, -0.4306793212890625, -0.39774322509765625, -0.36480712890625, -0.33187103271484375, -0.2989349365234375, -0.26599884033203125, -0.233062744140625, -0.20012664794921875, -0.1671905517578125, -0.13425445556640625, -0.101318359375, -0.06838226318359375, -0.0354461669921875, -0.00251007080078125, 0.030426025390625, 0.06336212158203125, 0.0962982177734375, 0.12923431396484375, 0.16217041015625, 0.19510650634765625, 0.2280426025390625, 0.26097869873046875, 0.293914794921875, 0.32685089111328125, 0.3597869873046875, 0.39272308349609375, 0.4256591796875, 0.45859527587890625, 0.4915313720703125, 0.5244674682617188, 0.557403564453125, 0.5903396606445312, 0.6232757568359375, 0.6562118530273438, 0.68914794921875, 0.7220840454101562, 0.7550201416015625, 0.7879562377929688, 0.820892333984375, 0.8538284301757812, 0.8867645263671875, 0.9197006225585938, 0.95263671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 22.0, 14.0, 23.0, 28.0, 60.0, 125.0, 324.0, 979.0, 4664.0, 38956.0, 947680.0, 48448.0, 5403.0, 1191.0, 344.0, 113.0, 60.0, 35.0, 20.0, 15.0, 9.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43497467041015625, -0.4207305908203125, -0.40648651123046875, -0.392242431640625, -0.37799835205078125, -0.3637542724609375, -0.34951019287109375, -0.33526611328125, -0.32102203369140625, -0.3067779541015625, -0.29253387451171875, -0.278289794921875, -0.26404571533203125, -0.2498016357421875, -0.23555755615234375, -0.2213134765625, -0.20706939697265625, -0.1928253173828125, -0.17858123779296875, -0.164337158203125, -0.15009307861328125, -0.1358489990234375, -0.12160491943359375, -0.10736083984375, -0.09311676025390625, -0.0788726806640625, -0.06462860107421875, -0.050384521484375, -0.03614044189453125, -0.0218963623046875, -0.00765228271484375, 0.006591796875, 0.02083587646484375, 0.0350799560546875, 0.04932403564453125, 0.063568115234375, 0.07781219482421875, 0.0920562744140625, 0.10630035400390625, 0.12054443359375, 0.13478851318359375, 0.1490325927734375, 0.16327667236328125, 0.177520751953125, 0.19176483154296875, 0.2060089111328125, 0.22025299072265625, 0.2344970703125, 0.24874114990234375, 0.2629852294921875, 0.27722930908203125, 0.291473388671875, 0.30571746826171875, 0.3199615478515625, 0.33420562744140625, 0.34844970703125, 0.36269378662109375, 0.3769378662109375, 0.39118194580078125, 0.405426025390625, 0.41967010498046875, 0.4339141845703125, 0.44815826416015625, 0.46240234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 10.0, 19.0, 26.0, 25.0, 32.0, 86.0, 173.0, 266.0, 123.0, 65.0, 45.0, 21.0, 22.0, 11.0, 7.0, 7.0, 4.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.855675458908081e-05, -3.723800182342529e-05, -3.5919249057769775e-05, -3.460049629211426e-05, -3.328174352645874e-05, -3.196299076080322e-05, -3.0644237995147705e-05, -2.9325485229492188e-05, -2.800673246383667e-05, -2.6687979698181152e-05, -2.5369226932525635e-05, -2.4050474166870117e-05, -2.27317214012146e-05, -2.1412968635559082e-05, -2.0094215869903564e-05, -1.8775463104248047e-05, -1.745671033859253e-05, -1.6137957572937012e-05, -1.4819204807281494e-05, -1.3500452041625977e-05, -1.2181699275970459e-05, -1.0862946510314941e-05, -9.544193744659424e-06, -8.225440979003906e-06, -6.906688213348389e-06, -5.587935447692871e-06, -4.2691826820373535e-06, -2.950429916381836e-06, -1.6316771507263184e-06, -3.129243850708008e-07, 1.0058283805847168e-06, 2.3245811462402344e-06, 3.643333911895752e-06, 4.9620866775512695e-06, 6.280839443206787e-06, 7.599592208862305e-06, 8.918344974517822e-06, 1.023709774017334e-05, 1.1555850505828857e-05, 1.2874603271484375e-05, 1.4193356037139893e-05, 1.551210880279541e-05, 1.6830861568450928e-05, 1.8149614334106445e-05, 1.9468367099761963e-05, 2.078711986541748e-05, 2.2105872631072998e-05, 2.3424625396728516e-05, 2.4743378162384033e-05, 2.606213092803955e-05, 2.738088369369507e-05, 2.8699636459350586e-05, 3.0018389225006104e-05, 3.133714199066162e-05, 3.265589475631714e-05, 3.3974647521972656e-05, 3.5293400287628174e-05, 3.661215305328369e-05, 3.793090581893921e-05, 3.9249658584594727e-05, 4.0568411350250244e-05, 4.188716411590576e-05, 4.320591688156128e-05, 4.45246696472168e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 9.0, 9.0, 20.0, 15.0, 34.0, 66.0, 126.0, 209.0, 333.0, 764.0, 1625.0, 3873.0, 12032.0, 59014.0, 825269.0, 117966.0, 18042.0, 5222.0, 2013.0, 946.0, 436.0, 219.0, 118.0, 66.0, 42.0, 22.0, 15.0, 15.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19244766235351562, -0.18494415283203125, -0.17744064331054688, -0.1699371337890625, -0.16243362426757812, -0.15493011474609375, -0.14742660522460938, -0.139923095703125, -0.13241958618164062, -0.12491607666015625, -0.11741256713867188, -0.1099090576171875, -0.10240554809570312, -0.09490203857421875, -0.08739852905273438, -0.07989501953125, -0.07239151000976562, -0.06488800048828125, -0.057384490966796875, -0.0498809814453125, -0.042377471923828125, -0.03487396240234375, -0.027370452880859375, -0.019866943359375, -0.012363433837890625, -0.00485992431640625, 0.002643585205078125, 0.0101470947265625, 0.017650604248046875, 0.02515411376953125, 0.032657623291015625, 0.0401611328125, 0.047664642333984375, 0.05516815185546875, 0.06267166137695312, 0.0701751708984375, 0.07767868041992188, 0.08518218994140625, 0.09268569946289062, 0.100189208984375, 0.10769271850585938, 0.11519622802734375, 0.12269973754882812, 0.1302032470703125, 0.13770675659179688, 0.14521026611328125, 0.15271377563476562, 0.16021728515625, 0.16772079467773438, 0.17522430419921875, 0.18272781372070312, 0.1902313232421875, 0.19773483276367188, 0.20523834228515625, 0.21274185180664062, 0.220245361328125, 0.22774887084960938, 0.23525238037109375, 0.24275588989257812, 0.2502593994140625, 0.2577629089355469, 0.26526641845703125, 0.2727699279785156, 0.2802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 8.0, 12.0, 9.0, 15.0, 19.0, 15.0, 30.0, 49.0, 59.0, 78.0, 207.0, 192.0, 90.0, 62.0, 42.0, 23.0, 21.0, 16.0, 14.0, 11.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1019287109375, -0.09931182861328125, -0.0966949462890625, -0.09407806396484375, -0.091461181640625, -0.08884429931640625, -0.0862274169921875, -0.08361053466796875, -0.08099365234375, -0.07837677001953125, -0.0757598876953125, -0.07314300537109375, -0.070526123046875, -0.06790924072265625, -0.0652923583984375, -0.06267547607421875, -0.06005859375, -0.05744171142578125, -0.0548248291015625, -0.05220794677734375, -0.049591064453125, -0.04697418212890625, -0.0443572998046875, -0.04174041748046875, -0.03912353515625, -0.03650665283203125, -0.0338897705078125, -0.03127288818359375, -0.028656005859375, -0.02603912353515625, -0.0234222412109375, -0.02080535888671875, -0.0181884765625, -0.01557159423828125, -0.0129547119140625, -0.01033782958984375, -0.007720947265625, -0.00510406494140625, -0.0024871826171875, 0.00012969970703125, 0.00274658203125, 0.00536346435546875, 0.0079803466796875, 0.01059722900390625, 0.013214111328125, 0.01583099365234375, 0.0184478759765625, 0.02106475830078125, 0.023681640625, 0.02629852294921875, 0.0289154052734375, 0.03153228759765625, 0.034149169921875, 0.03676605224609375, 0.0393829345703125, 0.04199981689453125, 0.04461669921875, 0.04723358154296875, 0.0498504638671875, 0.05246734619140625, 0.055084228515625, 0.05770111083984375, 0.0603179931640625, 0.06293487548828125, 0.0655517578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 14.0, 22.0, 40.0, 102.0, 151.0, 212.0, 200.0, 119.0, 63.0, 26.0, 21.0, 7.0, 10.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0143203735351562, -1.917041540145874, -1.8197627067565918, -1.7224838733673096, -1.625205159187317, -1.5279263257980347, -1.4306474924087524, -1.3333687782287598, -1.2360899448394775, -1.1388111114501953, -1.041532278060913, -0.9442535042762756, -0.8469747304916382, -0.749695897102356, -0.6524170637130737, -0.5551382899284363, -0.4578593969345093, -0.36058059334754944, -0.2633017897605896, -0.16602295637130737, -0.06874415278434753, 0.028534650802612305, 0.12581348419189453, 0.22309225797653198, 0.3203710913658142, 0.41764989495277405, 0.5149286985397339, 0.6122075319290161, 0.7094863653182983, 0.8067651391029358, 0.904043972492218, 1.0013227462768555, 1.0986015796661377, 1.19588041305542, 1.2931592464447021, 1.3904380798339844, 1.487716794013977, 1.5849956274032593, 1.6822744607925415, 1.7795531749725342, 1.8768320083618164, 1.9741108417510986, 2.071389675140381, 2.168668508529663, 2.2659473419189453, 2.3632259368896484, 2.4605050086975098, 2.557783603668213, 2.655062675476074, 2.7523415088653564, 2.8496203422546387, 2.946899175643921, 3.044178009033203, 3.1414566040039062, 3.2387356758117676, 3.3360142707824707, 3.433293104171753, 3.530571937561035, 3.6278507709503174, 3.7251296043395996, 3.822408437728882, 3.919687271118164, 4.016965866088867, 4.1142449378967285, 4.211523532867432]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 12.0, 17.0, 25.0, 20.0, 28.0, 35.0, 32.0, 41.0, 36.0, 36.0, 50.0, 48.0, 49.0, 40.0, 44.0, 52.0, 38.0, 28.0, 34.0, 29.0, 29.0, 31.0, 27.0, 21.0, 25.0, 24.0, 14.0, 15.0, 10.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4211187362670898, -1.374914526939392, -1.3287103176116943, -1.2825061082839966, -1.2363018989562988, -1.1900975704193115, -1.1438934803009033, -1.097689151763916, -1.0514849424362183, -1.0052807331085205, -0.9590765237808228, -0.912872314453125, -0.8666680455207825, -0.8204638361930847, -0.774259626865387, -0.7280553579330444, -0.6818512082099915, -0.6356469988822937, -0.589442789554596, -0.5432385206222534, -0.49703431129455566, -0.4508301019668579, -0.40462589263916016, -0.35842165350914, -0.31221744418144226, -0.2660132348537445, -0.21980899572372437, -0.1736047863960266, -0.12740056216716766, -0.08119633793830872, -0.03499212861061096, 0.01121211051940918, 0.057416319847106934, 0.10362054407596588, 0.14982476830482483, 0.19602897763252258, 0.24223320186138153, 0.2884374260902405, 0.33464163541793823, 0.3808458745479584, 0.42705008387565613, 0.4732542932033539, 0.519458532333374, 0.5656627416610718, 0.6118669509887695, 0.6580711603164673, 0.704275369644165, 0.7504796385765076, 0.7966838479042053, 0.8428880572319031, 0.8890922665596008, 0.9352965354919434, 0.9815007448196411, 1.0277049541473389, 1.0739091634750366, 1.1201133728027344, 1.1663175821304321, 1.2125217914581299, 1.2587260007858276, 1.3049302101135254, 1.3511344194412231, 1.397338628768921, 1.4435429573059082, 1.489747166633606, 1.5359513759613037]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 10.0, 14.0, 20.0, 16.0, 43.0, 41.0, 84.0, 107.0, 176.0, 269.0, 505.0, 832.0, 1548.0, 3307.0, 8509.0, 65841.0, 2569555.0, 1487336.0, 42401.0, 7347.0, 2958.0, 1426.0, 778.0, 410.0, 291.0, 152.0, 92.0, 72.0, 42.0, 26.0, 14.0, 20.0, 6.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8720703125, -1.8115234375, -1.7509765625, -1.6904296875, -1.6298828125, -1.5693359375, -1.5087890625, -1.4482421875, -1.3876953125, -1.3271484375, -1.2666015625, -1.2060546875, -1.1455078125, -1.0849609375, -1.0244140625, -0.9638671875, -0.9033203125, -0.8427734375, -0.7822265625, -0.7216796875, -0.6611328125, -0.6005859375, -0.5400390625, -0.4794921875, -0.4189453125, -0.3583984375, -0.2978515625, -0.2373046875, -0.1767578125, -0.1162109375, -0.0556640625, 0.0048828125, 0.0654296875, 0.1259765625, 0.1865234375, 0.2470703125, 0.3076171875, 0.3681640625, 0.4287109375, 0.4892578125, 0.5498046875, 0.6103515625, 0.6708984375, 0.7314453125, 0.7919921875, 0.8525390625, 0.9130859375, 0.9736328125, 1.0341796875, 1.0947265625, 1.1552734375, 1.2158203125, 1.2763671875, 1.3369140625, 1.3974609375, 1.4580078125, 1.5185546875, 1.5791015625, 1.6396484375, 1.7001953125, 1.7607421875, 1.8212890625, 1.8818359375, 1.9423828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 12.0, 8.0, 13.0, 26.0, 19.0, 19.0, 44.0, 29.0, 35.0, 39.0, 39.0, 74.0, 43.0, 48.0, 52.0, 57.0, 51.0, 44.0, 49.0, 38.0, 29.0, 32.0, 24.0, 22.0, 15.0, 13.0, 12.0, 9.0, 12.0, 8.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7042236328125, -0.683349609375, -0.6624755859375, -0.6416015625, -0.6207275390625, -0.599853515625, -0.5789794921875, -0.55810546875, -0.5372314453125, -0.516357421875, -0.4954833984375, -0.474609375, -0.4537353515625, -0.432861328125, -0.4119873046875, -0.39111328125, -0.3702392578125, -0.349365234375, -0.3284912109375, -0.3076171875, -0.2867431640625, -0.265869140625, -0.2449951171875, -0.22412109375, -0.2032470703125, -0.182373046875, -0.1614990234375, -0.140625, -0.1197509765625, -0.098876953125, -0.0780029296875, -0.05712890625, -0.0362548828125, -0.015380859375, 0.0054931640625, 0.0263671875, 0.0472412109375, 0.068115234375, 0.0889892578125, 0.10986328125, 0.1307373046875, 0.151611328125, 0.1724853515625, 0.193359375, 0.2142333984375, 0.235107421875, 0.2559814453125, 0.27685546875, 0.2977294921875, 0.318603515625, 0.3394775390625, 0.3603515625, 0.3812255859375, 0.402099609375, 0.4229736328125, 0.44384765625, 0.4647216796875, 0.485595703125, 0.5064697265625, 0.52734375, 0.5482177734375, 0.569091796875, 0.5899658203125, 0.61083984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 15.0, 34.0, 61.0, 113.0, 253.0, 679.0, 2177.0, 9724.0, 99850.0, 3986075.0, 83403.0, 8761.0, 1931.0, 603.0, 291.0, 109.0, 69.0, 34.0, 24.0, 16.0, 11.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7516632080078125, -1.680084228515625, -1.6085052490234375, -1.53692626953125, -1.4653472900390625, -1.393768310546875, -1.3221893310546875, -1.2506103515625, -1.1790313720703125, -1.107452392578125, -1.0358734130859375, -0.96429443359375, -0.8927154541015625, -0.821136474609375, -0.7495574951171875, -0.677978515625, -0.6063995361328125, -0.534820556640625, -0.4632415771484375, -0.39166259765625, -0.3200836181640625, -0.248504638671875, -0.1769256591796875, -0.1053466796875, -0.0337677001953125, 0.037811279296875, 0.1093902587890625, 0.18096923828125, 0.2525482177734375, 0.324127197265625, 0.3957061767578125, 0.46728515625, 0.5388641357421875, 0.610443115234375, 0.6820220947265625, 0.75360107421875, 0.8251800537109375, 0.896759033203125, 0.9683380126953125, 1.0399169921875, 1.1114959716796875, 1.183074951171875, 1.2546539306640625, 1.32623291015625, 1.3978118896484375, 1.469390869140625, 1.5409698486328125, 1.612548828125, 1.6841278076171875, 1.755706787109375, 1.8272857666015625, 1.89886474609375, 1.9704437255859375, 2.042022705078125, 2.1136016845703125, 2.1851806640625, 2.2567596435546875, 2.328338623046875, 2.3999176025390625, 2.47149658203125, 2.5430755615234375, 2.614654541015625, 2.6862335205078125, 2.7578125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 8.0, 6.0, 16.0, 15.0, 11.0, 24.0, 25.0, 23.0, 46.0, 56.0, 96.0, 146.0, 316.0, 605.0, 812.0, 762.0, 433.0, 247.0, 132.0, 79.0, 47.0, 32.0, 20.0, 20.0, 17.0, 15.0, 7.0, 10.0, 8.0, 8.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2747764587402344, -0.26488494873046875, -0.2549934387207031, -0.2451019287109375, -0.23521041870117188, -0.22531890869140625, -0.21542739868164062, -0.205535888671875, -0.19564437866210938, -0.18575286865234375, -0.17586135864257812, -0.1659698486328125, -0.15607833862304688, -0.14618682861328125, -0.13629531860351562, -0.12640380859375, -0.11651229858398438, -0.10662078857421875, -0.09672927856445312, -0.0868377685546875, -0.07694625854492188, -0.06705474853515625, -0.057163238525390625, -0.047271728515625, -0.037380218505859375, -0.02748870849609375, -0.017597198486328125, -0.0077056884765625, 0.002185821533203125, 0.01207733154296875, 0.021968841552734375, 0.0318603515625, 0.041751861572265625, 0.05164337158203125, 0.061534881591796875, 0.0714263916015625, 0.08131790161132812, 0.09120941162109375, 0.10110092163085938, 0.110992431640625, 0.12088394165039062, 0.13077545166015625, 0.14066696166992188, 0.1505584716796875, 0.16044998168945312, 0.17034149169921875, 0.18023300170898438, 0.19012451171875, 0.20001602172851562, 0.20990753173828125, 0.21979904174804688, 0.2296905517578125, 0.23958206176757812, 0.24947357177734375, 0.2593650817871094, 0.269256591796875, 0.2791481018066406, 0.28903961181640625, 0.2989311218261719, 0.3088226318359375, 0.3187141418457031, 0.32860565185546875, 0.3384971618652344, 0.348388671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 12.0, 10.0, 17.0, 29.0, 40.0, 55.0, 70.0, 79.0, 130.0, 115.0, 117.0, 89.0, 52.0, 58.0, 33.0, 17.0, 11.0, 14.0, 11.0, 6.0, 6.0, 2.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5149469375610352, -1.4754689931869507, -1.4359909296035767, -1.3965129852294922, -1.3570350408554077, -1.3175570964813232, -1.2780790328979492, -1.2386010885238647, -1.1991231441497803, -1.1596451997756958, -1.1201671361923218, -1.0806891918182373, -1.0412112474441528, -1.0017333030700684, -0.9622552394866943, -0.9227772951126099, -0.8832992315292358, -0.8438212275505066, -0.8043432831764221, -0.7648652791976929, -0.7253873348236084, -0.6859093308448792, -0.6464313268661499, -0.6069533824920654, -0.5674753785133362, -0.5279973745346069, -0.48851943016052246, -0.4490414261817932, -0.40956345200538635, -0.3700854778289795, -0.33060747385025024, -0.2911294996738434, -0.2516516447067261, -0.2121736705303192, -0.17269568145275116, -0.1332176923751831, -0.09373971819877625, -0.054261744022369385, -0.01478375494480133, 0.024694234132766724, 0.06417220830917358, 0.10365018993616104, 0.1431281715631485, 0.18260616064071655, 0.2220841348171234, 0.2615621089935303, 0.3010401129722595, 0.3405180871486664, 0.37999606132507324, 0.4194740355014801, 0.45895200967788696, 0.4984300136566162, 0.5379079580307007, 0.5773859620094299, 0.6168639659881592, 0.6563419103622437, 0.6958199143409729, 0.7352979183197021, 0.7747758626937866, 0.8142538666725159, 0.8537318706512451, 0.8932098150253296, 0.9326878190040588, 0.9721658229827881, 1.0116437673568726]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 11.0, 11.0, 8.0, 12.0, 12.0, 13.0, 22.0, 31.0, 29.0, 25.0, 34.0, 30.0, 30.0, 33.0, 33.0, 31.0, 52.0, 52.0, 38.0, 31.0, 38.0, 40.0, 37.0, 33.0, 30.0, 38.0, 20.0, 27.0, 28.0, 21.0, 20.0, 22.0, 14.0, 10.0, 15.0, 11.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.6883559226989746, -0.668379008769989, -0.6484020948410034, -0.628425121307373, -0.6084482073783875, -0.5884712934494019, -0.5684943795204163, -0.5485174655914307, -0.5285404920578003, -0.5085635781288147, -0.4885866343975067, -0.4686097204685211, -0.44863277673721313, -0.42865586280822754, -0.40867894887924194, -0.38870200514793396, -0.36872509121894836, -0.34874817728996277, -0.3287712335586548, -0.3087943196296692, -0.2888173758983612, -0.2688404619693756, -0.24886353313922882, -0.22888660430908203, -0.20890967547893524, -0.18893274664878845, -0.16895581781864166, -0.14897888898849487, -0.12900197505950928, -0.10902503877878189, -0.0890481173992157, -0.06907118856906891, -0.04909425973892212, -0.02911733277142048, -0.009140405803918839, 0.010836519300937653, 0.030813448131084442, 0.05079037696123123, 0.07076729834079742, 0.09074422717094421, 0.110721156001091, 0.1306980848312378, 0.15067501366138458, 0.17065194249153137, 0.19062885642051697, 0.21060580015182495, 0.23058271408081055, 0.25055962800979614, 0.2705365717411041, 0.2905134856700897, 0.3104904294013977, 0.3304673433303833, 0.3504442870616913, 0.3704212009906769, 0.39039814472198486, 0.41037505865097046, 0.43035197257995605, 0.45032888650894165, 0.47030583024024963, 0.49028274416923523, 0.5102596879005432, 0.5302366018295288, 0.5502135157585144, 0.5701904296875, 0.5901674032211304]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 18.0, 28.0, 42.0, 56.0, 71.0, 137.0, 160.0, 234.0, 359.0, 465.0, 666.0, 1043.0, 1496.0, 2331.0, 3532.0, 5937.0, 11323.0, 24439.0, 74964.0, 492179.0, 327085.0, 56592.0, 20477.0, 9710.0, 5555.0, 3192.0, 2041.0, 1346.0, 945.0, 607.0, 432.0, 317.0, 232.0, 153.0, 102.0, 86.0, 57.0, 27.0, 22.0, 25.0, 14.0, 10.0, 6.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3249320983886719, -0.31441497802734375, -0.3038978576660156, -0.2933807373046875, -0.2828636169433594, -0.27234649658203125, -0.2618293762207031, -0.251312255859375, -0.24079513549804688, -0.23027801513671875, -0.21976089477539062, -0.2092437744140625, -0.19872665405273438, -0.18820953369140625, -0.17769241333007812, -0.16717529296875, -0.15665817260742188, -0.14614105224609375, -0.13562393188476562, -0.1251068115234375, -0.11458969116210938, -0.10407257080078125, -0.09355545043945312, -0.083038330078125, -0.07252120971679688, -0.06200408935546875, -0.051486968994140625, -0.0409698486328125, -0.030452728271484375, -0.01993560791015625, -0.009418487548828125, 0.0010986328125, 0.011615753173828125, 0.02213287353515625, 0.032649993896484375, 0.0431671142578125, 0.053684234619140625, 0.06420135498046875, 0.07471847534179688, 0.085235595703125, 0.09575271606445312, 0.10626983642578125, 0.11678695678710938, 0.1273040771484375, 0.13782119750976562, 0.14833831787109375, 0.15885543823242188, 0.16937255859375, 0.17988967895507812, 0.19040679931640625, 0.20092391967773438, 0.2114410400390625, 0.22195816040039062, 0.23247528076171875, 0.24299240112304688, 0.253509521484375, 0.2640266418457031, 0.27454376220703125, 0.2850608825683594, 0.2955780029296875, 0.3060951232910156, 0.31661224365234375, 0.3271293640136719, 0.337646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 10.0, 12.0, 14.0, 15.0, 19.0, 21.0, 30.0, 26.0, 28.0, 30.0, 34.0, 33.0, 36.0, 55.0, 53.0, 46.0, 52.0, 35.0, 48.0, 38.0, 43.0, 34.0, 39.0, 25.0, 24.0, 22.0, 22.0, 19.0, 18.0, 14.0, 11.0, 16.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0], "bins": [-0.4453125, -0.4327545166015625, -0.420196533203125, -0.4076385498046875, -0.39508056640625, -0.3825225830078125, -0.369964599609375, -0.3574066162109375, -0.3448486328125, -0.3322906494140625, -0.319732666015625, -0.3071746826171875, -0.29461669921875, -0.2820587158203125, -0.269500732421875, -0.2569427490234375, -0.244384765625, -0.2318267822265625, -0.219268798828125, -0.2067108154296875, -0.19415283203125, -0.1815948486328125, -0.169036865234375, -0.1564788818359375, -0.1439208984375, -0.1313629150390625, -0.118804931640625, -0.1062469482421875, -0.09368896484375, -0.0811309814453125, -0.068572998046875, -0.0560150146484375, -0.04345703125, -0.0308990478515625, -0.018341064453125, -0.0057830810546875, 0.00677490234375, 0.0193328857421875, 0.031890869140625, 0.0444488525390625, 0.0570068359375, 0.0695648193359375, 0.082122802734375, 0.0946807861328125, 0.10723876953125, 0.1197967529296875, 0.132354736328125, 0.1449127197265625, 0.157470703125, 0.1700286865234375, 0.182586669921875, 0.1951446533203125, 0.20770263671875, 0.2202606201171875, 0.232818603515625, 0.2453765869140625, 0.2579345703125, 0.2704925537109375, 0.283050537109375, 0.2956085205078125, 0.30816650390625, 0.3207244873046875, 0.333282470703125, 0.3458404541015625, 0.3583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 10.0, 25.0, 41.0, 50.0, 75.0, 112.0, 158.0, 266.0, 406.0, 605.0, 988.0, 1705.0, 2829.0, 5359.0, 10956.0, 26807.0, 80269.0, 318594.0, 424137.0, 112183.0, 34563.0, 13669.0, 6372.0, 3363.0, 1893.0, 1072.0, 692.0, 459.0, 320.0, 172.0, 115.0, 87.0, 56.0, 37.0, 35.0, 25.0, 14.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18313026428222656, -0.17705154418945312, -0.1709728240966797, -0.16489410400390625, -0.1588153839111328, -0.15273666381835938, -0.14665794372558594, -0.1405792236328125, -0.13450050354003906, -0.12842178344726562, -0.12234306335449219, -0.11626434326171875, -0.11018562316894531, -0.10410690307617188, -0.09802818298339844, -0.091949462890625, -0.08587074279785156, -0.07979202270507812, -0.07371330261230469, -0.06763458251953125, -0.06155586242675781, -0.055477142333984375, -0.04939842224121094, -0.0433197021484375, -0.03724098205566406, -0.031162261962890625, -0.025083541870117188, -0.01900482177734375, -0.012926101684570312, -0.006847381591796875, -0.0007686614990234375, 0.00531005859375, 0.011388778686523438, 0.017467498779296875, 0.023546218872070312, 0.02962493896484375, 0.03570365905761719, 0.041782379150390625, 0.04786109924316406, 0.0539398193359375, 0.06001853942871094, 0.06609725952148438, 0.07217597961425781, 0.07825469970703125, 0.08433341979980469, 0.09041213989257812, 0.09649085998535156, 0.102569580078125, 0.10864830017089844, 0.11472702026367188, 0.12080574035644531, 0.12688446044921875, 0.1329631805419922, 0.13904190063476562, 0.14512062072753906, 0.1511993408203125, 0.15727806091308594, 0.16335678100585938, 0.1694355010986328, 0.17551422119140625, 0.1815929412841797, 0.18767166137695312, 0.19375038146972656, 0.1998291015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 10.0, 3.0, 15.0, 13.0, 14.0, 13.0, 17.0, 17.0, 32.0, 29.0, 25.0, 31.0, 32.0, 49.0, 56.0, 32.0, 50.0, 39.0, 47.0, 46.0, 39.0, 34.0, 40.0, 42.0, 33.0, 27.0, 27.0, 34.0, 18.0, 24.0, 12.0, 17.0, 8.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.6693344116210938, -0.6477508544921875, -0.6261672973632812, -0.604583740234375, -0.5830001831054688, -0.5614166259765625, -0.5398330688476562, -0.51824951171875, -0.49666595458984375, -0.4750823974609375, -0.45349884033203125, -0.431915283203125, -0.41033172607421875, -0.3887481689453125, -0.36716461181640625, -0.3455810546875, -0.32399749755859375, -0.3024139404296875, -0.28083038330078125, -0.259246826171875, -0.23766326904296875, -0.2160797119140625, -0.19449615478515625, -0.17291259765625, -0.15132904052734375, -0.1297454833984375, -0.10816192626953125, -0.086578369140625, -0.06499481201171875, -0.0434112548828125, -0.02182769775390625, -0.000244140625, 0.02133941650390625, 0.0429229736328125, 0.06450653076171875, 0.086090087890625, 0.10767364501953125, 0.1292572021484375, 0.15084075927734375, 0.17242431640625, 0.19400787353515625, 0.2155914306640625, 0.23717498779296875, 0.258758544921875, 0.28034210205078125, 0.3019256591796875, 0.32350921630859375, 0.3450927734375, 0.36667633056640625, 0.3882598876953125, 0.40984344482421875, 0.431427001953125, 0.45301055908203125, 0.4745941162109375, 0.49617767333984375, 0.51776123046875, 0.5393447875976562, 0.5609283447265625, 0.5825119018554688, 0.604095458984375, 0.6256790161132812, 0.6472625732421875, 0.6688461303710938, 0.6904296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 42.0, 54.0, 85.0, 132.0, 225.0, 357.0, 611.0, 1193.0, 2235.0, 4614.0, 10980.0, 28990.0, 92764.0, 350725.0, 392717.0, 107487.0, 32894.0, 12104.0, 5141.0, 2388.0, 1163.0, 645.0, 356.0, 234.0, 129.0, 88.0, 44.0, 24.0, 22.0, 16.0, 10.0, 10.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0421142578125, -0.04084014892578125, -0.0395660400390625, -0.03829193115234375, -0.037017822265625, -0.03574371337890625, -0.0344696044921875, -0.03319549560546875, -0.03192138671875, -0.03064727783203125, -0.0293731689453125, -0.02809906005859375, -0.026824951171875, -0.02555084228515625, -0.0242767333984375, -0.02300262451171875, -0.021728515625, -0.02045440673828125, -0.0191802978515625, -0.01790618896484375, -0.016632080078125, -0.01535797119140625, -0.0140838623046875, -0.01280975341796875, -0.01153564453125, -0.01026153564453125, -0.0089874267578125, -0.00771331787109375, -0.006439208984375, -0.00516510009765625, -0.0038909912109375, -0.00261688232421875, -0.0013427734375, -6.866455078125e-05, 0.0012054443359375, 0.00247955322265625, 0.003753662109375, 0.00502777099609375, 0.0063018798828125, 0.00757598876953125, 0.00885009765625, 0.01012420654296875, 0.0113983154296875, 0.01267242431640625, 0.013946533203125, 0.01522064208984375, 0.0164947509765625, 0.01776885986328125, 0.01904296875, 0.02031707763671875, 0.0215911865234375, 0.02286529541015625, 0.024139404296875, 0.02541351318359375, 0.0266876220703125, 0.02796173095703125, 0.02923583984375, 0.03050994873046875, 0.0317840576171875, 0.03305816650390625, 0.034332275390625, 0.03560638427734375, 0.0368804931640625, 0.03815460205078125, 0.0394287109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 17.0, 15.0, 30.0, 45.0, 58.0, 85.0, 133.0, 141.0, 130.0, 102.0, 83.0, 42.0, 34.0, 23.0, 10.0, 17.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.964399755001068e-05, -2.85319983959198e-05, -2.741999924182892e-05, -2.6308000087738037e-05, -2.5196000933647156e-05, -2.4084001779556274e-05, -2.2972002625465393e-05, -2.1860003471374512e-05, -2.074800431728363e-05, -1.963600516319275e-05, -1.8524006009101868e-05, -1.7412006855010986e-05, -1.6300007700920105e-05, -1.5188008546829224e-05, -1.4076009392738342e-05, -1.2964010238647461e-05, -1.185201108455658e-05, -1.0740011930465698e-05, -9.628012776374817e-06, -8.516013622283936e-06, -7.404014468193054e-06, -6.292015314102173e-06, -5.1800161600112915e-06, -4.06801700592041e-06, -2.956017851829529e-06, -1.8440186977386475e-06, -7.320195436477661e-07, 3.7997961044311523e-07, 1.4919787645339966e-06, 2.603977918624878e-06, 3.7159770727157593e-06, 4.827976226806641e-06, 5.939975380897522e-06, 7.051974534988403e-06, 8.163973689079285e-06, 9.275972843170166e-06, 1.0387971997261047e-05, 1.1499971151351929e-05, 1.261197030544281e-05, 1.3723969459533691e-05, 1.4835968613624573e-05, 1.5947967767715454e-05, 1.7059966921806335e-05, 1.8171966075897217e-05, 1.9283965229988098e-05, 2.039596438407898e-05, 2.150796353816986e-05, 2.2619962692260742e-05, 2.3731961846351624e-05, 2.4843961000442505e-05, 2.5955960154533386e-05, 2.7067959308624268e-05, 2.817995846271515e-05, 2.929195761680603e-05, 3.040395677089691e-05, 3.151595592498779e-05, 3.2627955079078674e-05, 3.3739954233169556e-05, 3.485195338726044e-05, 3.596395254135132e-05, 3.70759516954422e-05, 3.818795084953308e-05, 3.929995000362396e-05, 4.0411949157714844e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 49.0, 72.0, 149.0, 340.0, 801.0, 2560.0, 10482.0, 57410.0, 487737.0, 425676.0, 50122.0, 9385.0, 2370.0, 718.0, 298.0, 133.0, 72.0, 32.0, 27.0, 9.0, 20.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08709716796875, -0.0845327377319336, -0.08196830749511719, -0.07940387725830078, -0.07683944702148438, -0.07427501678466797, -0.07171058654785156, -0.06914615631103516, -0.06658172607421875, -0.06401729583740234, -0.06145286560058594, -0.05888843536376953, -0.056324005126953125, -0.05375957489013672, -0.05119514465332031, -0.048630714416503906, -0.0460662841796875, -0.043501853942871094, -0.04093742370605469, -0.03837299346923828, -0.035808563232421875, -0.03324413299560547, -0.030679702758789062, -0.028115272521972656, -0.02555084228515625, -0.022986412048339844, -0.020421981811523438, -0.01785755157470703, -0.015293121337890625, -0.012728691101074219, -0.010164260864257812, -0.007599830627441406, -0.005035400390625, -0.0024709701538085938, 9.34600830078125e-05, 0.0026578903198242188, 0.005222320556640625, 0.007786750793457031, 0.010351181030273438, 0.012915611267089844, 0.01548004150390625, 0.018044471740722656, 0.020608901977539062, 0.02317333221435547, 0.025737762451171875, 0.02830219268798828, 0.030866622924804688, 0.033431053161621094, 0.0359954833984375, 0.038559913635253906, 0.04112434387207031, 0.04368877410888672, 0.046253204345703125, 0.04881763458251953, 0.05138206481933594, 0.053946495056152344, 0.05651092529296875, 0.059075355529785156, 0.06163978576660156, 0.06420421600341797, 0.06676864624023438, 0.06933307647705078, 0.07189750671386719, 0.0744619369506836, 0.0770263671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 8.0, 12.0, 17.0, 13.0, 18.0, 14.0, 27.0, 31.0, 33.0, 53.0, 67.0, 61.0, 72.0, 64.0, 63.0, 73.0, 57.0, 47.0, 47.0, 32.0, 31.0, 34.0, 20.0, 22.0, 13.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0129241943359375, -0.012572526931762695, -0.01222085952758789, -0.011869192123413086, -0.011517524719238281, -0.011165857315063477, -0.010814189910888672, -0.010462522506713867, -0.010110855102539062, -0.009759187698364258, -0.009407520294189453, -0.009055852890014648, -0.008704185485839844, -0.008352518081665039, -0.008000850677490234, -0.00764918327331543, -0.007297515869140625, -0.00694584846496582, -0.006594181060791016, -0.006242513656616211, -0.005890846252441406, -0.0055391788482666016, -0.005187511444091797, -0.004835844039916992, -0.0044841766357421875, -0.004132509231567383, -0.003780841827392578, -0.0034291744232177734, -0.0030775070190429688, -0.002725839614868164, -0.0023741722106933594, -0.0020225048065185547, -0.00167083740234375, -0.0013191699981689453, -0.0009675025939941406, -0.0006158351898193359, -0.00026416778564453125, 8.749961853027344e-05, 0.0004391670227050781, 0.0007908344268798828, 0.0011425018310546875, 0.0014941692352294922, 0.0018458366394042969, 0.0021975040435791016, 0.0025491714477539062, 0.002900838851928711, 0.0032525062561035156, 0.0036041736602783203, 0.003955841064453125, 0.00430750846862793, 0.004659175872802734, 0.005010843276977539, 0.005362510681152344, 0.0057141780853271484, 0.006065845489501953, 0.006417512893676758, 0.0067691802978515625, 0.007120847702026367, 0.007472515106201172, 0.007824182510375977, 0.008175849914550781, 0.008527517318725586, 0.00887918472290039, 0.009230852127075195, 0.00958251953125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 7.0, 11.0, 26.0, 25.0, 42.0, 43.0, 66.0, 89.0, 115.0, 114.0, 108.0, 92.0, 47.0, 48.0, 36.0, 31.0, 19.0, 8.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.8256650567054749, -0.8052636981010437, -0.7848622798919678, -0.7644609212875366, -0.7440595626831055, -0.7236582040786743, -0.7032567858695984, -0.6828554272651672, -0.6624540090560913, -0.6420526504516602, -0.6216512322425842, -0.6012498736381531, -0.5808485150337219, -0.560447096824646, -0.5400457382202148, -0.5196443796157837, -0.49924302101135254, -0.478841632604599, -0.45844027400016785, -0.4380388855934143, -0.41763752698898315, -0.3972361385822296, -0.3768347501754761, -0.3564333915710449, -0.3360320031642914, -0.31563061475753784, -0.2952292561531067, -0.27482786774635315, -0.2544264793395996, -0.23402512073516846, -0.21362373232841492, -0.19322235882282257, -0.17282095551490784, -0.1524195820093155, -0.13201820850372314, -0.1116168200969696, -0.09121544659137726, -0.07081407308578491, -0.05041269212961197, -0.030011311173439026, -0.00960993766784668, 0.010791439563035965, 0.03119281679391861, 0.051594194024801254, 0.0719955712556839, 0.09239694476127625, 0.11279832571744919, 0.13319970667362213, 0.15360108017921448, 0.17400245368480682, 0.19440382719039917, 0.2148052155971527, 0.23520658910274506, 0.2556079626083374, 0.27600935101509094, 0.2964107394218445, 0.31681209802627563, 0.3372134864330292, 0.3576148450374603, 0.37801623344421387, 0.398417592048645, 0.41881898045539856, 0.4392203688621521, 0.45962172746658325, 0.4800231158733368]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 12.0, 9.0, 12.0, 20.0, 17.0, 26.0, 36.0, 24.0, 25.0, 32.0, 28.0, 42.0, 32.0, 51.0, 49.0, 52.0, 45.0, 41.0, 29.0, 40.0, 37.0, 27.0, 48.0, 29.0, 24.0, 26.0, 33.0, 17.0, 15.0, 17.0, 12.0, 15.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 4.0, 4.0], "bins": [-0.43707090616226196, -0.4251249432563782, -0.4131790101528168, -0.40123307704925537, -0.3892871141433716, -0.3773411512374878, -0.3653952181339264, -0.353449285030365, -0.3415033221244812, -0.3295573592185974, -0.317611426115036, -0.3056654930114746, -0.2937195301055908, -0.28177356719970703, -0.26982763409614563, -0.25788170099258423, -0.24593573808670044, -0.23398979008197784, -0.22204384207725525, -0.21009789407253265, -0.19815194606781006, -0.18620599806308746, -0.17426005005836487, -0.16231410205364227, -0.15036815404891968, -0.13842220604419708, -0.1264762580394745, -0.11453031003475189, -0.1025843620300293, -0.0906384140253067, -0.0786924660205841, -0.06674651801586151, -0.054800570011138916, -0.04285462200641632, -0.030908674001693726, -0.01896272599697113, -0.007016777992248535, 0.00492917001247406, 0.016875118017196655, 0.02882106602191925, 0.040767014026641846, 0.05271296203136444, 0.06465891003608704, 0.07660485804080963, 0.08855080604553223, 0.10049675405025482, 0.11244270205497742, 0.12438865005970001, 0.1363345980644226, 0.1482805460691452, 0.1602264940738678, 0.1721724420785904, 0.184118390083313, 0.19606433808803558, 0.20801028609275818, 0.21995623409748077, 0.23190218210220337, 0.24384813010692596, 0.25579407811164856, 0.26774001121520996, 0.27968597412109375, 0.29163193702697754, 0.30357787013053894, 0.31552380323410034, 0.32746976613998413]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 8.0, 10.0, 14.0, 18.0, 38.0, 56.0, 77.0, 97.0, 123.0, 206.0, 342.0, 471.0, 734.0, 1180.0, 1848.0, 3102.0, 5420.0, 10728.0, 32728.0, 269941.0, 625557.0, 63409.0, 15432.0, 7000.0, 3819.0, 2255.0, 1367.0, 885.0, 551.0, 397.0, 240.0, 151.0, 90.0, 70.0, 58.0, 43.0, 29.0, 24.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.484619140625, -0.4700202941894531, -0.45542144775390625, -0.4408226013183594, -0.4262237548828125, -0.4116249084472656, -0.39702606201171875, -0.3824272155761719, -0.367828369140625, -0.3532295227050781, -0.33863067626953125, -0.3240318298339844, -0.3094329833984375, -0.2948341369628906, -0.28023529052734375, -0.2656364440917969, -0.25103759765625, -0.23643875122070312, -0.22183990478515625, -0.20724105834960938, -0.1926422119140625, -0.17804336547851562, -0.16344451904296875, -0.14884567260742188, -0.134246826171875, -0.11964797973632812, -0.10504913330078125, -0.09045028686523438, -0.0758514404296875, -0.061252593994140625, -0.04665374755859375, -0.032054901123046875, -0.0174560546875, -0.002857208251953125, 0.01174163818359375, 0.026340484619140625, 0.0409393310546875, 0.055538177490234375, 0.07013702392578125, 0.08473587036132812, 0.099334716796875, 0.11393356323242188, 0.12853240966796875, 0.14313125610351562, 0.1577301025390625, 0.17232894897460938, 0.18692779541015625, 0.20152664184570312, 0.21612548828125, 0.23072433471679688, 0.24532318115234375, 0.2599220275878906, 0.2745208740234375, 0.2891197204589844, 0.30371856689453125, 0.3183174133300781, 0.332916259765625, 0.3475151062011719, 0.36211395263671875, 0.3767127990722656, 0.3913116455078125, 0.4059104919433594, 0.42050933837890625, 0.4351081848144531, 0.44970703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 7.0, 9.0, 9.0, 14.0, 17.0, 27.0, 17.0, 25.0, 26.0, 33.0, 22.0, 38.0, 44.0, 47.0, 50.0, 47.0, 59.0, 52.0, 47.0, 30.0, 40.0, 47.0, 32.0, 28.0, 25.0, 33.0, 27.0, 19.0, 16.0, 19.0, 17.0, 9.0, 7.0, 11.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.00390625, -0.9770126342773438, -0.9501190185546875, -0.9232254028320312, -0.896331787109375, -0.8694381713867188, -0.8425445556640625, -0.8156509399414062, -0.78875732421875, -0.7618637084960938, -0.7349700927734375, -0.7080764770507812, -0.681182861328125, -0.6542892456054688, -0.6273956298828125, -0.6005020141601562, -0.5736083984375, -0.5467147827148438, -0.5198211669921875, -0.49292755126953125, -0.466033935546875, -0.43914031982421875, -0.4122467041015625, -0.38535308837890625, -0.35845947265625, -0.33156585693359375, -0.3046722412109375, -0.27777862548828125, -0.250885009765625, -0.22399139404296875, -0.1970977783203125, -0.17020416259765625, -0.143310546875, -0.11641693115234375, -0.0895233154296875, -0.06262969970703125, -0.035736083984375, -0.00884246826171875, 0.0180511474609375, 0.04494476318359375, 0.07183837890625, 0.09873199462890625, 0.1256256103515625, 0.15251922607421875, 0.179412841796875, 0.20630645751953125, 0.2332000732421875, 0.26009368896484375, 0.2869873046875, 0.31388092041015625, 0.3407745361328125, 0.36766815185546875, 0.394561767578125, 0.42145538330078125, 0.4483489990234375, 0.47524261474609375, 0.50213623046875, 0.5290298461914062, 0.5559234619140625, 0.5828170776367188, 0.609710693359375, 0.6366043090820312, 0.6634979248046875, 0.6903915405273438, 0.71728515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 3.0, 4.0, 7.0, 2.0, 5.0, 6.0, 12.0, 14.0, 5.0, 23.0, 17.0, 23.0, 17.0, 14.0, 28.0, 28.0, 39.0, 35.0, 45.0, 64.0, 136.0, 700.0, 38981.0, 1005200.0, 2556.0, 184.0, 63.0, 56.0, 36.0, 29.0, 33.0, 24.0, 22.0, 21.0, 17.0, 19.0, 8.0, 7.0, 13.0, 5.0, 9.0, 13.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.337921142578125, -2.25787353515625, -2.177825927734375, -2.0977783203125, -2.017730712890625, -1.93768310546875, -1.857635498046875, -1.777587890625, -1.697540283203125, -1.61749267578125, -1.537445068359375, -1.4573974609375, -1.377349853515625, -1.29730224609375, -1.217254638671875, -1.13720703125, -1.057159423828125, -0.97711181640625, -0.897064208984375, -0.8170166015625, -0.736968994140625, -0.65692138671875, -0.576873779296875, -0.496826171875, -0.416778564453125, -0.33673095703125, -0.256683349609375, -0.1766357421875, -0.096588134765625, -0.01654052734375, 0.063507080078125, 0.1435546875, 0.223602294921875, 0.30364990234375, 0.383697509765625, 0.4637451171875, 0.543792724609375, 0.62384033203125, 0.703887939453125, 0.783935546875, 0.863983154296875, 0.94403076171875, 1.024078369140625, 1.1041259765625, 1.184173583984375, 1.26422119140625, 1.344268798828125, 1.42431640625, 1.504364013671875, 1.58441162109375, 1.664459228515625, 1.7445068359375, 1.824554443359375, 1.90460205078125, 1.984649658203125, 2.064697265625, 2.144744873046875, 2.22479248046875, 2.304840087890625, 2.3848876953125, 2.464935302734375, 2.54498291015625, 2.625030517578125, 2.705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 20.0, 21.0, 16.0, 21.0, 21.0, 26.0, 33.0, 36.0, 47.0, 35.0, 59.0, 51.0, 42.0, 45.0, 35.0, 64.0, 38.0, 38.0, 31.0, 40.0, 34.0, 23.0, 19.0, 23.0, 24.0, 13.0, 13.0, 14.0, 9.0, 6.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.72705078125, -0.70263671875, -0.67822265625, -0.65380859375, -0.62939453125, -0.60498046875, -0.58056640625, -0.55615234375, -0.53173828125, -0.50732421875, -0.48291015625, -0.45849609375, -0.43408203125, -0.40966796875, -0.38525390625, -0.36083984375, -0.33642578125, -0.31201171875, -0.28759765625, -0.26318359375, -0.23876953125, -0.21435546875, -0.18994140625, -0.16552734375, -0.14111328125, -0.11669921875, -0.09228515625, -0.06787109375, -0.04345703125, -0.01904296875, 0.00537109375, 0.02978515625, 0.05419921875, 0.07861328125, 0.10302734375, 0.12744140625, 0.15185546875, 0.17626953125, 0.20068359375, 0.22509765625, 0.24951171875, 0.27392578125, 0.29833984375, 0.32275390625, 0.34716796875, 0.37158203125, 0.39599609375, 0.42041015625, 0.44482421875, 0.46923828125, 0.49365234375, 0.51806640625, 0.54248046875, 0.56689453125, 0.59130859375, 0.61572265625, 0.64013671875, 0.66455078125, 0.68896484375, 0.71337890625, 0.73779296875, 0.76220703125, 0.78662109375, 0.81103515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 11.0, 13.0, 27.0, 37.0, 59.0, 109.0, 152.0, 295.0, 584.0, 1136.0, 2481.0, 6147.0, 22850.0, 635212.0, 350621.0, 18586.0, 5442.0, 2293.0, 1138.0, 595.0, 340.0, 171.0, 93.0, 61.0, 26.0, 25.0, 12.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271728515625, -0.26416778564453125, -0.2566070556640625, -0.24904632568359375, -0.241485595703125, -0.23392486572265625, -0.2263641357421875, -0.21880340576171875, -0.21124267578125, -0.20368194580078125, -0.1961212158203125, -0.18856048583984375, -0.180999755859375, -0.17343902587890625, -0.1658782958984375, -0.15831756591796875, -0.1507568359375, -0.14319610595703125, -0.1356353759765625, -0.12807464599609375, -0.120513916015625, -0.11295318603515625, -0.1053924560546875, -0.09783172607421875, -0.09027099609375, -0.08271026611328125, -0.0751495361328125, -0.06758880615234375, -0.060028076171875, -0.05246734619140625, -0.0449066162109375, -0.03734588623046875, -0.02978515625, -0.02222442626953125, -0.0146636962890625, -0.00710296630859375, 0.000457763671875, 0.00801849365234375, 0.0155792236328125, 0.02313995361328125, 0.03070068359375, 0.03826141357421875, 0.0458221435546875, 0.05338287353515625, 0.060943603515625, 0.06850433349609375, 0.0760650634765625, 0.08362579345703125, 0.0911865234375, 0.09874725341796875, 0.1063079833984375, 0.11386871337890625, 0.121429443359375, 0.12899017333984375, 0.1365509033203125, 0.14411163330078125, 0.15167236328125, 0.15923309326171875, 0.1667938232421875, 0.17435455322265625, 0.181915283203125, 0.18947601318359375, 0.1970367431640625, 0.20459747314453125, 0.212158203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 2.0, 8.0, 8.0, 23.0, 44.0, 154.0, 408.0, 210.0, 60.0, 31.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.277510404586792e-05, -3.091990947723389e-05, -2.9064714908599854e-05, -2.720952033996582e-05, -2.5354325771331787e-05, -2.3499131202697754e-05, -2.164393663406372e-05, -1.9788742065429688e-05, -1.7933547496795654e-05, -1.607835292816162e-05, -1.4223158359527588e-05, -1.2367963790893555e-05, -1.0512769222259521e-05, -8.657574653625488e-06, -6.802380084991455e-06, -4.947185516357422e-06, -3.0919909477233887e-06, -1.2367963790893555e-06, 6.183981895446777e-07, 2.473592758178711e-06, 4.328787326812744e-06, 6.183981895446777e-06, 8.03917646408081e-06, 9.894371032714844e-06, 1.1749565601348877e-05, 1.360476016998291e-05, 1.5459954738616943e-05, 1.7315149307250977e-05, 1.917034387588501e-05, 2.1025538444519043e-05, 2.2880733013153076e-05, 2.473592758178711e-05, 2.6591122150421143e-05, 2.8446316719055176e-05, 3.030151128768921e-05, 3.215670585632324e-05, 3.4011900424957275e-05, 3.586709499359131e-05, 3.772228956222534e-05, 3.9577484130859375e-05, 4.143267869949341e-05, 4.328787326812744e-05, 4.5143067836761475e-05, 4.699826240539551e-05, 4.885345697402954e-05, 5.0708651542663574e-05, 5.256384611129761e-05, 5.441904067993164e-05, 5.6274235248565674e-05, 5.812942981719971e-05, 5.998462438583374e-05, 6.183981895446777e-05, 6.36950135231018e-05, 6.555020809173584e-05, 6.740540266036987e-05, 6.92605972290039e-05, 7.111579179763794e-05, 7.297098636627197e-05, 7.4826180934906e-05, 7.668137550354004e-05, 7.853657007217407e-05, 8.03917646408081e-05, 8.224695920944214e-05, 8.410215377807617e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 22.0, 23.0, 43.0, 49.0, 95.0, 119.0, 213.0, 329.0, 489.0, 849.0, 1368.0, 2337.0, 4480.0, 9882.0, 32141.0, 584514.0, 365636.0, 27049.0, 8954.0, 4193.0, 2292.0, 1265.0, 824.0, 459.0, 336.0, 177.0, 122.0, 86.0, 56.0, 35.0, 30.0, 13.0, 15.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2122802734375, -0.20563507080078125, -0.1989898681640625, -0.19234466552734375, -0.185699462890625, -0.17905426025390625, -0.1724090576171875, -0.16576385498046875, -0.15911865234375, -0.15247344970703125, -0.1458282470703125, -0.13918304443359375, -0.132537841796875, -0.12589263916015625, -0.1192474365234375, -0.11260223388671875, -0.10595703125, -0.09931182861328125, -0.0926666259765625, -0.08602142333984375, -0.079376220703125, -0.07273101806640625, -0.0660858154296875, -0.05944061279296875, -0.05279541015625, -0.04615020751953125, -0.0395050048828125, -0.03285980224609375, -0.026214599609375, -0.01956939697265625, -0.0129241943359375, -0.00627899169921875, 0.0003662109375, 0.00701141357421875, 0.0136566162109375, 0.02030181884765625, 0.026947021484375, 0.03359222412109375, 0.0402374267578125, 0.04688262939453125, 0.05352783203125, 0.06017303466796875, 0.0668182373046875, 0.07346343994140625, 0.080108642578125, 0.08675384521484375, 0.0933990478515625, 0.10004425048828125, 0.106689453125, 0.11333465576171875, 0.1199798583984375, 0.12662506103515625, 0.133270263671875, 0.13991546630859375, 0.1465606689453125, 0.15320587158203125, 0.15985107421875, 0.16649627685546875, 0.1731414794921875, 0.17978668212890625, 0.186431884765625, 0.19307708740234375, 0.1997222900390625, 0.20636749267578125, 0.2130126953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 14.0, 23.0, 31.0, 50.0, 102.0, 203.0, 248.0, 120.0, 58.0, 40.0, 17.0, 17.0, 13.0, 4.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10771656036376953, -0.10447120666503906, -0.1012258529663086, -0.09798049926757812, -0.09473514556884766, -0.09148979187011719, -0.08824443817138672, -0.08499908447265625, -0.08175373077392578, -0.07850837707519531, -0.07526302337646484, -0.07201766967773438, -0.0687723159790039, -0.06552696228027344, -0.06228160858154297, -0.0590362548828125, -0.05579090118408203, -0.05254554748535156, -0.049300193786621094, -0.046054840087890625, -0.042809486389160156, -0.03956413269042969, -0.03631877899169922, -0.03307342529296875, -0.02982807159423828, -0.026582717895507812, -0.023337364196777344, -0.020092010498046875, -0.016846656799316406, -0.013601303100585938, -0.010355949401855469, -0.007110595703125, -0.0038652420043945312, -0.0006198883056640625, 0.0026254653930664062, 0.005870819091796875, 0.009116172790527344, 0.012361526489257812, 0.015606880187988281, 0.01885223388671875, 0.02209758758544922, 0.025342941284179688, 0.028588294982910156, 0.031833648681640625, 0.035079002380371094, 0.03832435607910156, 0.04156970977783203, 0.0448150634765625, 0.04806041717529297, 0.05130577087402344, 0.054551124572753906, 0.057796478271484375, 0.061041831970214844, 0.06428718566894531, 0.06753253936767578, 0.07077789306640625, 0.07402324676513672, 0.07726860046386719, 0.08051395416259766, 0.08375930786132812, 0.0870046615600586, 0.09025001525878906, 0.09349536895751953, 0.09674072265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 15.0, 13.0, 19.0, 28.0, 49.0, 54.0, 91.0, 115.0, 136.0, 113.0, 115.0, 76.0, 44.0, 31.0, 27.0, 14.0, 14.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9558732509613037, -1.9066932201385498, -1.857513189315796, -1.808333158493042, -1.759153127670288, -1.7099730968475342, -1.6607930660247803, -1.6116130352020264, -1.5624330043792725, -1.5132529735565186, -1.4640729427337646, -1.4148929119110107, -1.3657128810882568, -1.316532850265503, -1.267352819442749, -1.2181727886199951, -1.1689927577972412, -1.1198127269744873, -1.0706326961517334, -1.0214526653289795, -0.9722726345062256, -0.9230926036834717, -0.8739125728607178, -0.8247325420379639, -0.77555251121521, -0.726372480392456, -0.6771924495697021, -0.6280124187469482, -0.5788323879241943, -0.5296523571014404, -0.4804723262786865, -0.4312922954559326, -0.38211214542388916, -0.33293211460113525, -0.28375208377838135, -0.23457205295562744, -0.18539202213287354, -0.13621199131011963, -0.08703196048736572, -0.037851929664611816, 0.01132810115814209, 0.060508131980895996, 0.1096881628036499, 0.1588681936264038, 0.20804822444915771, 0.2572282552719116, 0.3064082860946655, 0.35558831691741943, 0.40476834774017334, 0.45394837856292725, 0.5031284093856812, 0.5523084402084351, 0.601488471031189, 0.6506685018539429, 0.6998485326766968, 0.7490285634994507, 0.7982085943222046, 0.8473886251449585, 0.8965686559677124, 0.9457486867904663, 0.9949287176132202, 1.0441087484359741, 1.093288779258728, 1.142468810081482, 1.1916488409042358]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 13.0, 19.0, 18.0, 23.0, 30.0, 42.0, 29.0, 37.0, 46.0, 40.0, 40.0, 45.0, 51.0, 40.0, 45.0, 43.0, 42.0, 34.0, 40.0, 47.0, 35.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 16.0, 5.0, 6.0, 9.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3416337966918945, -1.2968405485153198, -1.2520473003387451, -1.2072540521621704, -1.1624608039855957, -1.1176674365997314, -1.0728741884231567, -1.028080940246582, -0.9832876920700073, -0.9384944438934326, -0.8937011957168579, -0.8489078879356384, -0.8041146397590637, -0.759321391582489, -0.7145280838012695, -0.6697348356246948, -0.6249415874481201, -0.5801483392715454, -0.5353550910949707, -0.4905617833137512, -0.4457685351371765, -0.4009752869606018, -0.3561820089817047, -0.3113887310028076, -0.2665954828262329, -0.221802219748497, -0.1770089566707611, -0.1322156935930252, -0.0874224305152893, -0.042629167437553406, 0.002164095640182495, 0.04695737361907959, 0.09175074100494385, 0.13654400408267975, 0.18133726716041565, 0.22613053023815155, 0.27092379331588745, 0.31571704149246216, 0.36051031947135925, 0.40530359745025635, 0.45009684562683105, 0.49489009380340576, 0.5396833419799805, 0.5844766497612, 0.6292698979377747, 0.6740631461143494, 0.7188564538955688, 0.7636497020721436, 0.8084429502487183, 0.853236198425293, 0.8980294466018677, 0.9428227543830872, 0.9876160025596619, 1.0324093103408813, 1.077202558517456, 1.1219958066940308, 1.1667890548706055, 1.2115823030471802, 1.2563755512237549, 1.3011687994003296, 1.3459620475769043, 1.3907554149627686, 1.4355486631393433, 1.480341911315918, 1.5251351594924927]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 14.0, 18.0, 24.0, 41.0, 55.0, 87.0, 180.0, 338.0, 839.0, 2499.0, 10447.0, 298524.0, 3814377.0, 57758.0, 6136.0, 1687.0, 615.0, 247.0, 144.0, 75.0, 42.0, 37.0, 30.0, 15.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24407958984375, -2.1619873046875, -2.07989501953125, -1.997802734375, -1.91571044921875, -1.8336181640625, -1.75152587890625, -1.66943359375, -1.58734130859375, -1.5052490234375, -1.42315673828125, -1.341064453125, -1.25897216796875, -1.1768798828125, -1.09478759765625, -1.0126953125, -0.93060302734375, -0.8485107421875, -0.76641845703125, -0.684326171875, -0.60223388671875, -0.5201416015625, -0.43804931640625, -0.35595703125, -0.27386474609375, -0.1917724609375, -0.10968017578125, -0.027587890625, 0.05450439453125, 0.1365966796875, 0.21868896484375, 0.30078125, 0.38287353515625, 0.4649658203125, 0.54705810546875, 0.629150390625, 0.71124267578125, 0.7933349609375, 0.87542724609375, 0.95751953125, 1.03961181640625, 1.1217041015625, 1.20379638671875, 1.285888671875, 1.36798095703125, 1.4500732421875, 1.53216552734375, 1.6142578125, 1.69635009765625, 1.7784423828125, 1.86053466796875, 1.942626953125, 2.02471923828125, 2.1068115234375, 2.18890380859375, 2.27099609375, 2.35308837890625, 2.4351806640625, 2.51727294921875, 2.599365234375, 2.68145751953125, 2.7635498046875, 2.84564208984375, 2.927734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 15.0, 14.0, 19.0, 22.0, 28.0, 39.0, 35.0, 38.0, 55.0, 50.0, 58.0, 59.0, 45.0, 62.0, 51.0, 56.0, 57.0, 39.0, 38.0, 38.0, 25.0, 27.0, 25.0, 23.0, 15.0, 12.0, 5.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6843109130859375, -0.663543701171875, -0.6427764892578125, -0.62200927734375, -0.6012420654296875, -0.580474853515625, -0.5597076416015625, -0.5389404296875, -0.5181732177734375, -0.497406005859375, -0.4766387939453125, -0.45587158203125, -0.4351043701171875, -0.414337158203125, -0.3935699462890625, -0.372802734375, -0.3520355224609375, -0.331268310546875, -0.3105010986328125, -0.28973388671875, -0.2689666748046875, -0.248199462890625, -0.2274322509765625, -0.2066650390625, -0.1858978271484375, -0.165130615234375, -0.1443634033203125, -0.12359619140625, -0.1028289794921875, -0.082061767578125, -0.0612945556640625, -0.04052734375, -0.0197601318359375, 0.001007080078125, 0.0217742919921875, 0.04254150390625, 0.0633087158203125, 0.084075927734375, 0.1048431396484375, 0.1256103515625, 0.1463775634765625, 0.167144775390625, 0.1879119873046875, 0.20867919921875, 0.2294464111328125, 0.250213623046875, 0.2709808349609375, 0.291748046875, 0.3125152587890625, 0.333282470703125, 0.3540496826171875, 0.37481689453125, 0.3955841064453125, 0.416351318359375, 0.4371185302734375, 0.4578857421875, 0.4786529541015625, 0.499420166015625, 0.5201873779296875, 0.54095458984375, 0.5617218017578125, 0.582489013671875, 0.6032562255859375, 0.6240234375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 11.0, 12.0, 15.0, 9.0, 21.0, 26.0, 50.0, 72.0, 84.0, 208.0, 467.0, 1029.0, 2839.0, 9934.0, 51272.0, 2088163.0, 1974104.0, 51169.0, 9881.0, 2929.0, 1033.0, 423.0, 190.0, 110.0, 68.0, 36.0, 31.0, 18.0, 16.0, 21.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.08050537109375, -1.0389404296875, -0.99737548828125, -0.955810546875, -0.91424560546875, -0.8726806640625, -0.83111572265625, -0.78955078125, -0.74798583984375, -0.7064208984375, -0.66485595703125, -0.623291015625, -0.58172607421875, -0.5401611328125, -0.49859619140625, -0.45703125, -0.41546630859375, -0.3739013671875, -0.33233642578125, -0.290771484375, -0.24920654296875, -0.2076416015625, -0.16607666015625, -0.12451171875, -0.08294677734375, -0.0413818359375, 0.00018310546875, 0.041748046875, 0.08331298828125, 0.1248779296875, 0.16644287109375, 0.2080078125, 0.24957275390625, 0.2911376953125, 0.33270263671875, 0.374267578125, 0.41583251953125, 0.4573974609375, 0.49896240234375, 0.54052734375, 0.58209228515625, 0.6236572265625, 0.66522216796875, 0.706787109375, 0.74835205078125, 0.7899169921875, 0.83148193359375, 0.873046875, 0.91461181640625, 0.9561767578125, 0.99774169921875, 1.039306640625, 1.08087158203125, 1.1224365234375, 1.16400146484375, 1.20556640625, 1.24713134765625, 1.2886962890625, 1.33026123046875, 1.371826171875, 1.41339111328125, 1.4549560546875, 1.49652099609375, 1.5380859375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 17.0, 16.0, 23.0, 29.0, 39.0, 65.0, 99.0, 114.0, 250.0, 461.0, 723.0, 820.0, 536.0, 315.0, 182.0, 94.0, 56.0, 45.0, 31.0, 23.0, 26.0, 19.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28076171875, -0.272308349609375, -0.26385498046875, -0.255401611328125, -0.2469482421875, -0.238494873046875, -0.23004150390625, -0.221588134765625, -0.213134765625, -0.204681396484375, -0.19622802734375, -0.187774658203125, -0.1793212890625, -0.170867919921875, -0.16241455078125, -0.153961181640625, -0.1455078125, -0.137054443359375, -0.12860107421875, -0.120147705078125, -0.1116943359375, -0.103240966796875, -0.09478759765625, -0.086334228515625, -0.077880859375, -0.069427490234375, -0.06097412109375, -0.052520751953125, -0.0440673828125, -0.035614013671875, -0.02716064453125, -0.018707275390625, -0.01025390625, -0.001800537109375, 0.00665283203125, 0.015106201171875, 0.0235595703125, 0.032012939453125, 0.04046630859375, 0.048919677734375, 0.057373046875, 0.065826416015625, 0.07427978515625, 0.082733154296875, 0.0911865234375, 0.099639892578125, 0.10809326171875, 0.116546630859375, 0.125, 0.133453369140625, 0.14190673828125, 0.150360107421875, 0.1588134765625, 0.167266845703125, 0.17572021484375, 0.184173583984375, 0.192626953125, 0.201080322265625, 0.20953369140625, 0.217987060546875, 0.2264404296875, 0.234893798828125, 0.24334716796875, 0.251800537109375, 0.26025390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 12.0, 19.0, 17.0, 28.0, 33.0, 56.0, 70.0, 133.0, 164.0, 129.0, 89.0, 58.0, 56.0, 39.0, 30.0, 19.0, 7.0, 6.0, 9.0, 6.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6198253631591797, -1.5801854133605957, -1.5405454635620117, -1.5009055137634277, -1.4612655639648438, -1.4216256141662598, -1.3819856643676758, -1.3423457145690918, -1.3027057647705078, -1.2630658149719238, -1.2234258651733398, -1.1837859153747559, -1.1441459655761719, -1.104506015777588, -1.064866065979004, -1.02522611618042, -0.9855862259864807, -0.9459462761878967, -0.9063063263893127, -0.8666663765907288, -0.8270264267921448, -0.7873864769935608, -0.7477465867996216, -0.7081066370010376, -0.6684666872024536, -0.6288267374038696, -0.5891867876052856, -0.5495468378067017, -0.5099068880081177, -0.4702669382095337, -0.4306270182132721, -0.3909870684146881, -0.35134708881378174, -0.31170713901519775, -0.27206718921661377, -0.23242725431919098, -0.192787304520607, -0.153147354722023, -0.11350741982460022, -0.07386747002601624, -0.03422752022743225, 0.005412425845861435, 0.04505237191915512, 0.08469231426715851, 0.12433226406574249, 0.16397221386432648, 0.20361214876174927, 0.24325209856033325, 0.28289204835891724, 0.3225319981575012, 0.3621719479560852, 0.4018118977546692, 0.4414518475532532, 0.48109179735183716, 0.5207316875457764, 0.5603716373443604, 0.6000115871429443, 0.6396515369415283, 0.6792914867401123, 0.7189314365386963, 0.7585713863372803, 0.7982113361358643, 0.8378512859344482, 0.8774912357330322, 0.9171311855316162]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 4.0, 8.0, 12.0, 12.0, 13.0, 20.0, 19.0, 16.0, 34.0, 33.0, 43.0, 40.0, 47.0, 38.0, 45.0, 48.0, 44.0, 46.0, 43.0, 48.0, 44.0, 44.0, 49.0, 36.0, 24.0, 30.0, 31.0, 21.0, 22.0, 12.0, 17.0, 13.0, 5.0, 10.0, 9.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6572402715682983, -0.6374079585075378, -0.6175755858421326, -0.5977432727813721, -0.5779109001159668, -0.5580785870552063, -0.5382462739944458, -0.5184139013290405, -0.49858158826828003, -0.47874924540519714, -0.45891690254211426, -0.43908458948135376, -0.4192522466182709, -0.399419903755188, -0.3795875608921051, -0.3597552180290222, -0.33992287516593933, -0.32009053230285645, -0.30025818943977356, -0.2804258465766907, -0.2605935335159302, -0.2407611906528473, -0.2209288477897644, -0.2010965198278427, -0.18126417696475983, -0.16143183410167694, -0.14159950613975525, -0.12176716327667236, -0.10193482786417007, -0.08210249245166779, -0.0622701495885849, -0.04243782162666321, -0.022605478763580322, -0.002773141488432884, 0.017059195786714554, 0.03689153492450714, 0.05672387033700943, 0.07655620574951172, 0.0963885486125946, 0.1162208765745163, 0.13605321943759918, 0.15588556230068207, 0.17571789026260376, 0.19555023312568665, 0.21538257598876953, 0.23521490395069122, 0.2550472617149353, 0.2748795747756958, 0.2947119176387787, 0.3145442605018616, 0.33437660336494446, 0.35420894622802734, 0.37404125928878784, 0.3938736021518707, 0.4137059450149536, 0.4335382580757141, 0.4533706307411194, 0.47320297360420227, 0.49303531646728516, 0.5128676295280457, 0.5327000021934509, 0.5525323152542114, 0.5723646879196167, 0.5921970009803772, 0.6120293140411377]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 0.0, 4.0, 8.0, 9.0, 12.0, 22.0, 30.0, 41.0, 53.0, 114.0, 179.0, 301.0, 676.0, 1314.0, 2955.0, 7102.0, 19750.0, 65950.0, 294994.0, 489817.0, 115624.0, 30930.0, 10728.0, 4176.0, 1820.0, 888.0, 425.0, 256.0, 134.0, 75.0, 41.0, 32.0, 28.0, 15.0, 14.0, 13.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.1900634765625, -0.18521499633789062, -0.18036651611328125, -0.17551803588867188, -0.1706695556640625, -0.16582107543945312, -0.16097259521484375, -0.15612411499023438, -0.151275634765625, -0.14642715454101562, -0.14157867431640625, -0.13673019409179688, -0.1318817138671875, -0.12703323364257812, -0.12218475341796875, -0.11733627319335938, -0.11248779296875, -0.10763931274414062, -0.10279083251953125, -0.09794235229492188, -0.0930938720703125, -0.08824539184570312, -0.08339691162109375, -0.07854843139648438, -0.073699951171875, -0.06885147094726562, -0.06400299072265625, -0.059154510498046875, -0.0543060302734375, -0.049457550048828125, -0.04460906982421875, -0.039760589599609375, -0.034912109375, -0.030063629150390625, -0.02521514892578125, -0.020366668701171875, -0.0155181884765625, -0.010669708251953125, -0.00582122802734375, -0.000972747802734375, 0.003875732421875, 0.008724212646484375, 0.01357269287109375, 0.018421173095703125, 0.0232696533203125, 0.028118133544921875, 0.03296661376953125, 0.037815093994140625, 0.04266357421875, 0.047512054443359375, 0.05236053466796875, 0.057209014892578125, 0.0620574951171875, 0.06690597534179688, 0.07175445556640625, 0.07660293579101562, 0.081451416015625, 0.08629989624023438, 0.09114837646484375, 0.09599685668945312, 0.1008453369140625, 0.10569381713867188, 0.11054229736328125, 0.11539077758789062, 0.1202392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 15.0, 18.0, 18.0, 18.0, 34.0, 42.0, 42.0, 50.0, 52.0, 52.0, 58.0, 57.0, 54.0, 62.0, 50.0, 45.0, 55.0, 43.0, 29.0, 31.0, 26.0, 24.0, 17.0, 14.0, 18.0, 7.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489013671875, -0.4742240905761719, -0.45943450927734375, -0.4446449279785156, -0.4298553466796875, -0.4150657653808594, -0.40027618408203125, -0.3854866027832031, -0.370697021484375, -0.3559074401855469, -0.34111785888671875, -0.3263282775878906, -0.3115386962890625, -0.2967491149902344, -0.28195953369140625, -0.2671699523925781, -0.25238037109375, -0.23759078979492188, -0.22280120849609375, -0.20801162719726562, -0.1932220458984375, -0.17843246459960938, -0.16364288330078125, -0.14885330200195312, -0.134063720703125, -0.11927413940429688, -0.10448455810546875, -0.08969497680664062, -0.0749053955078125, -0.060115814208984375, -0.04532623291015625, -0.030536651611328125, -0.0157470703125, -0.000957489013671875, 0.01383209228515625, 0.028621673583984375, 0.0434112548828125, 0.058200836181640625, 0.07299041748046875, 0.08777999877929688, 0.102569580078125, 0.11735916137695312, 0.13214874267578125, 0.14693832397460938, 0.1617279052734375, 0.17651748657226562, 0.19130706787109375, 0.20609664916992188, 0.22088623046875, 0.23567581176757812, 0.25046539306640625, 0.2652549743652344, 0.2800445556640625, 0.2948341369628906, 0.30962371826171875, 0.3244132995605469, 0.339202880859375, 0.3539924621582031, 0.36878204345703125, 0.3835716247558594, 0.3983612060546875, 0.4131507873535156, 0.42794036865234375, 0.4427299499511719, 0.45751953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 35.0, 29.0, 66.0, 104.0, 200.0, 323.0, 560.0, 1117.0, 2437.0, 5608.0, 15156.0, 46892.0, 171207.0, 476806.0, 234098.0, 61370.0, 19434.0, 7058.0, 2940.0, 1473.0, 696.0, 368.0, 212.0, 103.0, 75.0, 47.0, 36.0, 11.0, 9.0, 10.0, 4.0, 7.0, 2.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.12017822265625, -0.11637687683105469, -0.11257553100585938, -0.10877418518066406, -0.10497283935546875, -0.10117149353027344, -0.09737014770507812, -0.09356880187988281, -0.0897674560546875, -0.08596611022949219, -0.08216476440429688, -0.07836341857910156, -0.07456207275390625, -0.07076072692871094, -0.06695938110351562, -0.06315803527832031, -0.059356689453125, -0.05555534362792969, -0.051753997802734375, -0.04795265197753906, -0.04415130615234375, -0.04034996032714844, -0.036548614501953125, -0.03274726867675781, -0.0289459228515625, -0.025144577026367188, -0.021343231201171875, -0.017541885375976562, -0.01374053955078125, -0.009939193725585938, -0.006137847900390625, -0.0023365020751953125, 0.00146484375, 0.0052661895751953125, 0.009067535400390625, 0.012868881225585938, 0.01667022705078125, 0.020471572875976562, 0.024272918701171875, 0.028074264526367188, 0.0318756103515625, 0.03567695617675781, 0.039478302001953125, 0.04327964782714844, 0.04708099365234375, 0.05088233947753906, 0.054683685302734375, 0.05848503112792969, 0.062286376953125, 0.06608772277832031, 0.06988906860351562, 0.07369041442871094, 0.07749176025390625, 0.08129310607910156, 0.08509445190429688, 0.08889579772949219, 0.0926971435546875, 0.09649848937988281, 0.10029983520507812, 0.10410118103027344, 0.10790252685546875, 0.11170387268066406, 0.11550521850585938, 0.11930656433105469, 0.12310791015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 11.0, 14.0, 13.0, 17.0, 22.0, 27.0, 25.0, 37.0, 35.0, 34.0, 48.0, 50.0, 54.0, 35.0, 43.0, 52.0, 55.0, 48.0, 30.0, 44.0, 40.0, 42.0, 35.0, 37.0, 23.0, 19.0, 21.0, 14.0, 11.0, 8.0, 10.0, 5.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7099609375, -0.6864700317382812, -0.6629791259765625, -0.6394882202148438, -0.615997314453125, -0.5925064086914062, -0.5690155029296875, -0.5455245971679688, -0.52203369140625, -0.49854278564453125, -0.4750518798828125, -0.45156097412109375, -0.428070068359375, -0.40457916259765625, -0.3810882568359375, -0.35759735107421875, -0.3341064453125, -0.31061553955078125, -0.2871246337890625, -0.26363372802734375, -0.240142822265625, -0.21665191650390625, -0.1931610107421875, -0.16967010498046875, -0.14617919921875, -0.12268829345703125, -0.0991973876953125, -0.07570648193359375, -0.052215576171875, -0.02872467041015625, -0.0052337646484375, 0.01825714111328125, 0.041748046875, 0.06523895263671875, 0.0887298583984375, 0.11222076416015625, 0.135711669921875, 0.15920257568359375, 0.1826934814453125, 0.20618438720703125, 0.22967529296875, 0.25316619873046875, 0.2766571044921875, 0.30014801025390625, 0.323638916015625, 0.34712982177734375, 0.3706207275390625, 0.39411163330078125, 0.4176025390625, 0.44109344482421875, 0.4645843505859375, 0.48807525634765625, 0.511566162109375, 0.5350570678710938, 0.5585479736328125, 0.5820388793945312, 0.60552978515625, 0.6290206909179688, 0.6525115966796875, 0.6760025024414062, 0.699493408203125, 0.7229843139648438, 0.7464752197265625, 0.7699661254882812, 0.79345703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 10.0, 33.0, 37.0, 61.0, 143.0, 213.0, 378.0, 922.0, 2184.0, 6491.0, 23357.0, 118118.0, 594906.0, 244463.0, 41226.0, 10345.0, 3246.0, 1199.0, 579.0, 271.0, 145.0, 71.0, 46.0, 26.0, 18.0, 8.0, 5.0, 9.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.05021333694458008, -0.048577308654785156, -0.046941280364990234, -0.04530525207519531, -0.04366922378540039, -0.04203319549560547, -0.04039716720581055, -0.038761138916015625, -0.0371251106262207, -0.03548908233642578, -0.03385305404663086, -0.03221702575683594, -0.030580997467041016, -0.028944969177246094, -0.027308940887451172, -0.02567291259765625, -0.024036884307861328, -0.022400856018066406, -0.020764827728271484, -0.019128799438476562, -0.01749277114868164, -0.01585674285888672, -0.014220714569091797, -0.012584686279296875, -0.010948657989501953, -0.009312629699707031, -0.007676601409912109, -0.0060405731201171875, -0.004404544830322266, -0.0027685165405273438, -0.0011324882507324219, 0.0005035400390625, 0.002139568328857422, 0.0037755966186523438, 0.005411624908447266, 0.0070476531982421875, 0.00868368148803711, 0.010319709777832031, 0.011955738067626953, 0.013591766357421875, 0.015227794647216797, 0.01686382293701172, 0.01849985122680664, 0.020135879516601562, 0.021771907806396484, 0.023407936096191406, 0.025043964385986328, 0.02667999267578125, 0.028316020965576172, 0.029952049255371094, 0.031588077545166016, 0.03322410583496094, 0.03486013412475586, 0.03649616241455078, 0.0381321907043457, 0.039768218994140625, 0.04140424728393555, 0.04304027557373047, 0.04467630386352539, 0.04631233215332031, 0.047948360443115234, 0.049584388732910156, 0.05122041702270508, 0.0528564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 12.0, 13.0, 9.0, 17.0, 17.0, 39.0, 42.0, 68.0, 117.0, 126.0, 101.0, 127.0, 89.0, 60.0, 47.0, 31.0, 26.0, 16.0, 6.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.552436828613281e-05, -3.464706242084503e-05, -3.376975655555725e-05, -3.289245069026947e-05, -3.201514482498169e-05, -3.113783895969391e-05, -3.0260533094406128e-05, -2.9383227229118347e-05, -2.8505921363830566e-05, -2.7628615498542786e-05, -2.6751309633255005e-05, -2.5874003767967224e-05, -2.4996697902679443e-05, -2.4119392037391663e-05, -2.3242086172103882e-05, -2.23647803068161e-05, -2.148747444152832e-05, -2.061016857624054e-05, -1.973286271095276e-05, -1.8855556845664978e-05, -1.7978250980377197e-05, -1.7100945115089417e-05, -1.6223639249801636e-05, -1.5346333384513855e-05, -1.4469027519226074e-05, -1.3591721653938293e-05, -1.2714415788650513e-05, -1.1837109923362732e-05, -1.0959804058074951e-05, -1.008249819278717e-05, -9.20519232749939e-06, -8.327886462211609e-06, -7.450580596923828e-06, -6.573274731636047e-06, -5.695968866348267e-06, -4.818663001060486e-06, -3.941357135772705e-06, -3.0640512704849243e-06, -2.1867454051971436e-06, -1.3094395399093628e-06, -4.3213367462158203e-07, 4.4517219066619873e-07, 1.3224780559539795e-06, 2.1997839212417603e-06, 3.077089786529541e-06, 3.954395651817322e-06, 4.8317015171051025e-06, 5.709007382392883e-06, 6.586313247680664e-06, 7.463619112968445e-06, 8.340924978256226e-06, 9.218230843544006e-06, 1.0095536708831787e-05, 1.0972842574119568e-05, 1.1850148439407349e-05, 1.272745430469513e-05, 1.360476016998291e-05, 1.4482066035270691e-05, 1.535937190055847e-05, 1.6236677765846252e-05, 1.7113983631134033e-05, 1.7991289496421814e-05, 1.8868595361709595e-05, 1.9745901226997375e-05, 2.0623207092285156e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 8.0, 21.0, 42.0, 46.0, 69.0, 124.0, 207.0, 363.0, 564.0, 935.0, 1759.0, 3390.0, 6780.0, 15876.0, 41380.0, 127518.0, 392454.0, 307847.0, 93239.0, 31555.0, 12299.0, 5637.0, 2779.0, 1524.0, 848.0, 485.0, 279.0, 201.0, 118.0, 62.0, 45.0, 34.0, 14.0, 16.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.037506103515625, -0.03643035888671875, -0.0353546142578125, -0.03427886962890625, -0.033203125, -0.03212738037109375, -0.0310516357421875, -0.02997589111328125, -0.028900146484375, -0.02782440185546875, -0.0267486572265625, -0.02567291259765625, -0.02459716796875, -0.02352142333984375, -0.0224456787109375, -0.02136993408203125, -0.020294189453125, -0.01921844482421875, -0.0181427001953125, -0.01706695556640625, -0.0159912109375, -0.01491546630859375, -0.0138397216796875, -0.01276397705078125, -0.011688232421875, -0.01061248779296875, -0.0095367431640625, -0.00846099853515625, -0.00738525390625, -0.00630950927734375, -0.0052337646484375, -0.00415802001953125, -0.003082275390625, -0.00200653076171875, -0.0009307861328125, 0.00014495849609375, 0.001220703125, 0.00229644775390625, 0.0033721923828125, 0.00444793701171875, 0.005523681640625, 0.00659942626953125, 0.0076751708984375, 0.00875091552734375, 0.00982666015625, 0.01090240478515625, 0.0119781494140625, 0.01305389404296875, 0.014129638671875, 0.01520538330078125, 0.0162811279296875, 0.01735687255859375, 0.0184326171875, 0.01950836181640625, 0.0205841064453125, 0.02165985107421875, 0.022735595703125, 0.02381134033203125, 0.0248870849609375, 0.02596282958984375, 0.02703857421875, 0.02811431884765625, 0.0291900634765625, 0.03026580810546875, 0.031341552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 21.0, 31.0, 25.0, 34.0, 70.0, 72.0, 65.0, 97.0, 75.0, 82.0, 78.0, 58.0, 63.0, 47.0, 37.0, 26.0, 16.0, 19.0, 11.0, 12.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.011307954788208008, -0.010950565338134766, -0.010593175888061523, -0.010235786437988281, -0.009878396987915039, -0.009521007537841797, -0.009163618087768555, -0.008806228637695312, -0.00844883918762207, -0.008091449737548828, -0.007734060287475586, -0.007376670837402344, -0.0070192813873291016, -0.006661891937255859, -0.006304502487182617, -0.005947113037109375, -0.005589723587036133, -0.005232334136962891, -0.0048749446868896484, -0.004517555236816406, -0.004160165786743164, -0.003802776336669922, -0.0034453868865966797, -0.0030879974365234375, -0.0027306079864501953, -0.002373218536376953, -0.002015829086303711, -0.0016584396362304688, -0.0013010501861572266, -0.0009436607360839844, -0.0005862712860107422, -0.0002288818359375, 0.0001285076141357422, 0.0004858970642089844, 0.0008432865142822266, 0.0012006759643554688, 0.001558065414428711, 0.0019154548645019531, 0.0022728443145751953, 0.0026302337646484375, 0.0029876232147216797, 0.003345012664794922, 0.003702402114868164, 0.004059791564941406, 0.0044171810150146484, 0.004774570465087891, 0.005131959915161133, 0.005489349365234375, 0.005846738815307617, 0.006204128265380859, 0.0065615177154541016, 0.006918907165527344, 0.007276296615600586, 0.007633686065673828, 0.00799107551574707, 0.008348464965820312, 0.008705854415893555, 0.009063243865966797, 0.009420633316040039, 0.009778022766113281, 0.010135412216186523, 0.010492801666259766, 0.010850191116333008, 0.01120758056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 19.0, 22.0, 26.0, 53.0, 74.0, 164.0, 195.0, 167.0, 83.0, 76.0, 46.0, 21.0, 9.0, 14.0, 10.0, 3.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4605964422225952, -1.4278874397277832, -1.3951785564422607, -1.3624695539474487, -1.3297605514526367, -1.2970515489578247, -1.2643426656723022, -1.2316336631774902, -1.1989246606826782, -1.1662156581878662, -1.1335067749023438, -1.1007977724075317, -1.0680887699127197, -1.0353797674179077, -1.0026708841323853, -0.9699618816375732, -0.937252938747406, -0.9045439958572388, -0.8718349933624268, -0.8391260504722595, -0.8064170479774475, -0.7737081050872803, -0.7409991025924683, -0.708290159702301, -0.6755812168121338, -0.6428722739219666, -0.6101632714271545, -0.5774543285369873, -0.5447453260421753, -0.5120363831520081, -0.47932741045951843, -0.4466184377670288, -0.4139094948768616, -0.38120052218437195, -0.3484915494918823, -0.3157826066017151, -0.2830736041069031, -0.25036466121673584, -0.21765568852424622, -0.1849467158317566, -0.15223774313926697, -0.11952877044677734, -0.08681980520486832, -0.05411083996295929, -0.021401867270469666, 0.011307105422019958, 0.04401606321334839, 0.07672503590583801, 0.10943400859832764, 0.14214298129081726, 0.17485195398330688, 0.20756091177463531, 0.24026988446712494, 0.27297884225845337, 0.305687814950943, 0.3383967876434326, 0.37110576033592224, 0.40381473302841187, 0.4365237057209015, 0.4692326784133911, 0.5019416213035583, 0.5346506237983704, 0.5673595666885376, 0.6000685691833496, 0.6327775120735168]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 4.0, 6.0, 11.0, 21.0, 17.0, 20.0, 26.0, 25.0, 39.0, 45.0, 50.0, 52.0, 46.0, 52.0, 53.0, 43.0, 55.0, 57.0, 46.0, 53.0, 51.0, 28.0, 30.0, 31.0, 28.0, 20.0, 13.0, 20.0, 11.0, 3.0, 8.0, 8.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44822201132774353, -0.4344092905521393, -0.42059656977653503, -0.4067838490009308, -0.39297112822532654, -0.3791584074497223, -0.36534565687179565, -0.3515329360961914, -0.33772021532058716, -0.3239074945449829, -0.31009477376937866, -0.2962820529937744, -0.28246933221817017, -0.2686566114425659, -0.25484389066696167, -0.24103115499019623, -0.22721844911575317, -0.21340572834014893, -0.19959300756454468, -0.18578028678894043, -0.17196756601333618, -0.15815484523773193, -0.1443421095609665, -0.13052938878536224, -0.116716668009758, -0.10290394723415375, -0.0890912264585495, -0.07527849823236465, -0.061465777456760406, -0.04765305668115616, -0.033840328454971313, -0.020027607679367065, -0.006214916706085205, 0.007597805932164192, 0.02141052857041359, 0.035223253071308136, 0.049035973846912384, 0.06284869462251663, 0.07666142284870148, 0.09047414362430573, 0.10428686439990997, 0.11809958517551422, 0.13191230595111847, 0.1457250416278839, 0.15953776240348816, 0.1733504831790924, 0.18716320395469666, 0.2009759247303009, 0.21478864550590515, 0.2286013662815094, 0.24241408705711365, 0.2562268078327179, 0.27003952860832214, 0.2838522493839264, 0.297664999961853, 0.3114777207374573, 0.3252904415130615, 0.33910316228866577, 0.35291588306427, 0.36672860383987427, 0.3805413246154785, 0.39435404539108276, 0.408166766166687, 0.42197948694229126, 0.4357922077178955]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 13.0, 16.0, 23.0, 36.0, 39.0, 60.0, 64.0, 106.0, 118.0, 182.0, 254.0, 359.0, 513.0, 822.0, 1274.0, 2238.0, 4476.0, 10097.0, 35030.0, 373309.0, 551628.0, 44532.0, 11797.0, 4875.0, 2498.0, 1413.0, 840.0, 554.0, 355.0, 282.0, 198.0, 126.0, 97.0, 74.0, 56.0, 47.0, 32.0, 28.0, 20.0, 20.0, 11.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.53271484375, -0.5161056518554688, -0.4994964599609375, -0.48288726806640625, -0.466278076171875, -0.44966888427734375, -0.4330596923828125, -0.41645050048828125, -0.39984130859375, -0.38323211669921875, -0.3666229248046875, -0.35001373291015625, -0.333404541015625, -0.31679534912109375, -0.3001861572265625, -0.28357696533203125, -0.2669677734375, -0.25035858154296875, -0.2337493896484375, -0.21714019775390625, -0.200531005859375, -0.18392181396484375, -0.1673126220703125, -0.15070343017578125, -0.13409423828125, -0.11748504638671875, -0.1008758544921875, -0.08426666259765625, -0.067657470703125, -0.05104827880859375, -0.0344390869140625, -0.01782989501953125, -0.001220703125, 0.01538848876953125, 0.0319976806640625, 0.04860687255859375, 0.065216064453125, 0.08182525634765625, 0.0984344482421875, 0.11504364013671875, 0.13165283203125, 0.14826202392578125, 0.1648712158203125, 0.18148040771484375, 0.198089599609375, 0.21469879150390625, 0.2313079833984375, 0.24791717529296875, 0.2645263671875, 0.28113555908203125, 0.2977447509765625, 0.31435394287109375, 0.330963134765625, 0.34757232666015625, 0.3641815185546875, 0.38079071044921875, 0.39739990234375, 0.41400909423828125, 0.4306182861328125, 0.44722747802734375, 0.463836669921875, 0.48044586181640625, 0.4970550537109375, 0.5136642456054688, 0.5302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 2.0, 6.0, 17.0, 15.0, 17.0, 26.0, 24.0, 52.0, 45.0, 58.0, 57.0, 54.0, 57.0, 63.0, 65.0, 63.0, 53.0, 56.0, 64.0, 33.0, 16.0, 28.0, 30.0, 19.0, 17.0, 11.0, 9.0, 6.0, 2.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9509658813476562, -0.9199981689453125, -0.8890304565429688, -0.858062744140625, -0.8270950317382812, -0.7961273193359375, -0.7651596069335938, -0.73419189453125, -0.7032241821289062, -0.6722564697265625, -0.6412887573242188, -0.610321044921875, -0.5793533325195312, -0.5483856201171875, -0.5174179077148438, -0.4864501953125, -0.45548248291015625, -0.4245147705078125, -0.39354705810546875, -0.362579345703125, -0.33161163330078125, -0.3006439208984375, -0.26967620849609375, -0.23870849609375, -0.20774078369140625, -0.1767730712890625, -0.14580535888671875, -0.114837646484375, -0.08386993408203125, -0.0529022216796875, -0.02193450927734375, 0.009033203125, 0.04000091552734375, 0.0709686279296875, 0.10193634033203125, 0.132904052734375, 0.16387176513671875, 0.1948394775390625, 0.22580718994140625, 0.25677490234375, 0.28774261474609375, 0.3187103271484375, 0.34967803955078125, 0.380645751953125, 0.41161346435546875, 0.4425811767578125, 0.47354888916015625, 0.5045166015625, 0.5354843139648438, 0.5664520263671875, 0.5974197387695312, 0.628387451171875, 0.6593551635742188, 0.6903228759765625, 0.7212905883789062, 0.75225830078125, 0.7832260131835938, 0.8141937255859375, 0.8451614379882812, 0.876129150390625, 0.9070968627929688, 0.9380645751953125, 0.9690322875976562, 1.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 7.0, 12.0, 15.0, 24.0, 40.0, 42.0, 73.0, 101.0, 136.0, 227.0, 404.0, 894.0, 2694.0, 21337.0, 990297.0, 27104.0, 2999.0, 970.0, 476.0, 232.0, 121.0, 96.0, 53.0, 45.0, 30.0, 18.0, 19.0, 14.0, 10.0, 13.0, 15.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0628662109375, -1.021240234375, -0.9796142578125, -0.93798828125, -0.8963623046875, -0.854736328125, -0.8131103515625, -0.771484375, -0.7298583984375, -0.688232421875, -0.6466064453125, -0.60498046875, -0.5633544921875, -0.521728515625, -0.4801025390625, -0.4384765625, -0.3968505859375, -0.355224609375, -0.3135986328125, -0.27197265625, -0.2303466796875, -0.188720703125, -0.1470947265625, -0.10546875, -0.0638427734375, -0.022216796875, 0.0194091796875, 0.06103515625, 0.1026611328125, 0.144287109375, 0.1859130859375, 0.2275390625, 0.2691650390625, 0.310791015625, 0.3524169921875, 0.39404296875, 0.4356689453125, 0.477294921875, 0.5189208984375, 0.560546875, 0.6021728515625, 0.643798828125, 0.6854248046875, 0.72705078125, 0.7686767578125, 0.810302734375, 0.8519287109375, 0.8935546875, 0.9351806640625, 0.976806640625, 1.0184326171875, 1.06005859375, 1.1016845703125, 1.143310546875, 1.1849365234375, 1.2265625, 1.2681884765625, 1.309814453125, 1.3514404296875, 1.39306640625, 1.4346923828125, 1.476318359375, 1.5179443359375, 1.5595703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 3.0, 5.0, 3.0, 8.0, 15.0, 9.0, 15.0, 18.0, 17.0, 17.0, 29.0, 24.0, 23.0, 32.0, 28.0, 36.0, 32.0, 31.0, 44.0, 43.0, 34.0, 45.0, 44.0, 25.0, 38.0, 36.0, 44.0, 42.0, 22.0, 33.0, 22.0, 21.0, 23.0, 25.0, 16.0, 11.0, 10.0, 12.0, 8.0, 6.0, 14.0, 12.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.63330078125, -0.6142730712890625, -0.595245361328125, -0.5762176513671875, -0.55718994140625, -0.5381622314453125, -0.519134521484375, -0.5001068115234375, -0.4810791015625, -0.4620513916015625, -0.443023681640625, -0.4239959716796875, -0.40496826171875, -0.3859405517578125, -0.366912841796875, -0.3478851318359375, -0.328857421875, -0.3098297119140625, -0.290802001953125, -0.2717742919921875, -0.25274658203125, -0.2337188720703125, -0.214691162109375, -0.1956634521484375, -0.1766357421875, -0.1576080322265625, -0.138580322265625, -0.1195526123046875, -0.10052490234375, -0.0814971923828125, -0.062469482421875, -0.0434417724609375, -0.0244140625, -0.0053863525390625, 0.013641357421875, 0.0326690673828125, 0.05169677734375, 0.0707244873046875, 0.089752197265625, 0.1087799072265625, 0.1278076171875, 0.1468353271484375, 0.165863037109375, 0.1848907470703125, 0.20391845703125, 0.2229461669921875, 0.241973876953125, 0.2610015869140625, 0.280029296875, 0.2990570068359375, 0.318084716796875, 0.3371124267578125, 0.35614013671875, 0.3751678466796875, 0.394195556640625, 0.4132232666015625, 0.4322509765625, 0.4512786865234375, 0.470306396484375, 0.4893341064453125, 0.50836181640625, 0.5273895263671875, 0.546417236328125, 0.5654449462890625, 0.58447265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 12.0, 19.0, 41.0, 74.0, 113.0, 257.0, 605.0, 1952.0, 8795.0, 75833.0, 849914.0, 97045.0, 10433.0, 2185.0, 676.0, 273.0, 121.0, 53.0, 45.0, 28.0, 10.0, 6.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19780349731445312, -0.19223785400390625, -0.18667221069335938, -0.1811065673828125, -0.17554092407226562, -0.16997528076171875, -0.16440963745117188, -0.158843994140625, -0.15327835083007812, -0.14771270751953125, -0.14214706420898438, -0.1365814208984375, -0.13101577758789062, -0.12545013427734375, -0.11988449096679688, -0.11431884765625, -0.10875320434570312, -0.10318756103515625, -0.09762191772460938, -0.0920562744140625, -0.08649063110351562, -0.08092498779296875, -0.07535934448242188, -0.069793701171875, -0.06422805786132812, -0.05866241455078125, -0.053096771240234375, -0.0475311279296875, -0.041965484619140625, -0.03639984130859375, -0.030834197998046875, -0.0252685546875, -0.019702911376953125, -0.01413726806640625, -0.008571624755859375, -0.0030059814453125, 0.002559661865234375, 0.00812530517578125, 0.013690948486328125, 0.019256591796875, 0.024822235107421875, 0.03038787841796875, 0.035953521728515625, 0.0415191650390625, 0.047084808349609375, 0.05265045166015625, 0.058216094970703125, 0.06378173828125, 0.06934738159179688, 0.07491302490234375, 0.08047866821289062, 0.0860443115234375, 0.09160995483398438, 0.09717559814453125, 0.10274124145507812, 0.108306884765625, 0.11387252807617188, 0.11943817138671875, 0.12500381469726562, 0.1305694580078125, 0.13613510131835938, 0.14170074462890625, 0.14726638793945312, 0.15283203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 8.0, 13.0, 22.0, 22.0, 34.0, 46.0, 63.0, 80.0, 134.0, 119.0, 113.0, 129.0, 52.0, 41.0, 27.0, 24.0, 10.0, 10.0, 8.0, 4.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5106983482837677e-05, -1.459755003452301e-05, -1.4088116586208344e-05, -1.3578683137893677e-05, -1.306924968957901e-05, -1.2559816241264343e-05, -1.2050382792949677e-05, -1.154094934463501e-05, -1.1031515896320343e-05, -1.0522082448005676e-05, -1.001264899969101e-05, -9.503215551376343e-06, -8.993782103061676e-06, -8.48434865474701e-06, -7.974915206432343e-06, -7.465481758117676e-06, -6.956048309803009e-06, -6.446614861488342e-06, -5.9371814131736755e-06, -5.427747964859009e-06, -4.918314516544342e-06, -4.408881068229675e-06, -3.8994476199150085e-06, -3.390014171600342e-06, -2.880580723285675e-06, -2.3711472749710083e-06, -1.8617138266563416e-06, -1.3522803783416748e-06, -8.428469300270081e-07, -3.334134817123413e-07, 1.7601996660232544e-07, 6.854534149169922e-07, 1.194886863231659e-06, 1.7043203115463257e-06, 2.2137537598609924e-06, 2.723187208175659e-06, 3.232620656490326e-06, 3.7420541048049927e-06, 4.2514875531196594e-06, 4.760921001434326e-06, 5.270354449748993e-06, 5.77978789806366e-06, 6.289221346378326e-06, 6.798654794692993e-06, 7.30808824300766e-06, 7.817521691322327e-06, 8.326955139636993e-06, 8.83638858795166e-06, 9.345822036266327e-06, 9.855255484580994e-06, 1.036468893289566e-05, 1.0874122381210327e-05, 1.1383555829524994e-05, 1.189298927783966e-05, 1.2402422726154327e-05, 1.2911856174468994e-05, 1.3421289622783661e-05, 1.3930723071098328e-05, 1.4440156519412994e-05, 1.4949589967727661e-05, 1.5459023416042328e-05, 1.5968456864356995e-05, 1.647789031267166e-05, 1.6987323760986328e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 20.0, 21.0, 35.0, 70.0, 106.0, 160.0, 276.0, 465.0, 838.0, 1585.0, 3513.0, 9430.0, 41734.0, 594093.0, 352506.0, 29839.0, 7579.0, 2980.0, 1411.0, 738.0, 442.0, 254.0, 171.0, 107.0, 63.0, 35.0, 24.0, 14.0, 9.0, 6.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2088623046875, -0.2036285400390625, -0.198394775390625, -0.1931610107421875, -0.18792724609375, -0.1826934814453125, -0.177459716796875, -0.1722259521484375, -0.1669921875, -0.1617584228515625, -0.156524658203125, -0.1512908935546875, -0.14605712890625, -0.1408233642578125, -0.135589599609375, -0.1303558349609375, -0.1251220703125, -0.1198883056640625, -0.114654541015625, -0.1094207763671875, -0.10418701171875, -0.0989532470703125, -0.093719482421875, -0.0884857177734375, -0.083251953125, -0.0780181884765625, -0.072784423828125, -0.0675506591796875, -0.06231689453125, -0.0570831298828125, -0.051849365234375, -0.0466156005859375, -0.0413818359375, -0.0361480712890625, -0.030914306640625, -0.0256805419921875, -0.02044677734375, -0.0152130126953125, -0.009979248046875, -0.0047454833984375, 0.00048828125, 0.0057220458984375, 0.010955810546875, 0.0161895751953125, 0.02142333984375, 0.0266571044921875, 0.031890869140625, 0.0371246337890625, 0.0423583984375, 0.0475921630859375, 0.052825927734375, 0.0580596923828125, 0.06329345703125, 0.0685272216796875, 0.073760986328125, 0.0789947509765625, 0.084228515625, 0.0894622802734375, 0.094696044921875, 0.0999298095703125, 0.10516357421875, 0.1103973388671875, 0.115631103515625, 0.1208648681640625, 0.1260986328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 3.0, 12.0, 15.0, 26.0, 21.0, 40.0, 61.0, 102.0, 101.0, 150.0, 158.0, 82.0, 85.0, 42.0, 22.0, 20.0, 7.0, 10.0, 6.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0626220703125, -0.06041908264160156, -0.058216094970703125, -0.05601310729980469, -0.05381011962890625, -0.05160713195800781, -0.049404144287109375, -0.04720115661621094, -0.0449981689453125, -0.04279518127441406, -0.040592193603515625, -0.03838920593261719, -0.03618621826171875, -0.03398323059082031, -0.031780242919921875, -0.029577255249023438, -0.027374267578125, -0.025171279907226562, -0.022968292236328125, -0.020765304565429688, -0.01856231689453125, -0.016359329223632812, -0.014156341552734375, -0.011953353881835938, -0.0097503662109375, -0.0075473785400390625, -0.005344390869140625, -0.0031414031982421875, -0.00093841552734375, 0.0012645721435546875, 0.003467559814453125, 0.0056705474853515625, 0.00787353515625, 0.010076522827148438, 0.012279510498046875, 0.014482498168945312, 0.01668548583984375, 0.018888473510742188, 0.021091461181640625, 0.023294448852539062, 0.0254974365234375, 0.027700424194335938, 0.029903411865234375, 0.03210639953613281, 0.03430938720703125, 0.03651237487792969, 0.038715362548828125, 0.04091835021972656, 0.043121337890625, 0.04532432556152344, 0.047527313232421875, 0.04973030090332031, 0.05193328857421875, 0.05413627624511719, 0.056339263916015625, 0.05854225158691406, 0.0607452392578125, 0.06294822692871094, 0.06515121459960938, 0.06735420227050781, 0.06955718994140625, 0.07176017761230469, 0.07396316528320312, 0.07616615295410156, 0.078369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 0.0, 8.0, 10.0, 16.0, 17.0, 38.0, 54.0, 125.0, 190.0, 200.0, 136.0, 77.0, 57.0, 32.0, 14.0, 12.0, 9.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.283629894256592, -3.2141385078430176, -3.1446471214294434, -3.07515549659729, -3.005664110183716, -2.9361727237701416, -2.8666810989379883, -2.797189712524414, -2.72769832611084, -2.6582069396972656, -2.5887155532836914, -2.519223928451538, -2.449732542037964, -2.3802411556243896, -2.3107495307922363, -2.241258144378662, -2.171766757965088, -2.1022753715515137, -2.0327839851379395, -1.9632923603057861, -1.893800973892212, -1.8243095874786377, -1.754818081855774, -1.6853265762329102, -1.615835189819336, -1.5463438034057617, -1.476852297782898, -1.4073607921600342, -1.33786940574646, -1.2683780193328857, -1.198886513710022, -1.1293950080871582, -1.0599033832550049, -0.9904119372367859, -0.9209204912185669, -0.8514290452003479, -0.7819375991821289, -0.7124461531639099, -0.6429547071456909, -0.5734632611274719, -0.5039718151092529, -0.43448036909103394, -0.36498892307281494, -0.29549747705459595, -0.22600603103637695, -0.15651458501815796, -0.08702313899993896, -0.01753169298171997, 0.05195975303649902, 0.12145119905471802, 0.190942645072937, 0.260434091091156, 0.329925537109375, 0.399416983127594, 0.468908429145813, 0.538399875164032, 0.607891321182251, 0.67738276720047, 0.746874213218689, 0.816365659236908, 0.885857105255127, 0.955348551273346, 1.024839997291565, 1.0943315029144287, 1.163822889328003]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 7.0, 11.0, 13.0, 13.0, 20.0, 17.0, 22.0, 36.0, 38.0, 32.0, 29.0, 51.0, 47.0, 46.0, 40.0, 47.0, 38.0, 50.0, 44.0, 53.0, 30.0, 35.0, 44.0, 39.0, 27.0, 28.0, 16.0, 29.0, 20.0, 14.0, 11.0, 2.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3882209062576294, -1.3489383459091187, -1.3096556663513184, -1.2703731060028076, -1.2310905456542969, -1.1918078660964966, -1.1525253057479858, -1.1132426261901855, -1.0739600658416748, -1.034677505493164, -0.9953948259353638, -0.956112265586853, -0.9168296456336975, -0.877547025680542, -0.8382644653320312, -0.7989818453788757, -0.7596992254257202, -0.7204166054725647, -0.6811339855194092, -0.6418514251708984, -0.6025688052177429, -0.5632861852645874, -0.5240036249160767, -0.48472100496292114, -0.4454383850097656, -0.4061557650566101, -0.366873174905777, -0.32759058475494385, -0.28830796480178833, -0.249025359749794, -0.20974275469779968, -0.17046016454696655, -0.13117754459381104, -0.09189493954181671, -0.05261233448982239, -0.013329729437828064, 0.02595287561416626, 0.06523548066616058, 0.10451808571815491, 0.14380067586898804, 0.18308329582214355, 0.22236590087413788, 0.2616485059261322, 0.30093109607696533, 0.34021371603012085, 0.37949633598327637, 0.4187789261341095, 0.4580615162849426, 0.49734413623809814, 0.5366267561912537, 0.5759093761444092, 0.6151919364929199, 0.6544745564460754, 0.693757176399231, 0.7330397367477417, 0.7723223567008972, 0.8116049766540527, 0.8508875966072083, 0.8901702165603638, 0.9294527769088745, 0.96873539686203, 1.0080180168151855, 1.0473005771636963, 1.086583137512207, 1.1258658170700073]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 25.0, 35.0, 45.0, 63.0, 92.0, 152.0, 230.0, 442.0, 959.0, 2669.0, 11402.0, 520328.0, 3621067.0, 29429.0, 4399.0, 1432.0, 581.0, 323.0, 203.0, 104.0, 69.0, 67.0, 50.0, 27.0, 17.0, 14.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9501953125, -1.8785247802734375, -1.806854248046875, -1.7351837158203125, -1.66351318359375, -1.5918426513671875, -1.520172119140625, -1.4485015869140625, -1.3768310546875, -1.3051605224609375, -1.233489990234375, -1.1618194580078125, -1.09014892578125, -1.0184783935546875, -0.946807861328125, -0.8751373291015625, -0.803466796875, -0.7317962646484375, -0.660125732421875, -0.5884552001953125, -0.51678466796875, -0.4451141357421875, -0.373443603515625, -0.3017730712890625, -0.2301025390625, -0.1584320068359375, -0.086761474609375, -0.0150909423828125, 0.05657958984375, 0.1282501220703125, 0.199920654296875, 0.2715911865234375, 0.34326171875, 0.4149322509765625, 0.486602783203125, 0.5582733154296875, 0.62994384765625, 0.7016143798828125, 0.773284912109375, 0.8449554443359375, 0.9166259765625, 0.9882965087890625, 1.059967041015625, 1.1316375732421875, 1.20330810546875, 1.2749786376953125, 1.346649169921875, 1.4183197021484375, 1.489990234375, 1.5616607666015625, 1.633331298828125, 1.7050018310546875, 1.77667236328125, 1.8483428955078125, 1.920013427734375, 1.9916839599609375, 2.0633544921875, 2.1350250244140625, 2.206695556640625, 2.2783660888671875, 2.35003662109375, 2.4217071533203125, 2.493377685546875, 2.5650482177734375, 2.63671875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 5.0, 10.0, 13.0, 13.0, 11.0, 21.0, 17.0, 26.0, 30.0, 44.0, 40.0, 49.0, 57.0, 67.0, 56.0, 57.0, 55.0, 74.0, 62.0, 45.0, 53.0, 39.0, 32.0, 27.0, 17.0, 18.0, 13.0, 11.0, 4.0, 11.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5053939819335938, -0.4863739013671875, -0.46735382080078125, -0.448333740234375, -0.42931365966796875, -0.4102935791015625, -0.39127349853515625, -0.37225341796875, -0.35323333740234375, -0.3342132568359375, -0.31519317626953125, -0.296173095703125, -0.27715301513671875, -0.2581329345703125, -0.23911285400390625, -0.2200927734375, -0.20107269287109375, -0.1820526123046875, -0.16303253173828125, -0.144012451171875, -0.12499237060546875, -0.1059722900390625, -0.08695220947265625, -0.06793212890625, -0.04891204833984375, -0.0298919677734375, -0.01087188720703125, 0.008148193359375, 0.02716827392578125, 0.0461883544921875, 0.06520843505859375, 0.084228515625, 0.10324859619140625, 0.1222686767578125, 0.14128875732421875, 0.160308837890625, 0.17932891845703125, 0.1983489990234375, 0.21736907958984375, 0.23638916015625, 0.25540924072265625, 0.2744293212890625, 0.29344940185546875, 0.312469482421875, 0.33148956298828125, 0.3505096435546875, 0.36952972412109375, 0.3885498046875, 0.40756988525390625, 0.4265899658203125, 0.44561004638671875, 0.464630126953125, 0.48365020751953125, 0.5026702880859375, 0.5216903686523438, 0.54071044921875, 0.5597305297851562, 0.5787506103515625, 0.5977706909179688, 0.616790771484375, 0.6358108520507812, 0.6548309326171875, 0.6738510131835938, 0.69287109375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 10.0, 3.0, 8.0, 16.0, 20.0, 40.0, 43.0, 78.0, 121.0, 187.0, 325.0, 636.0, 1334.0, 3130.0, 8630.0, 34577.0, 472973.0, 3553691.0, 93208.0, 16378.0, 5064.0, 1854.0, 861.0, 447.0, 247.0, 121.0, 88.0, 58.0, 45.0, 30.0, 13.0, 10.0, 5.0, 5.0, 8.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9052734375, -0.87322998046875, -0.8411865234375, -0.80914306640625, -0.777099609375, -0.74505615234375, -0.7130126953125, -0.68096923828125, -0.64892578125, -0.61688232421875, -0.5848388671875, -0.55279541015625, -0.520751953125, -0.48870849609375, -0.4566650390625, -0.42462158203125, -0.392578125, -0.36053466796875, -0.3284912109375, -0.29644775390625, -0.264404296875, -0.23236083984375, -0.2003173828125, -0.16827392578125, -0.13623046875, -0.10418701171875, -0.0721435546875, -0.04010009765625, -0.008056640625, 0.02398681640625, 0.0560302734375, 0.08807373046875, 0.1201171875, 0.15216064453125, 0.1842041015625, 0.21624755859375, 0.248291015625, 0.28033447265625, 0.3123779296875, 0.34442138671875, 0.37646484375, 0.40850830078125, 0.4405517578125, 0.47259521484375, 0.504638671875, 0.53668212890625, 0.5687255859375, 0.60076904296875, 0.6328125, 0.66485595703125, 0.6968994140625, 0.72894287109375, 0.760986328125, 0.79302978515625, 0.8250732421875, 0.85711669921875, 0.88916015625, 0.92120361328125, 0.9532470703125, 0.98529052734375, 1.017333984375, 1.04937744140625, 1.0814208984375, 1.11346435546875, 1.1455078125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 11.0, 16.0, 18.0, 28.0, 45.0, 62.0, 123.0, 277.0, 651.0, 1252.0, 824.0, 352.0, 162.0, 86.0, 56.0, 27.0, 22.0, 10.0, 12.0, 11.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2750701904296875, -0.264739990234375, -0.2544097900390625, -0.24407958984375, -0.2337493896484375, -0.223419189453125, -0.2130889892578125, -0.2027587890625, -0.1924285888671875, -0.182098388671875, -0.1717681884765625, -0.16143798828125, -0.1511077880859375, -0.140777587890625, -0.1304473876953125, -0.1201171875, -0.1097869873046875, -0.099456787109375, -0.0891265869140625, -0.07879638671875, -0.0684661865234375, -0.058135986328125, -0.0478057861328125, -0.0374755859375, -0.0271453857421875, -0.016815185546875, -0.0064849853515625, 0.00384521484375, 0.0141754150390625, 0.024505615234375, 0.0348358154296875, 0.045166015625, 0.0554962158203125, 0.065826416015625, 0.0761566162109375, 0.08648681640625, 0.0968170166015625, 0.107147216796875, 0.1174774169921875, 0.1278076171875, 0.1381378173828125, 0.148468017578125, 0.1587982177734375, 0.16912841796875, 0.1794586181640625, 0.189788818359375, 0.2001190185546875, 0.21044921875, 0.2207794189453125, 0.231109619140625, 0.2414398193359375, 0.25177001953125, 0.2621002197265625, 0.272430419921875, 0.2827606201171875, 0.2930908203125, 0.3034210205078125, 0.313751220703125, 0.3240814208984375, 0.33441162109375, 0.3447418212890625, 0.355072021484375, 0.3654022216796875, 0.375732421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 13.0, 21.0, 32.0, 44.0, 51.0, 70.0, 98.0, 116.0, 114.0, 113.0, 84.0, 45.0, 38.0, 32.0, 24.0, 23.0, 12.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154934048652649, -1.1261039972305298, -1.097273826599121, -1.068443775177002, -1.0396137237548828, -1.0107836723327637, -0.981953501701355, -0.9531234502792358, -0.9242933988571167, -0.8954632878303528, -0.8666332364082336, -0.8378031253814697, -0.8089730739593506, -0.7801429629325867, -0.7513128519058228, -0.7224828004837036, -0.6936526894569397, -0.6648225784301758, -0.6359925270080566, -0.6071624159812927, -0.5783323645591736, -0.5495022535324097, -0.5206722021102905, -0.4918420910835266, -0.4630120098590851, -0.43418192863464355, -0.405351847410202, -0.3765217661857605, -0.3476916551589966, -0.31886160373687744, -0.2900314927101135, -0.261201411485672, -0.23237133026123047, -0.20354124903678894, -0.1747111678123474, -0.1458810716867447, -0.11705099046230316, -0.08822090923786163, -0.05939081311225891, -0.030560731887817383, -0.0017306506633758545, 0.027099434286355972, 0.0559295192360878, 0.08475960791110992, 0.11358968913555145, 0.14241977035999298, 0.1712498664855957, 0.20007994771003723, 0.22891002893447876, 0.2577401101589203, 0.2865701913833618, 0.31540030241012573, 0.3442303538322449, 0.3730604648590088, 0.4018905460834503, 0.43072062730789185, 0.4595507085323334, 0.4883807897567749, 0.5172109007835388, 0.546040952205658, 0.5748710632324219, 0.603701114654541, 0.6325312256813049, 0.6613613367080688, 0.690191388130188]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 21.0, 17.0, 23.0, 28.0, 38.0, 41.0, 47.0, 42.0, 50.0, 52.0, 44.0, 54.0, 59.0, 59.0, 64.0, 63.0, 44.0, 37.0, 36.0, 40.0, 24.0, 21.0, 17.0, 10.0, 14.0, 7.0, 10.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6195239424705505, -0.5981258153915405, -0.5767276287078857, -0.5553295016288757, -0.5339313745498657, -0.5125331878662109, -0.4911350607872009, -0.46973690390586853, -0.44833874702453613, -0.42694059014320374, -0.40554243326187134, -0.38414430618286133, -0.36274614930152893, -0.34134799242019653, -0.3199498653411865, -0.2985517084598541, -0.27715355157852173, -0.25575539469718933, -0.23435725271701813, -0.21295911073684692, -0.19156095385551453, -0.17016279697418213, -0.14876465499401093, -0.12736651301383972, -0.10596835613250732, -0.08457020670175552, -0.06317205727100372, -0.04177390784025192, -0.020375758409500122, 0.0010223910212516785, 0.02242054045200348, 0.04381868243217468, 0.0652167797088623, 0.0866149291396141, 0.1080130785703659, 0.1294112205505371, 0.1508093774318695, 0.1722075343132019, 0.1936056762933731, 0.2150038182735443, 0.2364019751548767, 0.2578001320362091, 0.2791982889175415, 0.3005964159965515, 0.3219945728778839, 0.3433927297592163, 0.3647908568382263, 0.3861890137195587, 0.4075871706008911, 0.4289853274822235, 0.4503834843635559, 0.4717816114425659, 0.4931797683238983, 0.5145779252052307, 0.5359760522842407, 0.5573742389678955, 0.5787723660469055, 0.6001704931259155, 0.6215686798095703, 0.6429668068885803, 0.6643649339675903, 0.6857631206512451, 0.7071612477302551, 0.7285593748092651, 0.7499575614929199]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 5.0, 16.0, 38.0, 30.0, 77.0, 140.0, 276.0, 564.0, 1108.0, 2955.0, 11651.0, 108605.0, 829282.0, 79221.0, 9899.0, 2617.0, 1046.0, 454.0, 235.0, 132.0, 82.0, 47.0, 30.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28537750244140625, -0.2753448486328125, -0.26531219482421875, -0.255279541015625, -0.24524688720703125, -0.2352142333984375, -0.22518157958984375, -0.21514892578125, -0.20511627197265625, -0.1950836181640625, -0.18505096435546875, -0.175018310546875, -0.16498565673828125, -0.1549530029296875, -0.14492034912109375, -0.1348876953125, -0.12485504150390625, -0.1148223876953125, -0.10478973388671875, -0.094757080078125, -0.08472442626953125, -0.0746917724609375, -0.06465911865234375, -0.05462646484375, -0.04459381103515625, -0.0345611572265625, -0.02452850341796875, -0.014495849609375, -0.00446319580078125, 0.0055694580078125, 0.01560211181640625, 0.025634765625, 0.03566741943359375, 0.0457000732421875, 0.05573272705078125, 0.065765380859375, 0.07579803466796875, 0.0858306884765625, 0.09586334228515625, 0.10589599609375, 0.11592864990234375, 0.1259613037109375, 0.13599395751953125, 0.146026611328125, 0.15605926513671875, 0.1660919189453125, 0.17612457275390625, 0.1861572265625, 0.19618988037109375, 0.2062225341796875, 0.21625518798828125, 0.226287841796875, 0.23632049560546875, 0.2463531494140625, 0.25638580322265625, 0.26641845703125, 0.27645111083984375, 0.2864837646484375, 0.29651641845703125, 0.306549072265625, 0.31658172607421875, 0.3266143798828125, 0.33664703369140625, 0.3466796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 18.0, 18.0, 34.0, 36.0, 51.0, 39.0, 48.0, 66.0, 41.0, 50.0, 70.0, 59.0, 59.0, 61.0, 63.0, 42.0, 41.0, 18.0, 36.0, 25.0, 15.0, 14.0, 15.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33837890625, -0.32334136962890625, -0.3083038330078125, -0.29326629638671875, -0.278228759765625, -0.26319122314453125, -0.2481536865234375, -0.23311614990234375, -0.21807861328125, -0.20304107666015625, -0.1880035400390625, -0.17296600341796875, -0.157928466796875, -0.14289093017578125, -0.1278533935546875, -0.11281585693359375, -0.0977783203125, -0.08274078369140625, -0.0677032470703125, -0.05266571044921875, -0.037628173828125, -0.02259063720703125, -0.0075531005859375, 0.00748443603515625, 0.02252197265625, 0.03755950927734375, 0.0525970458984375, 0.06763458251953125, 0.082672119140625, 0.09770965576171875, 0.1127471923828125, 0.12778472900390625, 0.142822265625, 0.15785980224609375, 0.1728973388671875, 0.18793487548828125, 0.202972412109375, 0.21800994873046875, 0.2330474853515625, 0.24808502197265625, 0.26312255859375, 0.27816009521484375, 0.2931976318359375, 0.30823516845703125, 0.323272705078125, 0.33831024169921875, 0.3533477783203125, 0.36838531494140625, 0.3834228515625, 0.39846038818359375, 0.4134979248046875, 0.42853546142578125, 0.443572998046875, 0.45861053466796875, 0.4736480712890625, 0.48868560791015625, 0.50372314453125, 0.5187606811523438, 0.5337982177734375, 0.5488357543945312, 0.563873291015625, 0.5789108276367188, 0.5939483642578125, 0.6089859008789062, 0.6240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 14.0, 7.0, 20.0, 34.0, 31.0, 52.0, 69.0, 114.0, 165.0, 223.0, 330.0, 543.0, 857.0, 1602.0, 2995.0, 6646.0, 15998.0, 46093.0, 180777.0, 517453.0, 194433.0, 49235.0, 16777.0, 6739.0, 3115.0, 1638.0, 894.0, 533.0, 344.0, 241.0, 135.0, 121.0, 83.0, 65.0, 35.0, 28.0, 25.0, 22.0, 13.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1170654296875, -0.11322975158691406, -0.10939407348632812, -0.10555839538574219, -0.10172271728515625, -0.09788703918457031, -0.09405136108398438, -0.09021568298339844, -0.0863800048828125, -0.08254432678222656, -0.07870864868164062, -0.07487297058105469, -0.07103729248046875, -0.06720161437988281, -0.06336593627929688, -0.05953025817871094, -0.055694580078125, -0.05185890197753906, -0.048023223876953125, -0.04418754577636719, -0.04035186767578125, -0.03651618957519531, -0.032680511474609375, -0.028844833374023438, -0.0250091552734375, -0.021173477172851562, -0.017337799072265625, -0.013502120971679688, -0.00966644287109375, -0.0058307647705078125, -0.001995086669921875, 0.0018405914306640625, 0.00567626953125, 0.009511947631835938, 0.013347625732421875, 0.017183303833007812, 0.02101898193359375, 0.024854660034179688, 0.028690338134765625, 0.03252601623535156, 0.0363616943359375, 0.04019737243652344, 0.044033050537109375, 0.04786872863769531, 0.05170440673828125, 0.05554008483886719, 0.059375762939453125, 0.06321144104003906, 0.067047119140625, 0.07088279724121094, 0.07471847534179688, 0.07855415344238281, 0.08238983154296875, 0.08622550964355469, 0.09006118774414062, 0.09389686584472656, 0.0977325439453125, 0.10156822204589844, 0.10540390014648438, 0.10923957824707031, 0.11307525634765625, 0.11691093444824219, 0.12074661254882812, 0.12458229064941406, 0.12841796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 2.0, 4.0, 4.0, 10.0, 3.0, 12.0, 11.0, 6.0, 15.0, 24.0, 8.0, 19.0, 28.0, 21.0, 30.0, 34.0, 35.0, 34.0, 42.0, 38.0, 52.0, 48.0, 42.0, 48.0, 55.0, 50.0, 39.0, 32.0, 36.0, 43.0, 17.0, 26.0, 20.0, 10.0, 23.0, 13.0, 14.0, 3.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61767578125, -0.5970077514648438, -0.5763397216796875, -0.5556716918945312, -0.535003662109375, -0.5143356323242188, -0.4936676025390625, -0.47299957275390625, -0.45233154296875, -0.43166351318359375, -0.4109954833984375, -0.39032745361328125, -0.369659423828125, -0.34899139404296875, -0.3283233642578125, -0.30765533447265625, -0.2869873046875, -0.26631927490234375, -0.2456512451171875, -0.22498321533203125, -0.204315185546875, -0.18364715576171875, -0.1629791259765625, -0.14231109619140625, -0.12164306640625, -0.10097503662109375, -0.0803070068359375, -0.05963897705078125, -0.038970947265625, -0.01830291748046875, 0.0023651123046875, 0.02303314208984375, 0.043701171875, 0.06436920166015625, 0.0850372314453125, 0.10570526123046875, 0.126373291015625, 0.14704132080078125, 0.1677093505859375, 0.18837738037109375, 0.20904541015625, 0.22971343994140625, 0.2503814697265625, 0.27104949951171875, 0.291717529296875, 0.31238555908203125, 0.3330535888671875, 0.35372161865234375, 0.3743896484375, 0.39505767822265625, 0.4157257080078125, 0.43639373779296875, 0.457061767578125, 0.47772979736328125, 0.4983978271484375, 0.5190658569335938, 0.53973388671875, 0.5604019165039062, 0.5810699462890625, 0.6017379760742188, 0.622406005859375, 0.6430740356445312, 0.6637420654296875, 0.6844100952148438, 0.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 11.0, 9.0, 17.0, 39.0, 59.0, 106.0, 179.0, 277.0, 538.0, 1002.0, 1874.0, 4064.0, 9535.0, 27572.0, 107252.0, 521443.0, 287043.0, 57247.0, 17446.0, 6675.0, 2976.0, 1420.0, 738.0, 453.0, 195.0, 125.0, 92.0, 56.0, 30.0, 28.0, 10.0, 8.0, 8.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04376220703125, -0.04229307174682617, -0.040823936462402344, -0.039354801177978516, -0.03788566589355469, -0.03641653060913086, -0.03494739532470703, -0.0334782600402832, -0.032009124755859375, -0.030539989471435547, -0.02907085418701172, -0.02760171890258789, -0.026132583618164062, -0.024663448333740234, -0.023194313049316406, -0.021725177764892578, -0.02025604248046875, -0.018786907196044922, -0.017317771911621094, -0.015848636627197266, -0.014379501342773438, -0.01291036605834961, -0.011441230773925781, -0.009972095489501953, -0.008502960205078125, -0.007033824920654297, -0.005564689636230469, -0.004095554351806641, -0.0026264190673828125, -0.0011572837829589844, 0.00031185150146484375, 0.0017809867858886719, 0.0032501220703125, 0.004719257354736328, 0.006188392639160156, 0.007657527923583984, 0.009126663208007812, 0.01059579849243164, 0.012064933776855469, 0.013534069061279297, 0.015003204345703125, 0.016472339630126953, 0.01794147491455078, 0.01941061019897461, 0.020879745483398438, 0.022348880767822266, 0.023818016052246094, 0.025287151336669922, 0.02675628662109375, 0.028225421905517578, 0.029694557189941406, 0.031163692474365234, 0.03263282775878906, 0.03410196304321289, 0.03557109832763672, 0.03704023361206055, 0.038509368896484375, 0.0399785041809082, 0.04144763946533203, 0.04291677474975586, 0.04438591003417969, 0.045855045318603516, 0.047324180603027344, 0.04879331588745117, 0.050262451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 13.0, 18.0, 16.0, 19.0, 27.0, 48.0, 75.0, 99.0, 143.0, 152.0, 126.0, 78.0, 67.0, 33.0, 15.0, 10.0, 11.0, 17.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.707408905029297e-05, -3.601983189582825e-05, -3.4965574741363525e-05, -3.3911317586898804e-05, -3.285706043243408e-05, -3.180280327796936e-05, -3.074854612350464e-05, -2.9694288969039917e-05, -2.8640031814575195e-05, -2.7585774660110474e-05, -2.6531517505645752e-05, -2.547726035118103e-05, -2.442300319671631e-05, -2.3368746042251587e-05, -2.2314488887786865e-05, -2.1260231733322144e-05, -2.0205974578857422e-05, -1.91517174243927e-05, -1.809746026992798e-05, -1.7043203115463257e-05, -1.5988945960998535e-05, -1.4934688806533813e-05, -1.3880431652069092e-05, -1.282617449760437e-05, -1.1771917343139648e-05, -1.0717660188674927e-05, -9.663403034210205e-06, -8.609145879745483e-06, -7.554888725280762e-06, -6.50063157081604e-06, -5.446374416351318e-06, -4.392117261886597e-06, -3.337860107421875e-06, -2.2836029529571533e-06, -1.2293457984924316e-06, -1.7508864402770996e-07, 8.791685104370117e-07, 1.9334256649017334e-06, 2.987682819366455e-06, 4.041939973831177e-06, 5.0961971282958984e-06, 6.15045428276062e-06, 7.204711437225342e-06, 8.258968591690063e-06, 9.313225746154785e-06, 1.0367482900619507e-05, 1.1421740055084229e-05, 1.247599720954895e-05, 1.3530254364013672e-05, 1.4584511518478394e-05, 1.5638768672943115e-05, 1.6693025827407837e-05, 1.774728298187256e-05, 1.880154013633728e-05, 1.9855797290802002e-05, 2.0910054445266724e-05, 2.1964311599731445e-05, 2.3018568754196167e-05, 2.407282590866089e-05, 2.512708306312561e-05, 2.6181340217590332e-05, 2.7235597372055054e-05, 2.8289854526519775e-05, 2.9344111680984497e-05, 3.039836883544922e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 9.0, 12.0, 28.0, 30.0, 59.0, 93.0, 123.0, 249.0, 433.0, 760.0, 1374.0, 2689.0, 5246.0, 11301.0, 26458.0, 69848.0, 210543.0, 415106.0, 194319.0, 64238.0, 24427.0, 10600.0, 5002.0, 2455.0, 1350.0, 769.0, 386.0, 245.0, 141.0, 80.0, 58.0, 40.0, 22.0, 15.0, 14.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290985107421875, -0.02817368507385254, -0.027248859405517578, -0.026324033737182617, -0.025399208068847656, -0.024474382400512695, -0.023549556732177734, -0.022624731063842773, -0.021699905395507812, -0.02077507972717285, -0.01985025405883789, -0.01892542839050293, -0.01800060272216797, -0.017075777053833008, -0.016150951385498047, -0.015226125717163086, -0.014301300048828125, -0.013376474380493164, -0.012451648712158203, -0.011526823043823242, -0.010601997375488281, -0.00967717170715332, -0.00875234603881836, -0.007827520370483398, -0.0069026947021484375, -0.0059778690338134766, -0.005053043365478516, -0.004128217697143555, -0.0032033920288085938, -0.002278566360473633, -0.0013537406921386719, -0.00042891502380371094, 0.00049591064453125, 0.001420736312866211, 0.002345561981201172, 0.003270387649536133, 0.004195213317871094, 0.005120038986206055, 0.006044864654541016, 0.0069696903228759766, 0.007894515991210938, 0.008819341659545898, 0.00974416732788086, 0.01066899299621582, 0.011593818664550781, 0.012518644332885742, 0.013443470001220703, 0.014368295669555664, 0.015293121337890625, 0.016217947006225586, 0.017142772674560547, 0.018067598342895508, 0.01899242401123047, 0.01991724967956543, 0.02084207534790039, 0.02176690101623535, 0.022691726684570312, 0.023616552352905273, 0.024541378021240234, 0.025466203689575195, 0.026391029357910156, 0.027315855026245117, 0.028240680694580078, 0.02916550636291504, 0.03009033203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 10.0, 17.0, 9.0, 13.0, 13.0, 15.0, 21.0, 29.0, 24.0, 38.0, 56.0, 49.0, 53.0, 64.0, 57.0, 71.0, 60.0, 54.0, 59.0, 51.0, 47.0, 33.0, 35.0, 17.0, 21.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00872039794921875, -0.008465349674224854, -0.008210301399230957, -0.00795525312423706, -0.007700204849243164, -0.007445156574249268, -0.007190108299255371, -0.006935060024261475, -0.006680011749267578, -0.006424963474273682, -0.006169915199279785, -0.005914866924285889, -0.005659818649291992, -0.005404770374298096, -0.005149722099304199, -0.004894673824310303, -0.004639625549316406, -0.00438457727432251, -0.004129528999328613, -0.003874480724334717, -0.0036194324493408203, -0.003364384174346924, -0.0031093358993530273, -0.002854287624359131, -0.0025992393493652344, -0.002344191074371338, -0.0020891427993774414, -0.001834094524383545, -0.0015790462493896484, -0.001323997974395752, -0.0010689496994018555, -0.000813901424407959, -0.0005588531494140625, -0.000303804874420166, -4.875659942626953e-05, 0.00020629167556762695, 0.00046133995056152344, 0.0007163882255554199, 0.0009714365005493164, 0.0012264847755432129, 0.0014815330505371094, 0.0017365813255310059, 0.0019916296005249023, 0.002246677875518799, 0.0025017261505126953, 0.002756774425506592, 0.0030118227005004883, 0.0032668709754943848, 0.0035219192504882812, 0.0037769675254821777, 0.004032015800476074, 0.004287064075469971, 0.004542112350463867, 0.004797160625457764, 0.00505220890045166, 0.005307257175445557, 0.005562305450439453, 0.00581735372543335, 0.006072402000427246, 0.006327450275421143, 0.006582498550415039, 0.0068375468254089355, 0.007092595100402832, 0.0073476433753967285, 0.007602691650390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 20.0, 49.0, 109.0, 232.0, 313.0, 136.0, 61.0, 35.0, 12.0, 9.0, 11.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.4478647708892822, -2.401827335357666, -2.355790138244629, -2.3097527027130127, -2.2637152671813965, -2.2176780700683594, -2.171640634536743, -2.125603199005127, -2.07956600189209, -2.0335285663604736, -1.987491250038147, -1.9414539337158203, -1.895416498184204, -1.8493791818618774, -1.8033418655395508, -1.7573044300079346, -1.7112669944763184, -1.6652296781539917, -1.6191922426223755, -1.5731549263000488, -1.5271174907684326, -1.481080174446106, -1.4350428581237793, -1.389005422592163, -1.3429681062698364, -1.2969307899475098, -1.2508933544158936, -1.204856038093567, -1.1588187217712402, -1.112781286239624, -1.0667439699172974, -1.0207066535949707, -0.9746692180633545, -0.9286318421363831, -0.8825944662094116, -0.836557149887085, -0.7905197739601135, -0.7444823980331421, -0.6984450817108154, -0.652407705783844, -0.6063703298568726, -0.5603329539299011, -0.5142955780029297, -0.468258261680603, -0.4222208857536316, -0.37618350982666016, -0.3301461637020111, -0.28410881757736206, -0.238071471452713, -0.19203411042690277, -0.14599674940109253, -0.09995938837528229, -0.053922027349472046, -0.007884666323661804, 0.03815269470214844, 0.08419004082679749, 0.13022741675376892, 0.17626477777957916, 0.2223021388053894, 0.26833951473236084, 0.3143768608570099, 0.36041420698165894, 0.40645158290863037, 0.4524889290332794, 0.49852630496025085]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 6.0, 4.0, 13.0, 15.0, 21.0, 24.0, 29.0, 34.0, 44.0, 45.0, 53.0, 53.0, 51.0, 60.0, 56.0, 70.0, 78.0, 63.0, 55.0, 41.0, 43.0, 34.0, 25.0, 19.0, 20.0, 10.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42076849937438965, -0.4054759442806244, -0.39018338918685913, -0.37489083409309387, -0.3595982789993286, -0.34430569410324097, -0.3290131688117981, -0.31372058391571045, -0.2984280288219452, -0.28313547372817993, -0.2678429186344147, -0.2525503635406494, -0.23725779354572296, -0.2219652384519577, -0.20667268335819244, -0.191380113363266, -0.17608757317066193, -0.16079501807689667, -0.1455024629831314, -0.13020989298820496, -0.1149173378944397, -0.09962478280067444, -0.08433222770690918, -0.06903966516256332, -0.053747110068798065, -0.03845455124974251, -0.0231619942933321, -0.007869437336921692, 0.007423121482133865, 0.022715680301189423, 0.03800823539495468, 0.05330079793930054, 0.0685933530330658, 0.08388590812683105, 0.09917847067117691, 0.11447102576494217, 0.12976358830928802, 0.14505614340305328, 0.16034869849681854, 0.175641268491745, 0.19093382358551025, 0.2062263786792755, 0.22151893377304077, 0.23681148886680603, 0.2521040439605713, 0.26739662885665894, 0.2826891541481018, 0.29798173904418945, 0.3132742643356323, 0.3285668194293976, 0.34385937452316284, 0.3591519296169281, 0.37444448471069336, 0.389737069606781, 0.4050295948982239, 0.4203221797943115, 0.4356147348880768, 0.45090728998184204, 0.4661998450756073, 0.48149240016937256, 0.4967849552631378, 0.5120775103569031, 0.5273700952529907, 0.5426626205444336, 0.5579552054405212]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 11.0, 12.0, 20.0, 38.0, 71.0, 95.0, 188.0, 329.0, 586.0, 1222.0, 2534.0, 6624.0, 20019.0, 99461.0, 615374.0, 246921.0, 37295.0, 10243.0, 3977.0, 1683.0, 859.0, 397.0, 232.0, 120.0, 76.0, 44.0, 28.0, 24.0, 21.0, 12.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.3608131408691406, -0.34906768798828125, -0.3373222351074219, -0.3255767822265625, -0.3138313293457031, -0.30208587646484375, -0.2903404235839844, -0.278594970703125, -0.2668495178222656, -0.25510406494140625, -0.24335861206054688, -0.2316131591796875, -0.21986770629882812, -0.20812225341796875, -0.19637680053710938, -0.18463134765625, -0.17288589477539062, -0.16114044189453125, -0.14939498901367188, -0.1376495361328125, -0.12590408325195312, -0.11415863037109375, -0.10241317749023438, -0.090667724609375, -0.07892227172851562, -0.06717681884765625, -0.055431365966796875, -0.0436859130859375, -0.031940460205078125, -0.02019500732421875, -0.008449554443359375, 0.0032958984375, 0.015041351318359375, 0.02678680419921875, 0.038532257080078125, 0.0502777099609375, 0.062023162841796875, 0.07376861572265625, 0.08551406860351562, 0.097259521484375, 0.10900497436523438, 0.12075042724609375, 0.13249588012695312, 0.1442413330078125, 0.15598678588867188, 0.16773223876953125, 0.17947769165039062, 0.19122314453125, 0.20296859741210938, 0.21471405029296875, 0.22645950317382812, 0.2382049560546875, 0.24995040893554688, 0.26169586181640625, 0.2734413146972656, 0.285186767578125, 0.2969322204589844, 0.30867767333984375, 0.3204231262207031, 0.3321685791015625, 0.3439140319824219, 0.35565948486328125, 0.3674049377441406, 0.379150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 22.0, 30.0, 37.0, 40.0, 47.0, 60.0, 66.0, 69.0, 85.0, 80.0, 99.0, 85.0, 62.0, 49.0, 43.0, 36.0, 20.0, 15.0, 10.0, 11.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9449996948242188, -0.9041595458984375, -0.8633193969726562, -0.822479248046875, -0.7816390991210938, -0.7407989501953125, -0.6999588012695312, -0.65911865234375, -0.6182785034179688, -0.5774383544921875, -0.5365982055664062, -0.495758056640625, -0.45491790771484375, -0.4140777587890625, -0.37323760986328125, -0.3323974609375, -0.29155731201171875, -0.2507171630859375, -0.20987701416015625, -0.169036865234375, -0.12819671630859375, -0.0873565673828125, -0.04651641845703125, -0.00567626953125, 0.03516387939453125, 0.0760040283203125, 0.11684417724609375, 0.157684326171875, 0.19852447509765625, 0.2393646240234375, 0.28020477294921875, 0.321044921875, 0.36188507080078125, 0.4027252197265625, 0.44356536865234375, 0.484405517578125, 0.5252456665039062, 0.5660858154296875, 0.6069259643554688, 0.64776611328125, 0.6886062622070312, 0.7294464111328125, 0.7702865600585938, 0.811126708984375, 0.8519668579101562, 0.8928070068359375, 0.9336471557617188, 0.9744873046875, 1.0153274536132812, 1.0561676025390625, 1.0970077514648438, 1.137847900390625, 1.1786880493164062, 1.2195281982421875, 1.2603683471679688, 1.30120849609375, 1.3420486450195312, 1.3828887939453125, 1.4237289428710938, 1.464569091796875, 1.5054092407226562, 1.5462493896484375, 1.5870895385742188, 1.6279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 8.0, 13.0, 7.0, 18.0, 21.0, 27.0, 24.0, 40.0, 51.0, 70.0, 92.0, 111.0, 210.0, 450.0, 1397.0, 7774.0, 119225.0, 876392.0, 36915.0, 3872.0, 914.0, 314.0, 132.0, 94.0, 67.0, 60.0, 47.0, 43.0, 35.0, 25.0, 21.0, 17.0, 15.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6001434326171875, -0.579681396484375, -0.5592193603515625, -0.53875732421875, -0.5182952880859375, -0.497833251953125, -0.4773712158203125, -0.4569091796875, -0.4364471435546875, -0.415985107421875, -0.3955230712890625, -0.37506103515625, -0.3545989990234375, -0.334136962890625, -0.3136749267578125, -0.293212890625, -0.2727508544921875, -0.252288818359375, -0.2318267822265625, -0.21136474609375, -0.1909027099609375, -0.170440673828125, -0.1499786376953125, -0.1295166015625, -0.1090545654296875, -0.088592529296875, -0.0681304931640625, -0.04766845703125, -0.0272064208984375, -0.006744384765625, 0.0137176513671875, 0.0341796875, 0.0546417236328125, 0.075103759765625, 0.0955657958984375, 0.11602783203125, 0.1364898681640625, 0.156951904296875, 0.1774139404296875, 0.1978759765625, 0.2183380126953125, 0.238800048828125, 0.2592620849609375, 0.27972412109375, 0.3001861572265625, 0.320648193359375, 0.3411102294921875, 0.361572265625, 0.3820343017578125, 0.402496337890625, 0.4229583740234375, 0.44342041015625, 0.4638824462890625, 0.484344482421875, 0.5048065185546875, 0.5252685546875, 0.5457305908203125, 0.566192626953125, 0.5866546630859375, 0.60711669921875, 0.6275787353515625, 0.648040771484375, 0.6685028076171875, 0.68896484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 8.0, 9.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 25.0, 21.0, 35.0, 29.0, 44.0, 33.0, 44.0, 52.0, 44.0, 41.0, 40.0, 56.0, 51.0, 46.0, 30.0, 43.0, 28.0, 42.0, 33.0, 26.0, 32.0, 26.0, 17.0, 17.0, 10.0, 19.0, 10.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.7499008178710938, -0.7239227294921875, -0.6979446411132812, -0.671966552734375, -0.6459884643554688, -0.6200103759765625, -0.5940322875976562, -0.56805419921875, -0.5420761108398438, -0.5160980224609375, -0.49011993408203125, -0.464141845703125, -0.43816375732421875, -0.4121856689453125, -0.38620758056640625, -0.3602294921875, -0.33425140380859375, -0.3082733154296875, -0.28229522705078125, -0.256317138671875, -0.23033905029296875, -0.2043609619140625, -0.17838287353515625, -0.15240478515625, -0.12642669677734375, -0.1004486083984375, -0.07447052001953125, -0.048492431640625, -0.02251434326171875, 0.0034637451171875, 0.02944183349609375, 0.055419921875, 0.08139801025390625, 0.1073760986328125, 0.13335418701171875, 0.159332275390625, 0.18531036376953125, 0.2112884521484375, 0.23726654052734375, 0.26324462890625, 0.28922271728515625, 0.3152008056640625, 0.34117889404296875, 0.367156982421875, 0.39313507080078125, 0.4191131591796875, 0.44509124755859375, 0.4710693359375, 0.49704742431640625, 0.5230255126953125, 0.5490036010742188, 0.574981689453125, 0.6009597778320312, 0.6269378662109375, 0.6529159545898438, 0.67889404296875, 0.7048721313476562, 0.7308502197265625, 0.7568283081054688, 0.782806396484375, 0.8087844848632812, 0.8347625732421875, 0.8607406616210938, 0.88671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 14.0, 25.0, 48.0, 122.0, 254.0, 668.0, 2547.0, 15920.0, 552025.0, 458691.0, 14703.0, 2317.0, 653.0, 268.0, 106.0, 60.0, 33.0, 20.0, 8.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19370460510253906, -0.18562698364257812, -0.1775493621826172, -0.16947174072265625, -0.1613941192626953, -0.15331649780273438, -0.14523887634277344, -0.1371612548828125, -0.12908363342285156, -0.12100601196289062, -0.11292839050292969, -0.10485076904296875, -0.09677314758300781, -0.08869552612304688, -0.08061790466308594, -0.072540283203125, -0.06446266174316406, -0.056385040283203125, -0.04830741882324219, -0.04022979736328125, -0.03215217590332031, -0.024074554443359375, -0.015996932983398438, -0.0079193115234375, 0.0001583099365234375, 0.008235931396484375, 0.016313552856445312, 0.02439117431640625, 0.03246879577636719, 0.040546417236328125, 0.04862403869628906, 0.05670166015625, 0.06477928161621094, 0.07285690307617188, 0.08093452453613281, 0.08901214599609375, 0.09708976745605469, 0.10516738891601562, 0.11324501037597656, 0.1213226318359375, 0.12940025329589844, 0.13747787475585938, 0.1455554962158203, 0.15363311767578125, 0.1617107391357422, 0.16978836059570312, 0.17786598205566406, 0.185943603515625, 0.19402122497558594, 0.20209884643554688, 0.2101764678955078, 0.21825408935546875, 0.2263317108154297, 0.23440933227539062, 0.24248695373535156, 0.2505645751953125, 0.25864219665527344, 0.2667198181152344, 0.2747974395751953, 0.28287506103515625, 0.2909526824951172, 0.2990303039550781, 0.30710792541503906, 0.315185546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 10.0, 10.0, 14.0, 22.0, 33.0, 45.0, 49.0, 81.0, 113.0, 150.0, 125.0, 118.0, 45.0, 54.0, 37.0, 19.0, 21.0, 5.0, 15.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6941299438476562e-05, -2.629496157169342e-05, -2.564862370491028e-05, -2.5002285838127136e-05, -2.4355947971343994e-05, -2.3709610104560852e-05, -2.306327223777771e-05, -2.2416934370994568e-05, -2.1770596504211426e-05, -2.1124258637428284e-05, -2.047792077064514e-05, -1.9831582903862e-05, -1.9185245037078857e-05, -1.8538907170295715e-05, -1.7892569303512573e-05, -1.724623143672943e-05, -1.659989356994629e-05, -1.5953555703163147e-05, -1.5307217836380005e-05, -1.4660879969596863e-05, -1.401454210281372e-05, -1.3368204236030579e-05, -1.2721866369247437e-05, -1.2075528502464294e-05, -1.1429190635681152e-05, -1.078285276889801e-05, -1.0136514902114868e-05, -9.490177035331726e-06, -8.843839168548584e-06, -8.197501301765442e-06, -7.5511634349823e-06, -6.904825568199158e-06, -6.258487701416016e-06, -5.6121498346328735e-06, -4.9658119678497314e-06, -4.319474101066589e-06, -3.6731362342834473e-06, -3.026798367500305e-06, -2.380460500717163e-06, -1.734122633934021e-06, -1.087784767150879e-06, -4.414469003677368e-07, 2.0489096641540527e-07, 8.512288331985474e-07, 1.4975666999816895e-06, 2.1439045667648315e-06, 2.7902424335479736e-06, 3.4365803003311157e-06, 4.082918167114258e-06, 4.7292560338974e-06, 5.375593900680542e-06, 6.021931767463684e-06, 6.668269634246826e-06, 7.314607501029968e-06, 7.96094536781311e-06, 8.607283234596252e-06, 9.253621101379395e-06, 9.899958968162537e-06, 1.0546296834945679e-05, 1.119263470172882e-05, 1.1838972568511963e-05, 1.2485310435295105e-05, 1.3131648302078247e-05, 1.377798616886139e-05, 1.4424324035644531e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 13.0, 17.0, 23.0, 24.0, 69.0, 67.0, 108.0, 192.0, 309.0, 597.0, 1224.0, 3398.0, 13280.0, 102916.0, 828731.0, 80614.0, 11268.0, 3184.0, 1208.0, 520.0, 278.0, 177.0, 109.0, 72.0, 47.0, 33.0, 23.0, 18.0, 6.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.241455078125, -0.23500823974609375, -0.2285614013671875, -0.22211456298828125, -0.215667724609375, -0.20922088623046875, -0.2027740478515625, -0.19632720947265625, -0.18988037109375, -0.18343353271484375, -0.1769866943359375, -0.17053985595703125, -0.164093017578125, -0.15764617919921875, -0.1511993408203125, -0.14475250244140625, -0.1383056640625, -0.13185882568359375, -0.1254119873046875, -0.11896514892578125, -0.112518310546875, -0.10607147216796875, -0.0996246337890625, -0.09317779541015625, -0.08673095703125, -0.08028411865234375, -0.0738372802734375, -0.06739044189453125, -0.060943603515625, -0.05449676513671875, -0.0480499267578125, -0.04160308837890625, -0.03515625, -0.02870941162109375, -0.0222625732421875, -0.01581573486328125, -0.009368896484375, -0.00292205810546875, 0.0035247802734375, 0.00997161865234375, 0.01641845703125, 0.02286529541015625, 0.0293121337890625, 0.03575897216796875, 0.042205810546875, 0.04865264892578125, 0.0550994873046875, 0.06154632568359375, 0.0679931640625, 0.07444000244140625, 0.0808868408203125, 0.08733367919921875, 0.093780517578125, 0.10022735595703125, 0.1066741943359375, 0.11312103271484375, 0.11956787109375, 0.12601470947265625, 0.1324615478515625, 0.13890838623046875, 0.145355224609375, 0.15180206298828125, 0.1582489013671875, 0.16469573974609375, 0.171142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 10.0, 11.0, 17.0, 23.0, 16.0, 59.0, 52.0, 100.0, 150.0, 157.0, 113.0, 102.0, 51.0, 42.0, 29.0, 23.0, 14.0, 4.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533336639404297, -0.06285667419433594, -0.060379981994628906, -0.057903289794921875, -0.055426597595214844, -0.05294990539550781, -0.05047321319580078, -0.04799652099609375, -0.04551982879638672, -0.04304313659667969, -0.040566444396972656, -0.038089752197265625, -0.035613059997558594, -0.03313636779785156, -0.03065967559814453, -0.0281829833984375, -0.02570629119873047, -0.023229598999023438, -0.020752906799316406, -0.018276214599609375, -0.015799522399902344, -0.013322830200195312, -0.010846138000488281, -0.00836944580078125, -0.005892753601074219, -0.0034160614013671875, -0.0009393692016601562, 0.001537322998046875, 0.004014015197753906, 0.0064907073974609375, 0.008967399597167969, 0.011444091796875, 0.013920783996582031, 0.016397476196289062, 0.018874168395996094, 0.021350860595703125, 0.023827552795410156, 0.026304244995117188, 0.02878093719482422, 0.03125762939453125, 0.03373432159423828, 0.03621101379394531, 0.038687705993652344, 0.041164398193359375, 0.043641090393066406, 0.04611778259277344, 0.04859447479248047, 0.0510711669921875, 0.05354785919189453, 0.05602455139160156, 0.058501243591308594, 0.060977935791015625, 0.06345462799072266, 0.06593132019042969, 0.06840801239013672, 0.07088470458984375, 0.07336139678955078, 0.07583808898925781, 0.07831478118896484, 0.08079147338867188, 0.0832681655883789, 0.08574485778808594, 0.08822154998779297, 0.0906982421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 19.0, 40.0, 84.0, 125.0, 238.0, 241.0, 105.0, 54.0, 27.0, 16.0, 13.0, 7.0, 9.0, 5.0, 1.0, 1.0, 3.0], "bins": [-3.7459495067596436, -3.673616886138916, -3.6012845039367676, -3.52895188331604, -3.4566192626953125, -3.384286880493164, -3.3119542598724365, -3.239621639251709, -3.1672892570495605, -3.094956636428833, -3.0226242542266846, -2.950291633605957, -2.8779590129852295, -2.805626392364502, -2.7332940101623535, -2.660961389541626, -2.5886287689208984, -2.516296148300171, -2.4439637660980225, -2.371631145477295, -2.2992985248565674, -2.22696590423584, -2.1546335220336914, -2.082300901412964, -2.0099682807922363, -1.9376357793807983, -1.8653031587600708, -1.7929706573486328, -1.7206380367279053, -1.6483055353164673, -1.5759730339050293, -1.5036404132843018, -1.4313082695007324, -1.3589757680892944, -1.286643147468567, -1.214310646057129, -1.1419780254364014, -1.0696455240249634, -0.9973130226135254, -0.9249804615974426, -0.8526478409767151, -0.7803152799606323, -0.7079827785491943, -0.6356502175331116, -0.5633176565170288, -0.49098509550094604, -0.41865256428718567, -0.3463200330734253, -0.27398747205734253, -0.20165492594242096, -0.1293223798274994, -0.05698983371257782, 0.01534271240234375, 0.08767527341842651, 0.1600078046321869, 0.23234033584594727, 0.30467289686203003, 0.3770054578781128, 0.44933798909187317, 0.5216705203056335, 0.5940030813217163, 0.6663356423377991, 0.7386682033538818, 0.8110007047653198, 0.8833332657814026]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 14.0, 16.0, 12.0, 14.0, 27.0, 33.0, 33.0, 28.0, 40.0, 37.0, 37.0, 45.0, 40.0, 42.0, 35.0, 46.0, 41.0, 52.0, 34.0, 45.0, 41.0, 43.0, 20.0, 41.0, 29.0, 26.0, 16.0, 23.0, 11.0, 15.0, 8.0, 8.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3355566263198853, -1.291715383529663, -1.247874140739441, -1.2040328979492188, -1.1601916551589966, -1.1163504123687744, -1.0725090503692627, -1.0286678075790405, -0.9848265647888184, -0.9409853219985962, -0.897144079208374, -0.8533028364181519, -0.8094615340232849, -0.7656202912330627, -0.7217790484428406, -0.6779377460479736, -0.6340965628623962, -0.5902553200721741, -0.5464140772819519, -0.502572774887085, -0.4587315320968628, -0.4148902893066406, -0.37104904651641846, -0.3272077739238739, -0.28336653113365173, -0.23952527344226837, -0.195684015750885, -0.15184277296066284, -0.10800151526927948, -0.06416025757789612, -0.02031901478767395, 0.023522257804870605, 0.06736350059509277, 0.11120475828647614, 0.1550460159778595, 0.19888725876808167, 0.24272851645946503, 0.2865697741508484, 0.33041101694107056, 0.3742522895336151, 0.4180935323238373, 0.46193477511405945, 0.505776047706604, 0.5496172904968262, 0.5934585332870483, 0.6372997760772705, 0.6811410188674927, 0.7249823212623596, 0.7688235640525818, 0.812664806842804, 0.8565060496330261, 0.9003473520278931, 0.9441885948181152, 0.9880298376083374, 1.0318710803985596, 1.0757123231887817, 1.119553565979004, 1.163394808769226, 1.2072360515594482, 1.2510772943496704, 1.2949185371398926, 1.3387598991394043, 1.382601022720337, 1.4264423847198486, 1.4702836275100708]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 9.0, 10.0, 14.0, 25.0, 39.0, 64.0, 106.0, 166.0, 339.0, 646.0, 1240.0, 3008.0, 9173.0, 304686.0, 3819075.0, 46396.0, 5381.0, 1983.0, 903.0, 404.0, 259.0, 155.0, 81.0, 41.0, 24.0, 18.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.470733642578125, -1.41021728515625, -1.349700927734375, -1.2891845703125, -1.228668212890625, -1.16815185546875, -1.107635498046875, -1.047119140625, -0.986602783203125, -0.92608642578125, -0.865570068359375, -0.8050537109375, -0.744537353515625, -0.68402099609375, -0.623504638671875, -0.56298828125, -0.502471923828125, -0.44195556640625, -0.381439208984375, -0.3209228515625, -0.260406494140625, -0.19989013671875, -0.139373779296875, -0.078857421875, -0.018341064453125, 0.04217529296875, 0.102691650390625, 0.1632080078125, 0.223724365234375, 0.28424072265625, 0.344757080078125, 0.4052734375, 0.465789794921875, 0.52630615234375, 0.586822509765625, 0.6473388671875, 0.707855224609375, 0.76837158203125, 0.828887939453125, 0.889404296875, 0.949920654296875, 1.01043701171875, 1.070953369140625, 1.1314697265625, 1.191986083984375, 1.25250244140625, 1.313018798828125, 1.37353515625, 1.434051513671875, 1.49456787109375, 1.555084228515625, 1.6156005859375, 1.676116943359375, 1.73663330078125, 1.797149658203125, 1.857666015625, 1.918182373046875, 1.97869873046875, 2.039215087890625, 2.0997314453125, 2.160247802734375, 2.22076416015625, 2.281280517578125, 2.341796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 20.0, 19.0, 30.0, 29.0, 35.0, 35.0, 50.0, 52.0, 53.0, 61.0, 72.0, 70.0, 52.0, 78.0, 56.0, 64.0, 35.0, 23.0, 36.0, 30.0, 17.0, 17.0, 11.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5660552978515625, -0.546661376953125, -0.5272674560546875, -0.50787353515625, -0.4884796142578125, -0.469085693359375, -0.4496917724609375, -0.4302978515625, -0.4109039306640625, -0.391510009765625, -0.3721160888671875, -0.35272216796875, -0.3333282470703125, -0.313934326171875, -0.2945404052734375, -0.275146484375, -0.2557525634765625, -0.236358642578125, -0.2169647216796875, -0.19757080078125, -0.1781768798828125, -0.158782958984375, -0.1393890380859375, -0.1199951171875, -0.1006011962890625, -0.081207275390625, -0.0618133544921875, -0.04241943359375, -0.0230255126953125, -0.003631591796875, 0.0157623291015625, 0.03515625, 0.0545501708984375, 0.073944091796875, 0.0933380126953125, 0.11273193359375, 0.1321258544921875, 0.151519775390625, 0.1709136962890625, 0.1903076171875, 0.2097015380859375, 0.229095458984375, 0.2484893798828125, 0.26788330078125, 0.2872772216796875, 0.306671142578125, 0.3260650634765625, 0.345458984375, 0.3648529052734375, 0.384246826171875, 0.4036407470703125, 0.42303466796875, 0.4424285888671875, 0.461822509765625, 0.4812164306640625, 0.5006103515625, 0.5200042724609375, 0.539398193359375, 0.5587921142578125, 0.57818603515625, 0.5975799560546875, 0.616973876953125, 0.6363677978515625, 0.65576171875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 11.0, 18.0, 38.0, 35.0, 58.0, 110.0, 147.0, 243.0, 371.0, 604.0, 1046.0, 1914.0, 3423.0, 7207.0, 19611.0, 87656.0, 2487563.0, 1483216.0, 69777.0, 17077.0, 6655.0, 3228.0, 1663.0, 991.0, 596.0, 364.0, 199.0, 138.0, 96.0, 68.0, 34.0, 31.0, 20.0, 12.0, 8.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6888809204101562, -0.6673126220703125, -0.6457443237304688, -0.624176025390625, -0.6026077270507812, -0.5810394287109375, -0.5594711303710938, -0.53790283203125, -0.5163345336914062, -0.4947662353515625, -0.47319793701171875, -0.451629638671875, -0.43006134033203125, -0.4084930419921875, -0.38692474365234375, -0.3653564453125, -0.34378814697265625, -0.3222198486328125, -0.30065155029296875, -0.279083251953125, -0.25751495361328125, -0.2359466552734375, -0.21437835693359375, -0.19281005859375, -0.17124176025390625, -0.1496734619140625, -0.12810516357421875, -0.106536865234375, -0.08496856689453125, -0.0634002685546875, -0.04183197021484375, -0.020263671875, 0.00130462646484375, 0.0228729248046875, 0.04444122314453125, 0.066009521484375, 0.08757781982421875, 0.1091461181640625, 0.13071441650390625, 0.15228271484375, 0.17385101318359375, 0.1954193115234375, 0.21698760986328125, 0.238555908203125, 0.26012420654296875, 0.2816925048828125, 0.30326080322265625, 0.3248291015625, 0.34639739990234375, 0.3679656982421875, 0.38953399658203125, 0.411102294921875, 0.43267059326171875, 0.4542388916015625, 0.47580718994140625, 0.49737548828125, 0.5189437866210938, 0.5405120849609375, 0.5620803833007812, 0.583648681640625, 0.6052169799804688, 0.6267852783203125, 0.6483535766601562, 0.669921875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 9.0, 13.0, 28.0, 35.0, 57.0, 110.0, 197.0, 357.0, 690.0, 987.0, 694.0, 374.0, 183.0, 91.0, 67.0, 33.0, 23.0, 11.0, 12.0, 8.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2161865234375, -0.2088489532470703, -0.20151138305664062, -0.19417381286621094, -0.18683624267578125, -0.17949867248535156, -0.17216110229492188, -0.1648235321044922, -0.1574859619140625, -0.1501483917236328, -0.14281082153320312, -0.13547325134277344, -0.12813568115234375, -0.12079811096191406, -0.11346054077148438, -0.10612297058105469, -0.098785400390625, -0.09144783020019531, -0.08411026000976562, -0.07677268981933594, -0.06943511962890625, -0.06209754943847656, -0.054759979248046875, -0.04742240905761719, -0.0400848388671875, -0.03274726867675781, -0.025409698486328125, -0.018072128295898438, -0.01073455810546875, -0.0033969879150390625, 0.003940582275390625, 0.011278152465820312, 0.01861572265625, 0.025953292846679688, 0.033290863037109375, 0.04062843322753906, 0.04796600341796875, 0.05530357360839844, 0.06264114379882812, 0.06997871398925781, 0.0773162841796875, 0.08465385437011719, 0.09199142456054688, 0.09932899475097656, 0.10666656494140625, 0.11400413513183594, 0.12134170532226562, 0.1286792755126953, 0.136016845703125, 0.1433544158935547, 0.15069198608398438, 0.15802955627441406, 0.16536712646484375, 0.17270469665527344, 0.18004226684570312, 0.1873798370361328, 0.1947174072265625, 0.2020549774169922, 0.20939254760742188, 0.21673011779785156, 0.22406768798828125, 0.23140525817871094, 0.23874282836914062, 0.2460803985595703, 0.25341796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 9.0, 15.0, 25.0, 30.0, 45.0, 65.0, 104.0, 115.0, 153.0, 121.0, 73.0, 61.0, 48.0, 27.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.006345510482788, -0.9785889387130737, -0.9508323669433594, -0.923075795173645, -0.8953192234039307, -0.8675626516342163, -0.839806079864502, -0.8120495080947876, -0.7842929363250732, -0.7565363645553589, -0.7287797927856445, -0.7010232210159302, -0.6732666492462158, -0.6455100774765015, -0.6177535057067871, -0.5899969339370728, -0.5622404217720032, -0.5344838500022888, -0.5067272782325745, -0.4789707064628601, -0.45121413469314575, -0.4234575629234314, -0.39570102095603943, -0.3679444491863251, -0.3401878774166107, -0.31243130564689636, -0.284674733877182, -0.25691819190979004, -0.2291616052389145, -0.20140503346920013, -0.17364847660064697, -0.14589190483093262, -0.11813539266586304, -0.09037882089614868, -0.06262225657701492, -0.034865692257881165, -0.007109120488166809, 0.020647451281547546, 0.04840400815010071, 0.07616057991981506, 0.10391715168952942, 0.13167372345924377, 0.15943029522895813, 0.1871868520975113, 0.21494342386722565, 0.24269999563694, 0.27045655250549316, 0.2982131242752075, 0.3259696960449219, 0.35372626781463623, 0.3814828395843506, 0.40923941135406494, 0.4369959831237793, 0.46475255489349365, 0.4925090968608856, 0.5202656984329224, 0.5480222702026367, 0.5757788419723511, 0.6035354137420654, 0.6312919855117798, 0.6590485572814941, 0.6868051290512085, 0.7145617008209229, 0.7423182725906372, 0.7700747847557068]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 6.0, 17.0, 24.0, 26.0, 25.0, 31.0, 31.0, 41.0, 43.0, 45.0, 52.0, 45.0, 60.0, 58.0, 60.0, 62.0, 53.0, 52.0, 44.0, 39.0, 33.0, 25.0, 26.0, 23.0, 14.0, 21.0, 11.0, 11.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5457655191421509, -0.5264434814453125, -0.5071214437484741, -0.48779940605163574, -0.46847739815711975, -0.44915536046028137, -0.429833322763443, -0.410511314868927, -0.3911892771720886, -0.37186723947525024, -0.35254520177841187, -0.3332231640815735, -0.3139011561870575, -0.2945791184902191, -0.27525708079338074, -0.25593507289886475, -0.23661300539970398, -0.2172909677028656, -0.19796894490718842, -0.17864690721035004, -0.15932488441467285, -0.14000284671783447, -0.1206808090209961, -0.10135878622531891, -0.08203674852848053, -0.06271471828222275, -0.04339268431067467, -0.024070650339126587, -0.004748620092868805, 0.014573410153388977, 0.033895447850227356, 0.05321747064590454, 0.07253950834274292, 0.0918615385890007, 0.11118356883525848, 0.13050560653209686, 0.14982762932777405, 0.16914966702461243, 0.1884717047214508, 0.207793727517128, 0.22711576521396637, 0.24643780291080475, 0.26575982570648193, 0.2850818634033203, 0.3044039011001587, 0.32372593879699707, 0.34304797649383545, 0.36236998438835144, 0.3816920220851898, 0.4010140597820282, 0.4203360974788666, 0.43965810537338257, 0.45898014307022095, 0.4783021807670593, 0.4976242184638977, 0.5169462561607361, 0.5362682938575745, 0.5555903315544128, 0.5749123692512512, 0.5942344069480896, 0.613556444644928, 0.6328784227371216, 0.65220046043396, 0.6715224981307983, 0.6908445358276367]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 7.0, 12.0, 9.0, 19.0, 27.0, 32.0, 43.0, 58.0, 67.0, 116.0, 170.0, 254.0, 452.0, 746.0, 1424.0, 2700.0, 5500.0, 11426.0, 26122.0, 66329.0, 197824.0, 419762.0, 198922.0, 66516.0, 26680.0, 11607.0, 5531.0, 2711.0, 1411.0, 781.0, 432.0, 287.0, 176.0, 103.0, 89.0, 50.0, 40.0, 31.0, 20.0, 13.0, 11.0, 5.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0755615234375, -0.07316303253173828, -0.07076454162597656, -0.06836605072021484, -0.06596755981445312, -0.0635690689086914, -0.06117057800292969, -0.05877208709716797, -0.05637359619140625, -0.05397510528564453, -0.05157661437988281, -0.049178123474121094, -0.046779632568359375, -0.044381141662597656, -0.04198265075683594, -0.03958415985107422, -0.0371856689453125, -0.03478717803955078, -0.03238868713378906, -0.029990196228027344, -0.027591705322265625, -0.025193214416503906, -0.022794723510742188, -0.02039623260498047, -0.01799774169921875, -0.015599250793457031, -0.013200759887695312, -0.010802268981933594, -0.008403778076171875, -0.006005287170410156, -0.0036067962646484375, -0.0012083053588867188, 0.001190185546875, 0.0035886764526367188, 0.0059871673583984375, 0.008385658264160156, 0.010784149169921875, 0.013182640075683594, 0.015581130981445312, 0.01797962188720703, 0.02037811279296875, 0.02277660369873047, 0.025175094604492188, 0.027573585510253906, 0.029972076416015625, 0.032370567321777344, 0.03476905822753906, 0.03716754913330078, 0.0395660400390625, 0.04196453094482422, 0.04436302185058594, 0.046761512756347656, 0.049160003662109375, 0.051558494567871094, 0.05395698547363281, 0.05635547637939453, 0.05875396728515625, 0.06115245819091797, 0.06355094909667969, 0.0659494400024414, 0.06834793090820312, 0.07074642181396484, 0.07314491271972656, 0.07554340362548828, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 12.0, 15.0, 32.0, 28.0, 35.0, 51.0, 54.0, 65.0, 77.0, 93.0, 89.0, 92.0, 70.0, 64.0, 47.0, 35.0, 42.0, 21.0, 25.0, 16.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4050445556640625, -0.387725830078125, -0.3704071044921875, -0.35308837890625, -0.3357696533203125, -0.318450927734375, -0.3011322021484375, -0.2838134765625, -0.2664947509765625, -0.249176025390625, -0.2318572998046875, -0.21453857421875, -0.1972198486328125, -0.179901123046875, -0.1625823974609375, -0.145263671875, -0.1279449462890625, -0.110626220703125, -0.0933074951171875, -0.07598876953125, -0.0586700439453125, -0.041351318359375, -0.0240325927734375, -0.0067138671875, 0.0106048583984375, 0.027923583984375, 0.0452423095703125, 0.06256103515625, 0.0798797607421875, 0.097198486328125, 0.1145172119140625, 0.1318359375, 0.1491546630859375, 0.166473388671875, 0.1837921142578125, 0.20111083984375, 0.2184295654296875, 0.235748291015625, 0.2530670166015625, 0.2703857421875, 0.2877044677734375, 0.305023193359375, 0.3223419189453125, 0.33966064453125, 0.3569793701171875, 0.374298095703125, 0.3916168212890625, 0.408935546875, 0.4262542724609375, 0.443572998046875, 0.4608917236328125, 0.47821044921875, 0.4955291748046875, 0.512847900390625, 0.5301666259765625, 0.5474853515625, 0.5648040771484375, 0.582122802734375, 0.5994415283203125, 0.61676025390625, 0.6340789794921875, 0.651397705078125, 0.6687164306640625, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 19.0, 13.0, 18.0, 33.0, 46.0, 46.0, 105.0, 153.0, 248.0, 349.0, 634.0, 1089.0, 1856.0, 3389.0, 6196.0, 12906.0, 27814.0, 65877.0, 168063.0, 344421.0, 241246.0, 96810.0, 39893.0, 18068.0, 8680.0, 4504.0, 2505.0, 1403.0, 787.0, 493.0, 295.0, 178.0, 140.0, 77.0, 50.0, 47.0, 29.0, 26.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.0538783073425293, -0.052000999450683594, -0.05012369155883789, -0.04824638366699219, -0.046369075775146484, -0.04449176788330078, -0.04261445999145508, -0.040737152099609375, -0.03885984420776367, -0.03698253631591797, -0.035105228424072266, -0.03322792053222656, -0.03135061264038086, -0.029473304748535156, -0.027595996856689453, -0.02571868896484375, -0.023841381072998047, -0.021964073181152344, -0.02008676528930664, -0.018209457397460938, -0.016332149505615234, -0.014454841613769531, -0.012577533721923828, -0.010700225830078125, -0.008822917938232422, -0.006945610046386719, -0.005068302154541016, -0.0031909942626953125, -0.0013136863708496094, 0.0005636215209960938, 0.002440929412841797, 0.0043182373046875, 0.006195545196533203, 0.008072853088378906, 0.00995016098022461, 0.011827468872070312, 0.013704776763916016, 0.015582084655761719, 0.017459392547607422, 0.019336700439453125, 0.021214008331298828, 0.02309131622314453, 0.024968624114990234, 0.026845932006835938, 0.02872323989868164, 0.030600547790527344, 0.03247785568237305, 0.03435516357421875, 0.03623247146606445, 0.038109779357910156, 0.03998708724975586, 0.04186439514160156, 0.043741703033447266, 0.04561901092529297, 0.04749631881713867, 0.049373626708984375, 0.05125093460083008, 0.05312824249267578, 0.055005550384521484, 0.05688285827636719, 0.05876016616821289, 0.060637474060058594, 0.0625147819519043, 0.06439208984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 11.0, 7.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 31.0, 20.0, 30.0, 48.0, 38.0, 41.0, 46.0, 56.0, 43.0, 42.0, 47.0, 41.0, 44.0, 41.0, 36.0, 34.0, 29.0, 22.0, 22.0, 22.0, 24.0, 24.0, 14.0, 8.0, 14.0, 12.0, 9.0, 6.0, 11.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57763671875, -0.5601806640625, -0.542724609375, -0.5252685546875, -0.5078125, -0.4903564453125, -0.472900390625, -0.4554443359375, -0.43798828125, -0.4205322265625, -0.403076171875, -0.3856201171875, -0.3681640625, -0.3507080078125, -0.333251953125, -0.3157958984375, -0.29833984375, -0.2808837890625, -0.263427734375, -0.2459716796875, -0.228515625, -0.2110595703125, -0.193603515625, -0.1761474609375, -0.15869140625, -0.1412353515625, -0.123779296875, -0.1063232421875, -0.0888671875, -0.0714111328125, -0.053955078125, -0.0364990234375, -0.01904296875, -0.0015869140625, 0.015869140625, 0.0333251953125, 0.05078125, 0.0682373046875, 0.085693359375, 0.1031494140625, 0.12060546875, 0.1380615234375, 0.155517578125, 0.1729736328125, 0.1904296875, 0.2078857421875, 0.225341796875, 0.2427978515625, 0.26025390625, 0.2777099609375, 0.295166015625, 0.3126220703125, 0.330078125, 0.3475341796875, 0.364990234375, 0.3824462890625, 0.39990234375, 0.4173583984375, 0.434814453125, 0.4522705078125, 0.4697265625, 0.4871826171875, 0.504638671875, 0.5220947265625, 0.53955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 14.0, 19.0, 28.0, 38.0, 55.0, 124.0, 229.0, 448.0, 850.0, 2068.0, 5245.0, 16776.0, 72480.0, 459626.0, 403635.0, 63116.0, 15177.0, 4865.0, 1988.0, 886.0, 423.0, 181.0, 105.0, 73.0, 43.0, 18.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443115234375, -0.04314422607421875, -0.0419769287109375, -0.04080963134765625, -0.039642333984375, -0.03847503662109375, -0.0373077392578125, -0.03614044189453125, -0.03497314453125, -0.03380584716796875, -0.0326385498046875, -0.03147125244140625, -0.030303955078125, -0.02913665771484375, -0.0279693603515625, -0.02680206298828125, -0.025634765625, -0.02446746826171875, -0.0233001708984375, -0.02213287353515625, -0.020965576171875, -0.01979827880859375, -0.0186309814453125, -0.01746368408203125, -0.01629638671875, -0.01512908935546875, -0.0139617919921875, -0.01279449462890625, -0.011627197265625, -0.01045989990234375, -0.0092926025390625, -0.00812530517578125, -0.0069580078125, -0.00579071044921875, -0.0046234130859375, -0.00345611572265625, -0.002288818359375, -0.00112152099609375, 4.57763671875e-05, 0.00121307373046875, 0.00238037109375, 0.00354766845703125, 0.0047149658203125, 0.00588226318359375, 0.007049560546875, 0.00821685791015625, 0.0093841552734375, 0.01055145263671875, 0.01171875, 0.01288604736328125, 0.0140533447265625, 0.01522064208984375, 0.016387939453125, 0.01755523681640625, 0.0187225341796875, 0.01988983154296875, 0.02105712890625, 0.02222442626953125, 0.0233917236328125, 0.02455902099609375, 0.025726318359375, 0.02689361572265625, 0.0280609130859375, 0.02922821044921875, 0.0303955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 20.0, 20.0, 20.0, 41.0, 55.0, 96.0, 104.0, 129.0, 148.0, 92.0, 78.0, 50.0, 32.0, 26.0, 17.0, 14.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7583370208740234e-05, -1.690257340669632e-05, -1.6221776604652405e-05, -1.554097980260849e-05, -1.4860183000564575e-05, -1.417938619852066e-05, -1.3498589396476746e-05, -1.281779259443283e-05, -1.2136995792388916e-05, -1.1456198990345001e-05, -1.0775402188301086e-05, -1.0094605386257172e-05, -9.413808584213257e-06, -8.733011782169342e-06, -8.052214980125427e-06, -7.3714181780815125e-06, -6.690621376037598e-06, -6.009824573993683e-06, -5.329027771949768e-06, -4.648230969905853e-06, -3.9674341678619385e-06, -3.2866373658180237e-06, -2.605840563774109e-06, -1.925043761730194e-06, -1.2442469596862793e-06, -5.634501576423645e-07, 1.1734664440155029e-07, 7.981434464454651e-07, 1.4789402484893799e-06, 2.1597370505332947e-06, 2.8405338525772095e-06, 3.5213306546211243e-06, 4.202127456665039e-06, 4.882924258708954e-06, 5.563721060752869e-06, 6.2445178627967834e-06, 6.925314664840698e-06, 7.606111466884613e-06, 8.286908268928528e-06, 8.967705070972443e-06, 9.648501873016357e-06, 1.0329298675060272e-05, 1.1010095477104187e-05, 1.1690892279148102e-05, 1.2371689081192017e-05, 1.3052485883235931e-05, 1.3733282685279846e-05, 1.4414079487323761e-05, 1.5094876289367676e-05, 1.577567309141159e-05, 1.6456469893455505e-05, 1.713726669549942e-05, 1.7818063497543335e-05, 1.849886029958725e-05, 1.9179657101631165e-05, 1.986045390367508e-05, 2.0541250705718994e-05, 2.122204750776291e-05, 2.1902844309806824e-05, 2.258364111185074e-05, 2.3264437913894653e-05, 2.3945234715938568e-05, 2.4626031517982483e-05, 2.5306828320026398e-05, 2.5987625122070312e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 5.0, 10.0, 17.0, 16.0, 30.0, 37.0, 55.0, 88.0, 119.0, 221.0, 332.0, 605.0, 1058.0, 1968.0, 3654.0, 7472.0, 16687.0, 41348.0, 112174.0, 319239.0, 341410.0, 123158.0, 44183.0, 17858.0, 8037.0, 3926.0, 2087.0, 1114.0, 647.0, 401.0, 223.0, 119.0, 76.0, 53.0, 43.0, 19.0, 22.0, 11.0, 10.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0227508544921875, -0.022062301635742188, -0.021373748779296875, -0.020685195922851562, -0.01999664306640625, -0.019308090209960938, -0.018619537353515625, -0.017930984497070312, -0.017242431640625, -0.016553878784179688, -0.015865325927734375, -0.015176773071289062, -0.01448822021484375, -0.013799667358398438, -0.013111114501953125, -0.012422561645507812, -0.0117340087890625, -0.011045455932617188, -0.010356903076171875, -0.009668350219726562, -0.00897979736328125, -0.008291244506835938, -0.007602691650390625, -0.0069141387939453125, -0.0062255859375, -0.0055370330810546875, -0.004848480224609375, -0.0041599273681640625, -0.00347137451171875, -0.0027828216552734375, -0.002094268798828125, -0.0014057159423828125, -0.0007171630859375, -2.86102294921875e-05, 0.000659942626953125, 0.0013484954833984375, 0.00203704833984375, 0.0027256011962890625, 0.003414154052734375, 0.0041027069091796875, 0.004791259765625, 0.0054798126220703125, 0.006168365478515625, 0.0068569183349609375, 0.00754547119140625, 0.008234024047851562, 0.008922576904296875, 0.009611129760742188, 0.0102996826171875, 0.010988235473632812, 0.011676788330078125, 0.012365341186523438, 0.01305389404296875, 0.013742446899414062, 0.014430999755859375, 0.015119552612304688, 0.01580810546875, 0.016496658325195312, 0.017185211181640625, 0.017873764038085938, 0.01856231689453125, 0.019250869750976562, 0.019939422607421875, 0.020627975463867188, 0.0213165283203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 15.0, 6.0, 16.0, 21.0, 21.0, 28.0, 43.0, 46.0, 50.0, 53.0, 56.0, 85.0, 65.0, 60.0, 66.0, 70.0, 55.0, 48.0, 32.0, 30.0, 20.0, 24.0, 18.0, 17.0, 11.0, 4.0, 7.0, 2.0, 3.0, 7.0, 0.0, 5.0, 1.0, 1.0], "bins": [-0.010040283203125, -0.009804010391235352, -0.009567737579345703, -0.009331464767456055, -0.009095191955566406, -0.008858919143676758, -0.00862264633178711, -0.008386373519897461, -0.008150100708007812, -0.007913827896118164, -0.007677555084228516, -0.007441282272338867, -0.007205009460449219, -0.00696873664855957, -0.006732463836669922, -0.0064961910247802734, -0.006259918212890625, -0.0060236454010009766, -0.005787372589111328, -0.00555109977722168, -0.005314826965332031, -0.005078554153442383, -0.004842281341552734, -0.004606008529663086, -0.0043697357177734375, -0.004133462905883789, -0.0038971900939941406, -0.003660917282104492, -0.0034246444702148438, -0.0031883716583251953, -0.002952098846435547, -0.0027158260345458984, -0.00247955322265625, -0.0022432804107666016, -0.002007007598876953, -0.0017707347869873047, -0.0015344619750976562, -0.0012981891632080078, -0.0010619163513183594, -0.0008256435394287109, -0.0005893707275390625, -0.00035309791564941406, -0.00011682510375976562, 0.00011944770812988281, 0.00035572052001953125, 0.0005919933319091797, 0.0008282661437988281, 0.0010645389556884766, 0.001300811767578125, 0.0015370845794677734, 0.0017733573913574219, 0.0020096302032470703, 0.0022459030151367188, 0.002482175827026367, 0.0027184486389160156, 0.002954721450805664, 0.0031909942626953125, 0.003427267074584961, 0.0036635398864746094, 0.003899812698364258, 0.004136085510253906, 0.004372358322143555, 0.004608631134033203, 0.0048449039459228516, 0.0050811767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 12.0, 15.0, 43.0, 98.0, 275.0, 335.0, 137.0, 35.0, 23.0, 11.0, 13.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.4358296394348145, -2.389970541000366, -2.344111204147339, -2.2982521057128906, -2.2523930072784424, -2.206533670425415, -2.160674571990967, -2.1148154735565186, -2.0689563751220703, -2.023097276687622, -1.9772380590438843, -1.9313788414001465, -1.8855197429656982, -1.8396605253219604, -1.7938013076782227, -1.7479422092437744, -1.702082872390747, -1.6562236547470093, -1.610364556312561, -1.5645053386688232, -1.518646240234375, -1.4727870225906372, -1.4269278049468994, -1.3810687065124512, -1.3352094888687134, -1.2893502712249756, -1.2434911727905273, -1.1976319551467896, -1.1517727375030518, -1.1059136390686035, -1.0600544214248657, -1.014195203781128, -0.9683359861373901, -0.9224768280982971, -0.8766176700592041, -0.8307584524154663, -0.7848992943763733, -0.7390401363372803, -0.6931809186935425, -0.6473217606544495, -0.6014626026153564, -0.5556034445762634, -0.5097442865371704, -0.4638850688934326, -0.4180259108543396, -0.3721667528152466, -0.3263075649738312, -0.28044837713241577, -0.23458921909332275, -0.18873004615306854, -0.14287087321281433, -0.09701170027256012, -0.05115252733230591, -0.005293354392051697, 0.040565818548202515, 0.08642500638961792, 0.13228416442871094, 0.17814333736896515, 0.22400251030921936, 0.26986169815063477, 0.3157208561897278, 0.3615800142288208, 0.4074392020702362, 0.4532983899116516, 0.49915754795074463]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 14.0, 23.0, 23.0, 21.0, 37.0, 40.0, 37.0, 52.0, 52.0, 64.0, 66.0, 68.0, 69.0, 72.0, 57.0, 62.0, 42.0, 38.0, 36.0, 27.0, 17.0, 20.0, 16.0, 13.0, 6.0, 3.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3846094310283661, -0.37079745531082153, -0.35698550939559937, -0.3431735336780548, -0.32936158776283264, -0.3155496120452881, -0.3017376661300659, -0.28792569041252136, -0.2741137146949768, -0.26030173897743225, -0.24648979306221008, -0.23267781734466553, -0.21886587142944336, -0.2050538957118988, -0.19124193489551544, -0.17742997407913208, -0.1636180281639099, -0.14980606734752655, -0.1359941065311432, -0.12218213826417923, -0.10837017744779587, -0.0945582166314125, -0.08074624836444855, -0.06693428754806519, -0.053122326731681824, -0.03931036591529846, -0.0254984013736248, -0.011686436831951141, 0.0021255239844322205, 0.015937484800815582, 0.02974945306777954, 0.0435614138841629, 0.057373374700546265, 0.07118533551692963, 0.08499729633331299, 0.09880926460027695, 0.11262122541666031, 0.12643319368362427, 0.14024515450000763, 0.154057115316391, 0.16786907613277435, 0.18168103694915771, 0.19549299776554108, 0.20930495858192444, 0.223116934299469, 0.23692888021469116, 0.2507408559322357, 0.2645528316497803, 0.27836477756500244, 0.292176753282547, 0.30598869919776917, 0.3198006749153137, 0.3336126208305359, 0.34742459654808044, 0.361236572265625, 0.37504851818084717, 0.38886046409606934, 0.4026724398136139, 0.41648438572883606, 0.4302963614463806, 0.4441083073616028, 0.45792028307914734, 0.4717322587966919, 0.48554420471191406, 0.4993561804294586]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 7.0, 19.0, 23.0, 35.0, 48.0, 75.0, 126.0, 241.0, 375.0, 723.0, 1237.0, 2643.0, 6032.0, 16155.0, 59343.0, 378934.0, 477513.0, 73438.0, 18814.0, 6755.0, 2816.0, 1381.0, 715.0, 434.0, 236.0, 156.0, 89.0, 64.0, 26.0, 29.0, 18.0, 12.0, 12.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.26369476318359375, -0.2539520263671875, -0.24420928955078125, -0.234466552734375, -0.22472381591796875, -0.2149810791015625, -0.20523834228515625, -0.19549560546875, -0.18575286865234375, -0.1760101318359375, -0.16626739501953125, -0.156524658203125, -0.14678192138671875, -0.1370391845703125, -0.12729644775390625, -0.1175537109375, -0.10781097412109375, -0.0980682373046875, -0.08832550048828125, -0.078582763671875, -0.06884002685546875, -0.0590972900390625, -0.04935455322265625, -0.03961181640625, -0.02986907958984375, -0.0201263427734375, -0.01038360595703125, -0.000640869140625, 0.00910186767578125, 0.0188446044921875, 0.02858734130859375, 0.038330078125, 0.04807281494140625, 0.0578155517578125, 0.06755828857421875, 0.077301025390625, 0.08704376220703125, 0.0967864990234375, 0.10652923583984375, 0.11627197265625, 0.12601470947265625, 0.1357574462890625, 0.14550018310546875, 0.155242919921875, 0.16498565673828125, 0.1747283935546875, 0.18447113037109375, 0.1942138671875, 0.20395660400390625, 0.2136993408203125, 0.22344207763671875, 0.233184814453125, 0.24292755126953125, 0.2526702880859375, 0.26241302490234375, 0.27215576171875, 0.28189849853515625, 0.2916412353515625, 0.30138397216796875, 0.311126708984375, 0.32086944580078125, 0.3306121826171875, 0.34035491943359375, 0.35009765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 1.0, 5.0, 14.0, 15.0, 28.0, 21.0, 25.0, 41.0, 44.0, 42.0, 63.0, 74.0, 72.0, 67.0, 70.0, 84.0, 55.0, 61.0, 46.0, 38.0, 26.0, 19.0, 24.0, 16.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.836090087890625, -0.80596923828125, -0.775848388671875, -0.7457275390625, -0.715606689453125, -0.68548583984375, -0.655364990234375, -0.625244140625, -0.595123291015625, -0.56500244140625, -0.534881591796875, -0.5047607421875, -0.474639892578125, -0.44451904296875, -0.414398193359375, -0.38427734375, -0.354156494140625, -0.32403564453125, -0.293914794921875, -0.2637939453125, -0.233673095703125, -0.20355224609375, -0.173431396484375, -0.143310546875, -0.113189697265625, -0.08306884765625, -0.052947998046875, -0.0228271484375, 0.007293701171875, 0.03741455078125, 0.067535400390625, 0.09765625, 0.127777099609375, 0.15789794921875, 0.188018798828125, 0.2181396484375, 0.248260498046875, 0.27838134765625, 0.308502197265625, 0.338623046875, 0.368743896484375, 0.39886474609375, 0.428985595703125, 0.4591064453125, 0.489227294921875, 0.51934814453125, 0.549468994140625, 0.57958984375, 0.609710693359375, 0.63983154296875, 0.669952392578125, 0.7000732421875, 0.730194091796875, 0.76031494140625, 0.790435791015625, 0.820556640625, 0.850677490234375, 0.88079833984375, 0.910919189453125, 0.9410400390625, 0.971160888671875, 1.00128173828125, 1.031402587890625, 1.0615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 16.0, 20.0, 18.0, 30.0, 36.0, 65.0, 105.0, 159.0, 249.0, 562.0, 2199.0, 17864.0, 678809.0, 334272.0, 11391.0, 1598.0, 513.0, 228.0, 123.0, 82.0, 68.0, 41.0, 30.0, 19.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.673828125, -0.6545257568359375, -0.635223388671875, -0.6159210205078125, -0.59661865234375, -0.5773162841796875, -0.558013916015625, -0.5387115478515625, -0.5194091796875, -0.5001068115234375, -0.480804443359375, -0.4615020751953125, -0.44219970703125, -0.4228973388671875, -0.403594970703125, -0.3842926025390625, -0.364990234375, -0.3456878662109375, -0.326385498046875, -0.3070831298828125, -0.28778076171875, -0.2684783935546875, -0.249176025390625, -0.2298736572265625, -0.2105712890625, -0.1912689208984375, -0.171966552734375, -0.1526641845703125, -0.13336181640625, -0.1140594482421875, -0.094757080078125, -0.0754547119140625, -0.05615234375, -0.0368499755859375, -0.017547607421875, 0.0017547607421875, 0.02105712890625, 0.0403594970703125, 0.059661865234375, 0.0789642333984375, 0.0982666015625, 0.1175689697265625, 0.136871337890625, 0.1561737060546875, 0.17547607421875, 0.1947784423828125, 0.214080810546875, 0.2333831787109375, 0.252685546875, 0.2719879150390625, 0.291290283203125, 0.3105926513671875, 0.32989501953125, 0.3491973876953125, 0.368499755859375, 0.3878021240234375, 0.4071044921875, 0.4264068603515625, 0.445709228515625, 0.4650115966796875, 0.48431396484375, 0.5036163330078125, 0.522918701171875, 0.5422210693359375, 0.5615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 8.0, 8.0, 12.0, 20.0, 19.0, 20.0, 26.0, 29.0, 26.0, 29.0, 44.0, 40.0, 48.0, 38.0, 33.0, 44.0, 40.0, 60.0, 48.0, 52.0, 54.0, 35.0, 47.0, 25.0, 23.0, 16.0, 24.0, 15.0, 14.0, 16.0, 14.0, 7.0, 10.0, 5.0, 6.0, 10.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67431640625, -0.6527099609375, -0.631103515625, -0.6094970703125, -0.587890625, -0.5662841796875, -0.544677734375, -0.5230712890625, -0.50146484375, -0.4798583984375, -0.458251953125, -0.4366455078125, -0.4150390625, -0.3934326171875, -0.371826171875, -0.3502197265625, -0.32861328125, -0.3070068359375, -0.285400390625, -0.2637939453125, -0.2421875, -0.2205810546875, -0.198974609375, -0.1773681640625, -0.15576171875, -0.1341552734375, -0.112548828125, -0.0909423828125, -0.0693359375, -0.0477294921875, -0.026123046875, -0.0045166015625, 0.01708984375, 0.0386962890625, 0.060302734375, 0.0819091796875, 0.103515625, 0.1251220703125, 0.146728515625, 0.1683349609375, 0.18994140625, 0.2115478515625, 0.233154296875, 0.2547607421875, 0.2763671875, 0.2979736328125, 0.319580078125, 0.3411865234375, 0.36279296875, 0.3843994140625, 0.406005859375, 0.4276123046875, 0.44921875, 0.4708251953125, 0.492431640625, 0.5140380859375, 0.53564453125, 0.5572509765625, 0.578857421875, 0.6004638671875, 0.6220703125, 0.6436767578125, 0.665283203125, 0.6868896484375, 0.70849609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 10.0, 10.0, 16.0, 15.0, 26.0, 37.0, 82.0, 125.0, 251.0, 756.0, 2417.0, 12286.0, 192757.0, 803654.0, 29661.0, 4487.0, 1175.0, 403.0, 158.0, 95.0, 35.0, 23.0, 21.0, 10.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.239501953125, -0.2318267822265625, -0.224151611328125, -0.2164764404296875, -0.20880126953125, -0.2011260986328125, -0.193450927734375, -0.1857757568359375, -0.1781005859375, -0.1704254150390625, -0.162750244140625, -0.1550750732421875, -0.14739990234375, -0.1397247314453125, -0.132049560546875, -0.1243743896484375, -0.11669921875, -0.1090240478515625, -0.101348876953125, -0.0936737060546875, -0.08599853515625, -0.0783233642578125, -0.070648193359375, -0.0629730224609375, -0.0552978515625, -0.0476226806640625, -0.039947509765625, -0.0322723388671875, -0.02459716796875, -0.0169219970703125, -0.009246826171875, -0.0015716552734375, 0.006103515625, 0.0137786865234375, 0.021453857421875, 0.0291290283203125, 0.03680419921875, 0.0444793701171875, 0.052154541015625, 0.0598297119140625, 0.0675048828125, 0.0751800537109375, 0.082855224609375, 0.0905303955078125, 0.09820556640625, 0.1058807373046875, 0.113555908203125, 0.1212310791015625, 0.12890625, 0.1365814208984375, 0.144256591796875, 0.1519317626953125, 0.15960693359375, 0.1672821044921875, 0.174957275390625, 0.1826324462890625, 0.1903076171875, 0.1979827880859375, 0.205657958984375, 0.2133331298828125, 0.22100830078125, 0.2286834716796875, 0.236358642578125, 0.2440338134765625, 0.251708984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 18.0, 14.0, 29.0, 25.0, 40.0, 67.0, 89.0, 129.0, 136.0, 120.0, 96.0, 55.0, 43.0, 27.0, 17.0, 20.0, 12.0, 8.0, 8.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1683983504772186e-05, -2.1016225218772888e-05, -2.034846693277359e-05, -1.9680708646774292e-05, -1.9012950360774994e-05, -1.8345192074775696e-05, -1.7677433788776398e-05, -1.70096755027771e-05, -1.63419172167778e-05, -1.5674158930778503e-05, -1.5006400644779205e-05, -1.4338642358779907e-05, -1.3670884072780609e-05, -1.3003125786781311e-05, -1.2335367500782013e-05, -1.1667609214782715e-05, -1.0999850928783417e-05, -1.0332092642784119e-05, -9.66433435678482e-06, -8.996576070785522e-06, -8.328817784786224e-06, -7.661059498786926e-06, -6.993301212787628e-06, -6.32554292678833e-06, -5.657784640789032e-06, -4.990026354789734e-06, -4.322268068790436e-06, -3.6545097827911377e-06, -2.9867514967918396e-06, -2.3189932107925415e-06, -1.6512349247932434e-06, -9.834766387939453e-07, -3.157183527946472e-07, 3.520399332046509e-07, 1.019798219203949e-06, 1.687556505203247e-06, 2.355314791202545e-06, 3.0230730772018433e-06, 3.6908313632011414e-06, 4.3585896492004395e-06, 5.0263479351997375e-06, 5.694106221199036e-06, 6.361864507198334e-06, 7.029622793197632e-06, 7.69738107919693e-06, 8.365139365196228e-06, 9.032897651195526e-06, 9.700655937194824e-06, 1.0368414223194122e-05, 1.103617250919342e-05, 1.1703930795192719e-05, 1.2371689081192017e-05, 1.3039447367191315e-05, 1.3707205653190613e-05, 1.4374963939189911e-05, 1.5042722225189209e-05, 1.5710480511188507e-05, 1.6378238797187805e-05, 1.7045997083187103e-05, 1.77137553691864e-05, 1.83815136551857e-05, 1.9049271941184998e-05, 1.9717030227184296e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 10.0, 5.0, 11.0, 17.0, 23.0, 32.0, 50.0, 48.0, 99.0, 144.0, 201.0, 336.0, 601.0, 1318.0, 3053.0, 9340.0, 50008.0, 719223.0, 230976.0, 23065.0, 5612.0, 2136.0, 944.0, 521.0, 262.0, 166.0, 108.0, 84.0, 54.0, 34.0, 29.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.2319011688232422, -0.22576522827148438, -0.21962928771972656, -0.21349334716796875, -0.20735740661621094, -0.20122146606445312, -0.1950855255126953, -0.1889495849609375, -0.1828136444091797, -0.17667770385742188, -0.17054176330566406, -0.16440582275390625, -0.15826988220214844, -0.15213394165039062, -0.1459980010986328, -0.139862060546875, -0.1337261199951172, -0.12759017944335938, -0.12145423889160156, -0.11531829833984375, -0.10918235778808594, -0.10304641723632812, -0.09691047668457031, -0.0907745361328125, -0.08463859558105469, -0.07850265502929688, -0.07236671447753906, -0.06623077392578125, -0.06009483337402344, -0.053958892822265625, -0.04782295227050781, -0.04168701171875, -0.03555107116699219, -0.029415130615234375, -0.023279190063476562, -0.01714324951171875, -0.011007308959960938, -0.004871368408203125, 0.0012645721435546875, 0.0074005126953125, 0.013536453247070312, 0.019672393798828125, 0.025808334350585938, 0.03194427490234375, 0.03808021545410156, 0.044216156005859375, 0.05035209655761719, 0.056488037109375, 0.06262397766113281, 0.06875991821289062, 0.07489585876464844, 0.08103179931640625, 0.08716773986816406, 0.09330368041992188, 0.09943962097167969, 0.1055755615234375, 0.11171150207519531, 0.11784744262695312, 0.12398338317871094, 0.13011932373046875, 0.13625526428222656, 0.14239120483398438, 0.1485271453857422, 0.1546630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 11.0, 11.0, 20.0, 23.0, 29.0, 39.0, 65.0, 118.0, 154.0, 142.0, 121.0, 78.0, 54.0, 37.0, 25.0, 18.0, 8.0, 7.0, 5.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05908203125, -0.05674266815185547, -0.05440330505371094, -0.052063941955566406, -0.049724578857421875, -0.047385215759277344, -0.04504585266113281, -0.04270648956298828, -0.04036712646484375, -0.03802776336669922, -0.03568840026855469, -0.033349037170410156, -0.031009674072265625, -0.028670310974121094, -0.026330947875976562, -0.02399158477783203, -0.0216522216796875, -0.01931285858154297, -0.016973495483398438, -0.014634132385253906, -0.012294769287109375, -0.009955406188964844, -0.0076160430908203125, -0.005276679992675781, -0.00293731689453125, -0.0005979537963867188, 0.0017414093017578125, 0.004080772399902344, 0.006420135498046875, 0.008759498596191406, 0.011098861694335938, 0.013438224792480469, 0.015777587890625, 0.01811695098876953, 0.020456314086914062, 0.022795677185058594, 0.025135040283203125, 0.027474403381347656, 0.029813766479492188, 0.03215312957763672, 0.03449249267578125, 0.03683185577392578, 0.03917121887207031, 0.041510581970214844, 0.043849945068359375, 0.046189308166503906, 0.04852867126464844, 0.05086803436279297, 0.0532073974609375, 0.05554676055908203, 0.05788612365722656, 0.060225486755371094, 0.06256484985351562, 0.06490421295166016, 0.06724357604980469, 0.06958293914794922, 0.07192230224609375, 0.07426166534423828, 0.07660102844238281, 0.07894039154052734, 0.08127975463867188, 0.0836191177368164, 0.08595848083496094, 0.08829784393310547, 0.09063720703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 14.0, 22.0, 66.0, 169.0, 350.0, 210.0, 88.0, 35.0, 16.0, 10.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1026254892349243, -1.0155296325683594, -0.9284337162971497, -0.8413378000259399, -0.754241943359375, -0.6671460866928101, -0.5800501704216003, -0.4929542541503906, -0.4058583974838257, -0.31876251101493835, -0.23166662454605103, -0.1445707380771637, -0.05747485160827637, 0.029621034860610962, 0.11671692132949829, 0.203812837600708, 0.29090869426727295, 0.3780045807361603, 0.4651004672050476, 0.5521963834762573, 0.6392922401428223, 0.7263880968093872, 0.8134840130805969, 0.9005799293518066, 0.9876757860183716, 1.0747716426849365, 1.161867618560791, 1.248963475227356, 1.336059331893921, 1.4231551885604858, 1.5102510452270508, 1.5973470211029053, 1.6844429969787598, 1.7715388536453247, 1.8586347103118896, 1.9457306861877441, 2.0328264236450195, 2.119922399520874, 2.2070183753967285, 2.294114112854004, 2.3812100887298584, 2.468306064605713, 2.5554018020629883, 2.6424977779388428, 2.7295937538146973, 2.8166894912719727, 2.903785467147827, 2.9908814430236816, 3.077977180480957, 3.1650731563568115, 3.252168893814087, 3.3392648696899414, 3.426360607147217, 3.5134565830230713, 3.600552558898926, 3.687648296356201, 3.7747442722320557, 3.86184024810791, 3.9489359855651855, 4.036031723022461, 4.1231279373168945, 4.21022367477417, 4.297319412231445, 4.384415626525879, 4.471511363983154]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 9.0, 17.0, 12.0, 30.0, 14.0, 25.0, 17.0, 31.0, 31.0, 17.0, 39.0, 33.0, 43.0, 47.0, 41.0, 35.0, 41.0, 46.0, 46.0, 34.0, 31.0, 39.0, 35.0, 32.0, 29.0, 32.0, 15.0, 21.0, 15.0, 14.0, 21.0, 24.0, 12.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.1144568920135498, -1.0803848505020142, -1.046312928199768, -1.0122408866882324, -0.9781688451766968, -0.9440968632698059, -0.910024881362915, -0.8759528398513794, -0.8418807983398438, -0.8078088164329529, -0.7737367749214172, -0.7396647930145264, -0.7055927515029907, -0.6715207695960999, -0.637448787689209, -0.6033767461776733, -0.5693047642707825, -0.5352327823638916, -0.501160740852356, -0.4670887589454651, -0.43301671743392944, -0.3989447355270386, -0.3648727238178253, -0.33080071210861206, -0.2967287003993988, -0.26265668869018555, -0.2285846769809723, -0.19451268017292023, -0.16044066846370697, -0.1263686567544937, -0.09229665994644165, -0.058224648237228394, -0.024152636528015137, 0.009919371455907822, 0.04399137943983078, 0.07806338369846344, 0.1121353954076767, 0.14620740711688995, 0.18027940392494202, 0.21435141563415527, 0.24842342734336853, 0.2824954390525818, 0.31656745076179504, 0.3506394624710083, 0.38471144437789917, 0.4187834858894348, 0.4528554677963257, 0.48692747950553894, 0.5209994912147522, 0.5550714731216431, 0.5891435146331787, 0.6232154965400696, 0.6572875380516052, 0.6913595199584961, 0.7254315614700317, 0.7595035433769226, 0.7935755252838135, 0.8276475071907043, 0.86171954870224, 0.8957915306091309, 0.9298635721206665, 0.9639355540275574, 0.9980075359344482, 1.0320795774459839, 1.0661516189575195]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 12.0, 11.0, 17.0, 12.0, 18.0, 11.0, 27.0, 35.0, 49.0, 73.0, 108.0, 130.0, 188.0, 302.0, 399.0, 669.0, 984.0, 1971.0, 3945.0, 11594.0, 161677.0, 3706916.0, 278504.0, 16602.0, 4627.0, 2113.0, 1197.0, 659.0, 458.0, 268.0, 206.0, 138.0, 113.0, 74.0, 40.0, 35.0, 36.0, 20.0, 16.0, 5.0, 1.0, 6.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.27734375, -1.239288330078125, -1.20123291015625, -1.163177490234375, -1.1251220703125, -1.087066650390625, -1.04901123046875, -1.010955810546875, -0.972900390625, -0.934844970703125, -0.89678955078125, -0.858734130859375, -0.8206787109375, -0.782623291015625, -0.74456787109375, -0.706512451171875, -0.66845703125, -0.630401611328125, -0.59234619140625, -0.554290771484375, -0.5162353515625, -0.478179931640625, -0.44012451171875, -0.402069091796875, -0.364013671875, -0.325958251953125, -0.28790283203125, -0.249847412109375, -0.2117919921875, -0.173736572265625, -0.13568115234375, -0.097625732421875, -0.0595703125, -0.021514892578125, 0.01654052734375, 0.054595947265625, 0.0926513671875, 0.130706787109375, 0.16876220703125, 0.206817626953125, 0.244873046875, 0.282928466796875, 0.32098388671875, 0.359039306640625, 0.3970947265625, 0.435150146484375, 0.47320556640625, 0.511260986328125, 0.54931640625, 0.587371826171875, 0.62542724609375, 0.663482666015625, 0.7015380859375, 0.739593505859375, 0.77764892578125, 0.815704345703125, 0.853759765625, 0.891815185546875, 0.92987060546875, 0.967926025390625, 1.0059814453125, 1.044036865234375, 1.08209228515625, 1.120147705078125, 1.158203125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 2.0, 8.0, 11.0, 14.0, 20.0, 28.0, 25.0, 27.0, 36.0, 36.0, 46.0, 48.0, 43.0, 57.0, 63.0, 78.0, 66.0, 57.0, 63.0, 54.0, 43.0, 31.0, 28.0, 24.0, 18.0, 17.0, 6.0, 10.0, 15.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5202560424804688, -0.5058441162109375, -0.49143218994140625, -0.477020263671875, -0.46260833740234375, -0.4481964111328125, -0.43378448486328125, -0.41937255859375, -0.40496063232421875, -0.3905487060546875, -0.37613677978515625, -0.361724853515625, -0.34731292724609375, -0.3329010009765625, -0.31848907470703125, -0.3040771484375, -0.28966522216796875, -0.2752532958984375, -0.26084136962890625, -0.246429443359375, -0.23201751708984375, -0.2176055908203125, -0.20319366455078125, -0.18878173828125, -0.17436981201171875, -0.1599578857421875, -0.14554595947265625, -0.131134033203125, -0.11672210693359375, -0.1023101806640625, -0.08789825439453125, -0.073486328125, -0.05907440185546875, -0.0446624755859375, -0.03025054931640625, -0.015838623046875, -0.00142669677734375, 0.0129852294921875, 0.02739715576171875, 0.04180908203125, 0.05622100830078125, 0.0706329345703125, 0.08504486083984375, 0.099456787109375, 0.11386871337890625, 0.1282806396484375, 0.14269256591796875, 0.1571044921875, 0.17151641845703125, 0.1859283447265625, 0.20034027099609375, 0.214752197265625, 0.22916412353515625, 0.2435760498046875, 0.25798797607421875, 0.27239990234375, 0.28681182861328125, 0.3012237548828125, 0.31563568115234375, 0.330047607421875, 0.34445953369140625, 0.3588714599609375, 0.37328338623046875, 0.3876953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 10.0, 29.0, 24.0, 50.0, 77.0, 132.0, 196.0, 361.0, 685.0, 1281.0, 3132.0, 9888.0, 58161.0, 3548501.0, 535264.0, 25930.0, 6062.0, 2179.0, 1043.0, 512.0, 308.0, 180.0, 105.0, 62.0, 34.0, 27.0, 17.0, 3.0, 9.0, 3.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1892471313476562, -1.1577911376953125, -1.1263351440429688, -1.094879150390625, -1.0634231567382812, -1.0319671630859375, -1.0005111694335938, -0.96905517578125, -0.9375991821289062, -0.9061431884765625, -0.8746871948242188, -0.843231201171875, -0.8117752075195312, -0.7803192138671875, -0.7488632202148438, -0.7174072265625, -0.6859512329101562, -0.6544952392578125, -0.6230392456054688, -0.591583251953125, -0.5601272583007812, -0.5286712646484375, -0.49721527099609375, -0.46575927734375, -0.43430328369140625, -0.4028472900390625, -0.37139129638671875, -0.339935302734375, -0.30847930908203125, -0.2770233154296875, -0.24556732177734375, -0.214111328125, -0.18265533447265625, -0.1511993408203125, -0.11974334716796875, -0.088287353515625, -0.05683135986328125, -0.0253753662109375, 0.00608062744140625, 0.03753662109375, 0.06899261474609375, 0.1004486083984375, 0.13190460205078125, 0.163360595703125, 0.19481658935546875, 0.2262725830078125, 0.25772857666015625, 0.2891845703125, 0.32064056396484375, 0.3520965576171875, 0.38355255126953125, 0.415008544921875, 0.44646453857421875, 0.4779205322265625, 0.5093765258789062, 0.54083251953125, 0.5722885131835938, 0.6037445068359375, 0.6352005004882812, 0.666656494140625, 0.6981124877929688, 0.7295684814453125, 0.7610244750976562, 0.79248046875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 29.0, 39.0, 52.0, 107.0, 253.0, 544.0, 1075.0, 999.0, 469.0, 206.0, 86.0, 46.0, 50.0, 18.0, 17.0, 9.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2783203125, -0.2698707580566406, -0.26142120361328125, -0.2529716491699219, -0.2445220947265625, -0.23607254028320312, -0.22762298583984375, -0.21917343139648438, -0.210723876953125, -0.20227432250976562, -0.19382476806640625, -0.18537521362304688, -0.1769256591796875, -0.16847610473632812, -0.16002655029296875, -0.15157699584960938, -0.14312744140625, -0.13467788696289062, -0.12622833251953125, -0.11777877807617188, -0.1093292236328125, -0.10087966918945312, -0.09243011474609375, -0.08398056030273438, -0.075531005859375, -0.06708145141601562, -0.05863189697265625, -0.050182342529296875, -0.0417327880859375, -0.033283233642578125, -0.02483367919921875, -0.016384124755859375, -0.0079345703125, 0.000514984130859375, 0.00896453857421875, 0.017414093017578125, 0.0258636474609375, 0.034313201904296875, 0.04276275634765625, 0.051212310791015625, 0.059661865234375, 0.06811141967773438, 0.07656097412109375, 0.08501052856445312, 0.0934600830078125, 0.10190963745117188, 0.11035919189453125, 0.11880874633789062, 0.12725830078125, 0.13570785522460938, 0.14415740966796875, 0.15260696411132812, 0.1610565185546875, 0.16950607299804688, 0.17795562744140625, 0.18640518188476562, 0.194854736328125, 0.20330429077148438, 0.21175384521484375, 0.22020339965820312, 0.2286529541015625, 0.23710250854492188, 0.24555206298828125, 0.2540016174316406, 0.262451171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 20.0, 14.0, 34.0, 43.0, 65.0, 85.0, 133.0, 149.0, 125.0, 86.0, 59.0, 56.0, 35.0, 23.0, 13.0, 7.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908448696136475, -1.0625654458999634, -1.0342860221862793, -1.0060065984725952, -0.9777271151542664, -0.9494476914405823, -0.9211682677268982, -0.8928887844085693, -0.8646093606948853, -0.8363299369812012, -0.8080505132675171, -0.7797710299491882, -0.7514916062355042, -0.7232121825218201, -0.694932758808136, -0.6666532754898071, -0.638373851776123, -0.610094428062439, -0.5818150043487549, -0.553535521030426, -0.5252560973167419, -0.49697667360305786, -0.4686972498893738, -0.4404177963733673, -0.4121384024620056, -0.38385897874832153, -0.35557952523231506, -0.327300101518631, -0.2990206480026245, -0.27074122428894043, -0.24246178567409515, -0.21418234705924988, -0.1859028935432434, -0.15762345492839813, -0.12934401631355286, -0.10106458514928818, -0.0727851465344429, -0.04450571537017822, -0.016226276755332947, 0.012053161859512329, 0.040332600474357605, 0.06861203908920288, 0.09689147770404816, 0.12517091631889343, 0.15345034003257751, 0.1817297786474228, 0.21000921726226807, 0.23828865587711334, 0.2665680944919586, 0.2948475182056427, 0.32312697172164917, 0.35140639543533325, 0.3796858489513397, 0.4079652726650238, 0.4362447261810303, 0.46452414989471436, 0.49280357360839844, 0.5210829973220825, 0.5493624210357666, 0.5776419043540955, 0.6059213280677795, 0.6342007517814636, 0.6624801754951477, 0.6907596588134766, 0.7190390825271606]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 8.0, 5.0, 6.0, 22.0, 21.0, 21.0, 27.0, 43.0, 28.0, 42.0, 35.0, 43.0, 51.0, 54.0, 55.0, 56.0, 52.0, 48.0, 38.0, 43.0, 46.0, 41.0, 27.0, 38.0, 20.0, 23.0, 17.0, 13.0, 15.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.510971188545227, -0.49620920419692993, -0.4814472198486328, -0.4666852355003357, -0.4519232511520386, -0.43716126680374146, -0.42239928245544434, -0.4076372981071472, -0.3928753137588501, -0.378113329410553, -0.36335134506225586, -0.34858936071395874, -0.3338273763656616, -0.3190653920173645, -0.3043034076690674, -0.28954142332077026, -0.27477943897247314, -0.260017454624176, -0.2452554702758789, -0.2304934859275818, -0.21573150157928467, -0.20096951723098755, -0.18620753288269043, -0.1714455485343933, -0.1566835641860962, -0.14192157983779907, -0.12715959548950195, -0.11239761114120483, -0.09763562679290771, -0.0828736424446106, -0.06811165809631348, -0.05334967374801636, -0.03858768939971924, -0.02382570505142212, -0.009063720703125, 0.005698263645172119, 0.02046024799346924, 0.03522223234176636, 0.04998421669006348, 0.0647462010383606, 0.07950818538665771, 0.09427016973495483, 0.10903215408325195, 0.12379413843154907, 0.1385561227798462, 0.1533181071281433, 0.16808009147644043, 0.18284207582473755, 0.19760406017303467, 0.2123660445213318, 0.2271280288696289, 0.24189001321792603, 0.25665199756622314, 0.27141398191452026, 0.2861759662628174, 0.3009379506111145, 0.3156999349594116, 0.33046191930770874, 0.34522390365600586, 0.359985888004303, 0.3747478723526001, 0.3895098567008972, 0.40427184104919434, 0.41903382539749146, 0.4337958097457886]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 19.0, 28.0, 43.0, 57.0, 88.0, 119.0, 193.0, 299.0, 498.0, 850.0, 1458.0, 2708.0, 5178.0, 10694.0, 24983.0, 65598.0, 200869.0, 425952.0, 197335.0, 64584.0, 24813.0, 10737.0, 4995.0, 2709.0, 1434.0, 796.0, 528.0, 317.0, 208.0, 130.0, 83.0, 60.0, 42.0, 26.0, 27.0, 12.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.09173583984375, -0.08899688720703125, -0.0862579345703125, -0.08351898193359375, -0.080780029296875, -0.07804107666015625, -0.0753021240234375, -0.07256317138671875, -0.06982421875, -0.06708526611328125, -0.0643463134765625, -0.06160736083984375, -0.058868408203125, -0.05612945556640625, -0.0533905029296875, -0.05065155029296875, -0.04791259765625, -0.04517364501953125, -0.0424346923828125, -0.03969573974609375, -0.036956787109375, -0.03421783447265625, -0.0314788818359375, -0.02873992919921875, -0.0260009765625, -0.02326202392578125, -0.0205230712890625, -0.01778411865234375, -0.015045166015625, -0.01230621337890625, -0.0095672607421875, -0.00682830810546875, -0.00408935546875, -0.00135040283203125, 0.0013885498046875, 0.00412750244140625, 0.006866455078125, 0.00960540771484375, 0.0123443603515625, 0.01508331298828125, 0.017822265625, 0.02056121826171875, 0.0233001708984375, 0.02603912353515625, 0.028778076171875, 0.03151702880859375, 0.0342559814453125, 0.03699493408203125, 0.03973388671875, 0.04247283935546875, 0.0452117919921875, 0.04795074462890625, 0.050689697265625, 0.05342864990234375, 0.0561676025390625, 0.05890655517578125, 0.0616455078125, 0.06438446044921875, 0.0671234130859375, 0.06986236572265625, 0.072601318359375, 0.07534027099609375, 0.0780792236328125, 0.08081817626953125, 0.08355712890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 4.0, 7.0, 4.0, 11.0, 9.0, 23.0, 18.0, 22.0, 31.0, 32.0, 36.0, 42.0, 46.0, 50.0, 59.0, 51.0, 62.0, 65.0, 71.0, 36.0, 45.0, 51.0, 33.0, 29.0, 28.0, 21.0, 25.0, 16.0, 13.0, 15.0, 10.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.32952880859375, -0.3184814453125, -0.30743408203125, -0.29638671875, -0.28533935546875, -0.2742919921875, -0.26324462890625, -0.252197265625, -0.24114990234375, -0.2301025390625, -0.21905517578125, -0.2080078125, -0.19696044921875, -0.1859130859375, -0.17486572265625, -0.163818359375, -0.15277099609375, -0.1417236328125, -0.13067626953125, -0.11962890625, -0.10858154296875, -0.0975341796875, -0.08648681640625, -0.075439453125, -0.06439208984375, -0.0533447265625, -0.04229736328125, -0.03125, -0.02020263671875, -0.0091552734375, 0.00189208984375, 0.012939453125, 0.02398681640625, 0.0350341796875, 0.04608154296875, 0.05712890625, 0.06817626953125, 0.0792236328125, 0.09027099609375, 0.101318359375, 0.11236572265625, 0.1234130859375, 0.13446044921875, 0.1455078125, 0.15655517578125, 0.1676025390625, 0.17864990234375, 0.189697265625, 0.20074462890625, 0.2117919921875, 0.22283935546875, 0.23388671875, 0.24493408203125, 0.2559814453125, 0.26702880859375, 0.278076171875, 0.28912353515625, 0.3001708984375, 0.31121826171875, 0.322265625, 0.33331298828125, 0.3443603515625, 0.35540771484375, 0.366455078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 22.0, 28.0, 45.0, 35.0, 70.0, 93.0, 123.0, 193.0, 284.0, 460.0, 697.0, 1096.0, 1924.0, 3184.0, 5631.0, 10427.0, 19500.0, 39308.0, 83136.0, 188957.0, 322460.0, 197202.0, 86987.0, 40860.0, 20457.0, 10717.0, 5939.0, 3355.0, 1942.0, 1211.0, 724.0, 485.0, 307.0, 197.0, 150.0, 99.0, 78.0, 52.0, 30.0, 14.0, 15.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.05401611328125, -0.052186012268066406, -0.05035591125488281, -0.04852581024169922, -0.046695709228515625, -0.04486560821533203, -0.04303550720214844, -0.041205406188964844, -0.03937530517578125, -0.037545204162597656, -0.03571510314941406, -0.03388500213623047, -0.032054901123046875, -0.03022480010986328, -0.028394699096679688, -0.026564598083496094, -0.0247344970703125, -0.022904396057128906, -0.021074295043945312, -0.01924419403076172, -0.017414093017578125, -0.015583992004394531, -0.013753890991210938, -0.011923789978027344, -0.01009368896484375, -0.008263587951660156, -0.0064334869384765625, -0.004603385925292969, -0.002773284912109375, -0.0009431838989257812, 0.0008869171142578125, 0.0027170181274414062, 0.004547119140625, 0.006377220153808594, 0.008207321166992188, 0.010037422180175781, 0.011867523193359375, 0.013697624206542969, 0.015527725219726562, 0.017357826232910156, 0.01918792724609375, 0.021018028259277344, 0.022848129272460938, 0.02467823028564453, 0.026508331298828125, 0.02833843231201172, 0.030168533325195312, 0.031998634338378906, 0.0338287353515625, 0.035658836364746094, 0.03748893737792969, 0.03931903839111328, 0.041149139404296875, 0.04297924041748047, 0.04480934143066406, 0.046639442443847656, 0.04846954345703125, 0.050299644470214844, 0.05212974548339844, 0.05395984649658203, 0.055789947509765625, 0.05762004852294922, 0.05945014953613281, 0.061280250549316406, 0.0631103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 14.0, 6.0, 9.0, 13.0, 16.0, 13.0, 18.0, 22.0, 19.0, 17.0, 28.0, 23.0, 34.0, 39.0, 32.0, 32.0, 44.0, 45.0, 48.0, 50.0, 54.0, 40.0, 47.0, 33.0, 32.0, 34.0, 21.0, 36.0, 21.0, 21.0, 22.0, 20.0, 22.0, 14.0, 10.0, 4.0, 9.0, 6.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.523040771484375, -0.50604248046875, -0.489044189453125, -0.4720458984375, -0.455047607421875, -0.43804931640625, -0.421051025390625, -0.404052734375, -0.387054443359375, -0.37005615234375, -0.353057861328125, -0.3360595703125, -0.319061279296875, -0.30206298828125, -0.285064697265625, -0.26806640625, -0.251068115234375, -0.23406982421875, -0.217071533203125, -0.2000732421875, -0.183074951171875, -0.16607666015625, -0.149078369140625, -0.132080078125, -0.115081787109375, -0.09808349609375, -0.081085205078125, -0.0640869140625, -0.047088623046875, -0.03009033203125, -0.013092041015625, 0.00390625, 0.020904541015625, 0.03790283203125, 0.054901123046875, 0.0718994140625, 0.088897705078125, 0.10589599609375, 0.122894287109375, 0.139892578125, 0.156890869140625, 0.17388916015625, 0.190887451171875, 0.2078857421875, 0.224884033203125, 0.24188232421875, 0.258880615234375, 0.27587890625, 0.292877197265625, 0.30987548828125, 0.326873779296875, 0.3438720703125, 0.360870361328125, 0.37786865234375, 0.394866943359375, 0.411865234375, 0.428863525390625, 0.44586181640625, 0.462860107421875, 0.4798583984375, 0.496856689453125, 0.51385498046875, 0.530853271484375, 0.5478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 17.0, 19.0, 25.0, 33.0, 65.0, 112.0, 202.0, 390.0, 721.0, 1561.0, 3669.0, 9399.0, 29132.0, 116315.0, 517442.0, 283745.0, 58674.0, 16482.0, 5946.0, 2287.0, 1077.0, 513.0, 281.0, 189.0, 76.0, 68.0, 33.0, 26.0, 14.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.048828125, -0.04760026931762695, -0.046372413635253906, -0.04514455795288086, -0.04391670227050781, -0.042688846588134766, -0.04146099090576172, -0.04023313522338867, -0.039005279541015625, -0.03777742385864258, -0.03654956817626953, -0.035321712493896484, -0.03409385681152344, -0.03286600112915039, -0.031638145446777344, -0.030410289764404297, -0.02918243408203125, -0.027954578399658203, -0.026726722717285156, -0.02549886703491211, -0.024271011352539062, -0.023043155670166016, -0.02181529998779297, -0.020587444305419922, -0.019359588623046875, -0.018131732940673828, -0.01690387725830078, -0.015676021575927734, -0.014448165893554688, -0.01322031021118164, -0.011992454528808594, -0.010764598846435547, -0.0095367431640625, -0.008308887481689453, -0.007081031799316406, -0.005853176116943359, -0.0046253204345703125, -0.0033974647521972656, -0.0021696090698242188, -0.0009417533874511719, 0.000286102294921875, 0.0015139579772949219, 0.0027418136596679688, 0.003969669342041016, 0.0051975250244140625, 0.006425380706787109, 0.007653236389160156, 0.008881092071533203, 0.01010894775390625, 0.011336803436279297, 0.012564659118652344, 0.01379251480102539, 0.015020370483398438, 0.016248226165771484, 0.01747608184814453, 0.018703937530517578, 0.019931793212890625, 0.021159648895263672, 0.02238750457763672, 0.023615360260009766, 0.024843215942382812, 0.02607107162475586, 0.027298927307128906, 0.028526782989501953, 0.029754638671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 8.0, 10.0, 16.0, 24.0, 40.0, 62.0, 98.0, 107.0, 136.0, 146.0, 111.0, 64.0, 44.0, 33.0, 32.0, 9.0, 12.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.07764858007431e-05, -2.9962509870529175e-05, -2.9148533940315247e-05, -2.833455801010132e-05, -2.752058207988739e-05, -2.6706606149673462e-05, -2.5892630219459534e-05, -2.5078654289245605e-05, -2.4264678359031677e-05, -2.345070242881775e-05, -2.263672649860382e-05, -2.1822750568389893e-05, -2.1008774638175964e-05, -2.0194798707962036e-05, -1.9380822777748108e-05, -1.856684684753418e-05, -1.775287091732025e-05, -1.6938894987106323e-05, -1.6124919056892395e-05, -1.5310943126678467e-05, -1.4496967196464539e-05, -1.368299126625061e-05, -1.2869015336036682e-05, -1.2055039405822754e-05, -1.1241063475608826e-05, -1.0427087545394897e-05, -9.61311161518097e-06, -8.799135684967041e-06, -7.985159754753113e-06, -7.1711838245391846e-06, -6.357207894325256e-06, -5.543231964111328e-06, -4.7292560338974e-06, -3.915280103683472e-06, -3.1013041734695435e-06, -2.2873282432556152e-06, -1.473352313041687e-06, -6.593763828277588e-07, 1.5459954738616943e-07, 9.685754776000977e-07, 1.7825514078140259e-06, 2.596527338027954e-06, 3.4105032682418823e-06, 4.2244791984558105e-06, 5.038455128669739e-06, 5.852431058883667e-06, 6.666406989097595e-06, 7.4803829193115234e-06, 8.294358849525452e-06, 9.10833477973938e-06, 9.922310709953308e-06, 1.0736286640167236e-05, 1.1550262570381165e-05, 1.2364238500595093e-05, 1.3178214430809021e-05, 1.399219036102295e-05, 1.4806166291236877e-05, 1.5620142221450806e-05, 1.6434118151664734e-05, 1.7248094081878662e-05, 1.806207001209259e-05, 1.887604594230652e-05, 1.9690021872520447e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 6.0, 13.0, 24.0, 28.0, 31.0, 59.0, 88.0, 143.0, 229.0, 377.0, 568.0, 983.0, 1588.0, 2869.0, 5558.0, 11076.0, 23334.0, 53624.0, 136157.0, 323894.0, 287083.0, 114624.0, 45520.0, 20048.0, 9336.0, 4809.0, 2685.0, 1522.0, 845.0, 539.0, 322.0, 208.0, 124.0, 90.0, 56.0, 33.0, 23.0, 15.0, 11.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244140625, -0.02369403839111328, -0.022974014282226562, -0.022253990173339844, -0.021533966064453125, -0.020813941955566406, -0.020093917846679688, -0.01937389373779297, -0.01865386962890625, -0.01793384552001953, -0.017213821411132812, -0.016493797302246094, -0.015773773193359375, -0.015053749084472656, -0.014333724975585938, -0.013613700866699219, -0.0128936767578125, -0.012173652648925781, -0.011453628540039062, -0.010733604431152344, -0.010013580322265625, -0.009293556213378906, -0.008573532104492188, -0.007853507995605469, -0.00713348388671875, -0.006413459777832031, -0.0056934356689453125, -0.004973411560058594, -0.004253387451171875, -0.0035333633422851562, -0.0028133392333984375, -0.0020933151245117188, -0.001373291015625, -0.0006532669067382812, 6.67572021484375e-05, 0.0007867813110351562, 0.001506805419921875, 0.0022268295288085938, 0.0029468536376953125, 0.0036668777465820312, 0.00438690185546875, 0.005106925964355469, 0.0058269500732421875, 0.006546974182128906, 0.007266998291015625, 0.007987022399902344, 0.008707046508789062, 0.009427070617675781, 0.0101470947265625, 0.010867118835449219, 0.011587142944335938, 0.012307167053222656, 0.013027191162109375, 0.013747215270996094, 0.014467239379882812, 0.015187263488769531, 0.01590728759765625, 0.01662731170654297, 0.017347335815429688, 0.018067359924316406, 0.018787384033203125, 0.019507408142089844, 0.020227432250976562, 0.02094745635986328, 0.02166748046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 3.0, 13.0, 14.0, 15.0, 10.0, 15.0, 22.0, 34.0, 28.0, 37.0, 42.0, 46.0, 47.0, 54.0, 60.0, 67.0, 64.0, 44.0, 48.0, 57.0, 48.0, 31.0, 36.0, 27.0, 24.0, 16.0, 14.0, 18.0, 11.0, 13.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0079498291015625, -0.007714807987213135, -0.0074797868728637695, -0.007244765758514404, -0.007009744644165039, -0.006774723529815674, -0.006539702415466309, -0.006304681301116943, -0.006069660186767578, -0.005834639072418213, -0.005599617958068848, -0.005364596843719482, -0.005129575729370117, -0.004894554615020752, -0.004659533500671387, -0.0044245123863220215, -0.004189491271972656, -0.003954470157623291, -0.0037194490432739258, -0.0034844279289245605, -0.0032494068145751953, -0.00301438570022583, -0.002779364585876465, -0.0025443434715270996, -0.0023093223571777344, -0.002074301242828369, -0.001839280128479004, -0.0016042590141296387, -0.0013692378997802734, -0.0011342167854309082, -0.000899195671081543, -0.0006641745567321777, -0.0004291534423828125, -0.00019413232803344727, 4.088878631591797e-05, 0.0002759099006652832, 0.0005109310150146484, 0.0007459521293640137, 0.000980973243713379, 0.0012159943580627441, 0.0014510154724121094, 0.0016860365867614746, 0.0019210577011108398, 0.002156078815460205, 0.0023910999298095703, 0.0026261210441589355, 0.0028611421585083008, 0.003096163272857666, 0.0033311843872070312, 0.0035662055015563965, 0.0038012266159057617, 0.004036247730255127, 0.004271268844604492, 0.004506289958953857, 0.004741311073303223, 0.004976332187652588, 0.005211353302001953, 0.005446374416351318, 0.005681395530700684, 0.005916416645050049, 0.006151437759399414, 0.006386458873748779, 0.0066214799880981445, 0.00685650110244751, 0.007091522216796875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 4.0, 4.0, 4.0, 12.0, 24.0, 38.0, 89.0, 145.0, 236.0, 191.0, 105.0, 63.0, 41.0, 19.0, 11.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2030118703842163, -1.174246072769165, -1.1454803943634033, -1.1167147159576416, -1.0879489183425903, -1.059183120727539, -1.0304174423217773, -1.0016517639160156, -0.9728859663009644, -0.9441202282905579, -0.9153544902801514, -0.8865887522697449, -0.8578230142593384, -0.8290572762489319, -0.8002915382385254, -0.7715258002281189, -0.7427600622177124, -0.7139943242073059, -0.6852285861968994, -0.6564628481864929, -0.6276971101760864, -0.5989313721656799, -0.5701656341552734, -0.5413998961448669, -0.5126341581344604, -0.48386842012405396, -0.45510268211364746, -0.42633694410324097, -0.3975712060928345, -0.368805468082428, -0.3400397300720215, -0.311273992061615, -0.2825081944465637, -0.2537424564361572, -0.22497671842575073, -0.19621098041534424, -0.16744524240493774, -0.13867950439453125, -0.10991376638412476, -0.08114802837371826, -0.05238229036331177, -0.023616552352905273, 0.005149185657501221, 0.033914923667907715, 0.06268066167831421, 0.0914463996887207, 0.1202121376991272, 0.1489778757095337, 0.17774361371994019, 0.20650935173034668, 0.23527508974075317, 0.26404082775115967, 0.29280656576156616, 0.32157230377197266, 0.35033804178237915, 0.37910377979278564, 0.40786951780319214, 0.43663525581359863, 0.4654009938240051, 0.4941667318344116, 0.5229324698448181, 0.5516982078552246, 0.5804639458656311, 0.6092296838760376, 0.6379954218864441]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 20.0, 17.0, 29.0, 30.0, 28.0, 41.0, 35.0, 42.0, 48.0, 53.0, 52.0, 62.0, 68.0, 37.0, 55.0, 43.0, 43.0, 50.0, 25.0, 37.0, 29.0, 23.0, 16.0, 15.0, 10.0, 6.0, 10.0, 12.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3230491578578949, -0.31289345026016235, -0.3027377128601074, -0.2925819754600525, -0.28242626786231995, -0.2722705602645874, -0.26211482286453247, -0.25195908546447754, -0.241803377866745, -0.23164765536785126, -0.22149193286895752, -0.21133621037006378, -0.20118048787117004, -0.1910247653722763, -0.18086904287338257, -0.17071332037448883, -0.1605575978755951, -0.15040187537670135, -0.14024615287780762, -0.13009043037891388, -0.11993470788002014, -0.1097789853811264, -0.09962326288223267, -0.08946754038333893, -0.07931181788444519, -0.06915609538555145, -0.059000372886657715, -0.04884465038776398, -0.03868892788887024, -0.0285332053899765, -0.018377482891082764, -0.008221760392189026, 0.0019339919090270996, 0.012089714407920837, 0.022245436906814575, 0.03240115940570831, 0.04255688190460205, 0.05271260440349579, 0.06286832690238953, 0.07302404940128326, 0.083179771900177, 0.09333549439907074, 0.10349121689796448, 0.11364693939685822, 0.12380266189575195, 0.1339583843946457, 0.14411410689353943, 0.15426982939243317, 0.1644255518913269, 0.17458127439022064, 0.18473699688911438, 0.19489271938800812, 0.20504844188690186, 0.2152041643857956, 0.22535988688468933, 0.23551560938358307, 0.2456713318824768, 0.25582706928253174, 0.2659827768802643, 0.2761384844779968, 0.28629422187805176, 0.2964499592781067, 0.30660566687583923, 0.3167613744735718, 0.3269171118736267]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 12.0, 17.0, 18.0, 27.0, 42.0, 52.0, 65.0, 101.0, 143.0, 228.0, 412.0, 591.0, 947.0, 1690.0, 3206.0, 6810.0, 20802.0, 166446.0, 761878.0, 61500.0, 12616.0, 4857.0, 2511.0, 1321.0, 789.0, 480.0, 301.0, 210.0, 134.0, 92.0, 76.0, 45.0, 29.0, 16.0, 19.0, 18.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.358154296875, -0.3467140197753906, -0.33527374267578125, -0.3238334655761719, -0.3123931884765625, -0.3009529113769531, -0.28951263427734375, -0.2780723571777344, -0.266632080078125, -0.2551918029785156, -0.24375152587890625, -0.23231124877929688, -0.2208709716796875, -0.20943069458007812, -0.19799041748046875, -0.18655014038085938, -0.17510986328125, -0.16366958618164062, -0.15222930908203125, -0.14078903198242188, -0.1293487548828125, -0.11790847778320312, -0.10646820068359375, -0.09502792358398438, -0.083587646484375, -0.07214736938476562, -0.06070709228515625, -0.049266815185546875, -0.0378265380859375, -0.026386260986328125, -0.01494598388671875, -0.003505706787109375, 0.0079345703125, 0.019374847412109375, 0.03081512451171875, 0.042255401611328125, 0.0536956787109375, 0.06513595581054688, 0.07657623291015625, 0.08801651000976562, 0.099456787109375, 0.11089706420898438, 0.12233734130859375, 0.13377761840820312, 0.1452178955078125, 0.15665817260742188, 0.16809844970703125, 0.17953872680664062, 0.19097900390625, 0.20241928100585938, 0.21385955810546875, 0.22529983520507812, 0.2367401123046875, 0.24818038940429688, 0.25962066650390625, 0.2710609436035156, 0.282501220703125, 0.2939414978027344, 0.30538177490234375, 0.3168220520019531, 0.3282623291015625, 0.3397026062011719, 0.35114288330078125, 0.3625831604003906, 0.3740234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 9.0, 8.0, 11.0, 12.0, 22.0, 33.0, 36.0, 32.0, 44.0, 64.0, 47.0, 56.0, 51.0, 76.0, 68.0, 58.0, 59.0, 49.0, 54.0, 38.0, 36.0, 28.0, 18.0, 21.0, 12.0, 9.0, 13.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.7150039672851562, -0.6917266845703125, -0.6684494018554688, -0.645172119140625, -0.6218948364257812, -0.5986175537109375, -0.5753402709960938, -0.55206298828125, -0.5287857055664062, -0.5055084228515625, -0.48223114013671875, -0.458953857421875, -0.43567657470703125, -0.4123992919921875, -0.38912200927734375, -0.3658447265625, -0.34256744384765625, -0.3192901611328125, -0.29601287841796875, -0.272735595703125, -0.24945831298828125, -0.2261810302734375, -0.20290374755859375, -0.17962646484375, -0.15634918212890625, -0.1330718994140625, -0.10979461669921875, -0.086517333984375, -0.06324005126953125, -0.0399627685546875, -0.01668548583984375, 0.006591796875, 0.02986907958984375, 0.0531463623046875, 0.07642364501953125, 0.099700927734375, 0.12297821044921875, 0.1462554931640625, 0.16953277587890625, 0.19281005859375, 0.21608734130859375, 0.2393646240234375, 0.26264190673828125, 0.285919189453125, 0.30919647216796875, 0.3324737548828125, 0.35575103759765625, 0.3790283203125, 0.40230560302734375, 0.4255828857421875, 0.44886016845703125, 0.472137451171875, 0.49541473388671875, 0.5186920166015625, 0.5419692993164062, 0.56524658203125, 0.5885238647460938, 0.6118011474609375, 0.6350784301757812, 0.658355712890625, 0.6816329956054688, 0.7049102783203125, 0.7281875610351562, 0.75146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 9.0, 7.0, 8.0, 21.0, 28.0, 55.0, 115.0, 266.0, 812.0, 3481.0, 67036.0, 965316.0, 9074.0, 1501.0, 478.0, 178.0, 86.0, 36.0, 22.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0540008544921875, -1.019134521484375, -0.9842681884765625, -0.94940185546875, -0.9145355224609375, -0.879669189453125, -0.8448028564453125, -0.8099365234375, -0.7750701904296875, -0.740203857421875, -0.7053375244140625, -0.67047119140625, -0.6356048583984375, -0.600738525390625, -0.5658721923828125, -0.531005859375, -0.4961395263671875, -0.461273193359375, -0.4264068603515625, -0.39154052734375, -0.3566741943359375, -0.321807861328125, -0.2869415283203125, -0.2520751953125, -0.2172088623046875, -0.182342529296875, -0.1474761962890625, -0.11260986328125, -0.0777435302734375, -0.042877197265625, -0.0080108642578125, 0.02685546875, 0.0617218017578125, 0.096588134765625, 0.1314544677734375, 0.16632080078125, 0.2011871337890625, 0.236053466796875, 0.2709197998046875, 0.3057861328125, 0.3406524658203125, 0.375518798828125, 0.4103851318359375, 0.44525146484375, 0.4801177978515625, 0.514984130859375, 0.5498504638671875, 0.584716796875, 0.6195831298828125, 0.654449462890625, 0.6893157958984375, 0.72418212890625, 0.7590484619140625, 0.793914794921875, 0.8287811279296875, 0.8636474609375, 0.8985137939453125, 0.933380126953125, 0.9682464599609375, 1.00311279296875, 1.0379791259765625, 1.072845458984375, 1.1077117919921875, 1.142578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 8.0, 8.0, 12.0, 15.0, 19.0, 24.0, 15.0, 27.0, 28.0, 32.0, 33.0, 31.0, 39.0, 34.0, 29.0, 55.0, 42.0, 50.0, 38.0, 44.0, 48.0, 37.0, 43.0, 35.0, 30.0, 13.0, 36.0, 19.0, 20.0, 24.0, 18.0, 8.0, 9.0, 6.0, 5.0, 8.0, 7.0, 4.0, 3.0, 9.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5345077514648438, -0.5157928466796875, -0.49707794189453125, -0.478363037109375, -0.45964813232421875, -0.4409332275390625, -0.42221832275390625, -0.40350341796875, -0.38478851318359375, -0.3660736083984375, -0.34735870361328125, -0.328643798828125, -0.30992889404296875, -0.2912139892578125, -0.27249908447265625, -0.2537841796875, -0.23506927490234375, -0.2163543701171875, -0.19763946533203125, -0.178924560546875, -0.16020965576171875, -0.1414947509765625, -0.12277984619140625, -0.10406494140625, -0.08535003662109375, -0.0666351318359375, -0.04792022705078125, -0.029205322265625, -0.01049041748046875, 0.0082244873046875, 0.02693939208984375, 0.045654296875, 0.06436920166015625, 0.0830841064453125, 0.10179901123046875, 0.120513916015625, 0.13922882080078125, 0.1579437255859375, 0.17665863037109375, 0.19537353515625, 0.21408843994140625, 0.2328033447265625, 0.25151824951171875, 0.270233154296875, 0.28894805908203125, 0.3076629638671875, 0.32637786865234375, 0.3450927734375, 0.36380767822265625, 0.3825225830078125, 0.40123748779296875, 0.419952392578125, 0.43866729736328125, 0.4573822021484375, 0.47609710693359375, 0.49481201171875, 0.5135269165039062, 0.5322418212890625, 0.5509567260742188, 0.569671630859375, 0.5883865356445312, 0.6071014404296875, 0.6258163452148438, 0.64453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 24.0, 34.0, 83.0, 230.0, 674.0, 3352.0, 118792.0, 914863.0, 8783.0, 1133.0, 331.0, 124.0, 48.0, 30.0, 17.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24860382080078125, -0.2403717041015625, -0.23213958740234375, -0.223907470703125, -0.21567535400390625, -0.2074432373046875, -0.19921112060546875, -0.19097900390625, -0.18274688720703125, -0.1745147705078125, -0.16628265380859375, -0.158050537109375, -0.14981842041015625, -0.1415863037109375, -0.13335418701171875, -0.1251220703125, -0.11688995361328125, -0.1086578369140625, -0.10042572021484375, -0.092193603515625, -0.08396148681640625, -0.0757293701171875, -0.06749725341796875, -0.05926513671875, -0.05103302001953125, -0.0428009033203125, -0.03456878662109375, -0.026336669921875, -0.01810455322265625, -0.0098724365234375, -0.00164031982421875, 0.006591796875, 0.01482391357421875, 0.0230560302734375, 0.03128814697265625, 0.039520263671875, 0.04775238037109375, 0.0559844970703125, 0.06421661376953125, 0.07244873046875, 0.08068084716796875, 0.0889129638671875, 0.09714508056640625, 0.105377197265625, 0.11360931396484375, 0.1218414306640625, 0.13007354736328125, 0.1383056640625, 0.14653778076171875, 0.1547698974609375, 0.16300201416015625, 0.171234130859375, 0.17946624755859375, 0.1876983642578125, 0.19593048095703125, 0.20416259765625, 0.21239471435546875, 0.2206268310546875, 0.22885894775390625, 0.237091064453125, 0.24532318115234375, 0.2535552978515625, 0.26178741455078125, 0.27001953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 4.0, 2.0, 9.0, 16.0, 34.0, 31.0, 95.0, 178.0, 266.0, 163.0, 75.0, 55.0, 31.0, 13.0, 11.0, 10.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8505921363830566e-05, -2.7745962142944336e-05, -2.6986002922058105e-05, -2.6226043701171875e-05, -2.5466084480285645e-05, -2.4706125259399414e-05, -2.3946166038513184e-05, -2.3186206817626953e-05, -2.2426247596740723e-05, -2.1666288375854492e-05, -2.0906329154968262e-05, -2.014636993408203e-05, -1.93864107131958e-05, -1.862645149230957e-05, -1.786649227142334e-05, -1.710653305053711e-05, -1.634657382965088e-05, -1.558661460876465e-05, -1.4826655387878418e-05, -1.4066696166992188e-05, -1.3306736946105957e-05, -1.2546777725219727e-05, -1.1786818504333496e-05, -1.1026859283447266e-05, -1.0266900062561035e-05, -9.506940841674805e-06, -8.746981620788574e-06, -7.987022399902344e-06, -7.227063179016113e-06, -6.467103958129883e-06, -5.707144737243652e-06, -4.947185516357422e-06, -4.187226295471191e-06, -3.427267074584961e-06, -2.6673078536987305e-06, -1.9073486328125e-06, -1.1473894119262695e-06, -3.8743019104003906e-07, 3.725290298461914e-07, 1.1324882507324219e-06, 1.8924474716186523e-06, 2.652406692504883e-06, 3.4123659133911133e-06, 4.172325134277344e-06, 4.932284355163574e-06, 5.692243576049805e-06, 6.452202796936035e-06, 7.212162017822266e-06, 7.972121238708496e-06, 8.732080459594727e-06, 9.492039680480957e-06, 1.0251998901367188e-05, 1.1011958122253418e-05, 1.1771917343139648e-05, 1.2531876564025879e-05, 1.329183578491211e-05, 1.405179500579834e-05, 1.481175422668457e-05, 1.55717134475708e-05, 1.633167266845703e-05, 1.7091631889343262e-05, 1.7851591110229492e-05, 1.8611550331115723e-05, 1.9371509552001953e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 8.0, 11.0, 25.0, 38.0, 61.0, 129.0, 209.0, 443.0, 969.0, 2794.0, 12670.0, 356866.0, 653338.0, 15736.0, 3187.0, 1107.0, 429.0, 219.0, 127.0, 81.0, 45.0, 19.0, 19.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376708984375, -0.2317371368408203, -0.22580337524414062, -0.21986961364746094, -0.21393585205078125, -0.20800209045410156, -0.20206832885742188, -0.1961345672607422, -0.1902008056640625, -0.1842670440673828, -0.17833328247070312, -0.17239952087402344, -0.16646575927734375, -0.16053199768066406, -0.15459823608398438, -0.1486644744873047, -0.142730712890625, -0.1367969512939453, -0.13086318969726562, -0.12492942810058594, -0.11899566650390625, -0.11306190490722656, -0.10712814331054688, -0.10119438171386719, -0.0952606201171875, -0.08932685852050781, -0.08339309692382812, -0.07745933532714844, -0.07152557373046875, -0.06559181213378906, -0.059658050537109375, -0.05372428894042969, -0.04779052734375, -0.04185676574707031, -0.035923004150390625, -0.029989242553710938, -0.02405548095703125, -0.018121719360351562, -0.012187957763671875, -0.0062541961669921875, -0.0003204345703125, 0.0056133270263671875, 0.011547088623046875, 0.017480850219726562, 0.02341461181640625, 0.029348373413085938, 0.035282135009765625, 0.04121589660644531, 0.047149658203125, 0.05308341979980469, 0.059017181396484375, 0.06495094299316406, 0.07088470458984375, 0.07681846618652344, 0.08275222778320312, 0.08868598937988281, 0.0946197509765625, 0.10055351257324219, 0.10648727416992188, 0.11242103576660156, 0.11835479736328125, 0.12428855895996094, 0.13022232055664062, 0.1361560821533203, 0.14208984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 4.0, 9.0, 4.0, 7.0, 21.0, 27.0, 24.0, 38.0, 45.0, 69.0, 76.0, 149.0, 160.0, 91.0, 74.0, 55.0, 42.0, 26.0, 13.0, 15.0, 9.0, 8.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02728271484375, -0.0260467529296875, -0.024810791015625, -0.0235748291015625, -0.0223388671875, -0.0211029052734375, -0.019866943359375, -0.0186309814453125, -0.01739501953125, -0.0161590576171875, -0.014923095703125, -0.0136871337890625, -0.012451171875, -0.0112152099609375, -0.009979248046875, -0.0087432861328125, -0.00750732421875, -0.0062713623046875, -0.005035400390625, -0.0037994384765625, -0.0025634765625, -0.0013275146484375, -9.1552734375e-05, 0.0011444091796875, 0.00238037109375, 0.0036163330078125, 0.004852294921875, 0.0060882568359375, 0.00732421875, 0.0085601806640625, 0.009796142578125, 0.0110321044921875, 0.01226806640625, 0.0135040283203125, 0.014739990234375, 0.0159759521484375, 0.0172119140625, 0.0184478759765625, 0.019683837890625, 0.0209197998046875, 0.02215576171875, 0.0233917236328125, 0.024627685546875, 0.0258636474609375, 0.027099609375, 0.0283355712890625, 0.029571533203125, 0.0308074951171875, 0.03204345703125, 0.0332794189453125, 0.034515380859375, 0.0357513427734375, 0.0369873046875, 0.0382232666015625, 0.039459228515625, 0.0406951904296875, 0.04193115234375, 0.0431671142578125, 0.044403076171875, 0.0456390380859375, 0.046875, 0.0481109619140625, 0.049346923828125, 0.0505828857421875, 0.05181884765625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 1.0, 7.0, 15.0, 13.0, 37.0, 83.0, 137.0, 203.0, 207.0, 113.0, 72.0, 50.0, 23.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4265085458755493, -1.3737664222717285, -1.3210242986679077, -1.268282175064087, -1.2155400514602661, -1.1627979278564453, -1.110055685043335, -1.0573135614395142, -1.0045714378356934, -0.9518293142318726, -0.8990871906280518, -0.846345067024231, -0.7936028838157654, -0.7408607602119446, -0.6881186366081238, -0.6353764533996582, -0.5826343894004822, -0.5298922657966614, -0.4771501123905182, -0.4244079887866974, -0.3716658353805542, -0.3189237117767334, -0.2661815881729126, -0.2134394347667694, -0.1606973111629486, -0.10795517265796661, -0.055213041603565216, -0.0024709105491638184, 0.050271227955818176, 0.10301336646080017, 0.15575549006462097, 0.20849764347076416, 0.26123976707458496, 0.31398189067840576, 0.36672404408454895, 0.41946616768836975, 0.47220832109451294, 0.5249504446983337, 0.5776925683021545, 0.6304347515106201, 0.6831768751144409, 0.7359189987182617, 0.7886611223220825, 0.8414032459259033, 0.8941454291343689, 0.9468875527381897, 0.9996296763420105, 1.052371859550476, 1.1051139831542969, 1.1578561067581177, 1.2105982303619385, 1.2633403539657593, 1.31608247756958, 1.3688247203826904, 1.4215667247772217, 1.474308967590332, 1.5270509719848633, 1.579793095588684, 1.6325352191925049, 1.6852773427963257, 1.7380194664001465, 1.7907617092132568, 1.843503713607788, 1.8962459564208984, 1.9489880800247192]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 13.0, 3.0, 9.0, 11.0, 11.0, 9.0, 16.0, 10.0, 14.0, 16.0, 11.0, 28.0, 21.0, 22.0, 28.0, 22.0, 25.0, 32.0, 45.0, 29.0, 35.0, 34.0, 37.0, 31.0, 41.0, 40.0, 35.0, 28.0, 31.0, 32.0, 24.0, 29.0, 40.0, 30.0, 16.0, 20.0, 11.0, 18.0, 12.0, 14.0, 7.0, 16.0, 19.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8438077569007874, -0.815995991230011, -0.7881841659545898, -0.7603724002838135, -0.7325605750083923, -0.704748809337616, -0.6769369840621948, -0.6491252183914185, -0.6213134527206421, -0.5935016870498657, -0.5656898617744446, -0.5378780961036682, -0.5100662708282471, -0.4822545051574707, -0.45444270968437195, -0.4266309142112732, -0.39881908893585205, -0.3710072934627533, -0.34319549798965454, -0.3153837323188782, -0.28757190704345703, -0.25976014137268066, -0.2319483458995819, -0.20413655042648315, -0.1763247549533844, -0.14851295948028564, -0.12070117145776749, -0.09288938343524933, -0.06507758796215057, -0.03726579248905182, -0.009454011917114258, 0.018357783555984497, 0.04616951942443848, 0.07398131489753723, 0.10179310292005539, 0.12960489094257355, 0.1574166864156723, 0.18522848188877106, 0.21304026246070862, 0.24085205793380737, 0.26866385340690613, 0.2964756488800049, 0.32428744435310364, 0.3520992398262024, 0.37991100549697876, 0.4077228307723999, 0.43553459644317627, 0.463346391916275, 0.4911581873893738, 0.5189699530601501, 0.5467817783355713, 0.5745935440063477, 0.6024053692817688, 0.6302171349525452, 0.6580289602279663, 0.6858407258987427, 0.713652491569519, 0.7414642572402954, 0.7692760825157166, 0.7970878481864929, 0.8248996734619141, 0.8527114391326904, 0.8805232048034668, 0.9083350300788879, 0.9361468553543091]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 16.0, 11.0, 16.0, 22.0, 19.0, 29.0, 35.0, 36.0, 46.0, 67.0, 126.0, 153.0, 243.0, 422.0, 650.0, 1095.0, 2235.0, 5718.0, 31711.0, 1835508.0, 2266340.0, 38438.0, 5955.0, 2293.0, 1201.0, 664.0, 397.0, 214.0, 184.0, 107.0, 82.0, 48.0, 53.0, 30.0, 28.0, 16.0, 20.0, 12.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9358444213867188, -0.9024505615234375, -0.8690567016601562, -0.835662841796875, -0.8022689819335938, -0.7688751220703125, -0.7354812622070312, -0.70208740234375, -0.6686935424804688, -0.6352996826171875, -0.6019058227539062, -0.568511962890625, -0.5351181030273438, -0.5017242431640625, -0.46833038330078125, -0.4349365234375, -0.40154266357421875, -0.3681488037109375, -0.33475494384765625, -0.301361083984375, -0.26796722412109375, -0.2345733642578125, -0.20117950439453125, -0.16778564453125, -0.13439178466796875, -0.1009979248046875, -0.06760406494140625, -0.034210205078125, -0.00081634521484375, 0.0325775146484375, 0.06597137451171875, 0.099365234375, 0.13275909423828125, 0.1661529541015625, 0.19954681396484375, 0.232940673828125, 0.26633453369140625, 0.2997283935546875, 0.33312225341796875, 0.36651611328125, 0.39990997314453125, 0.4333038330078125, 0.46669769287109375, 0.500091552734375, 0.5334854125976562, 0.5668792724609375, 0.6002731323242188, 0.6336669921875, 0.6670608520507812, 0.7004547119140625, 0.7338485717773438, 0.767242431640625, 0.8006362915039062, 0.8340301513671875, 0.8674240112304688, 0.90081787109375, 0.9342117309570312, 0.9676055908203125, 1.0009994506835938, 1.034393310546875, 1.0677871704101562, 1.1011810302734375, 1.1345748901367188, 1.16796875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 7.0, 14.0, 14.0, 17.0, 19.0, 26.0, 24.0, 23.0, 34.0, 45.0, 41.0, 62.0, 53.0, 52.0, 50.0, 51.0, 53.0, 68.0, 48.0, 46.0, 42.0, 41.0, 19.0, 32.0, 26.0, 12.0, 17.0, 8.0, 9.0, 11.0, 3.0, 8.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3283653259277344, -0.31664276123046875, -0.3049201965332031, -0.2931976318359375, -0.2814750671386719, -0.26975250244140625, -0.2580299377441406, -0.246307373046875, -0.23458480834960938, -0.22286224365234375, -0.21113967895507812, -0.1994171142578125, -0.18769454956054688, -0.17597198486328125, -0.16424942016601562, -0.15252685546875, -0.14080429077148438, -0.12908172607421875, -0.11735916137695312, -0.1056365966796875, -0.09391403198242188, -0.08219146728515625, -0.07046890258789062, -0.058746337890625, -0.047023773193359375, -0.03530120849609375, -0.023578643798828125, -0.0118560791015625, -0.000133514404296875, 0.01158905029296875, 0.023311614990234375, 0.0350341796875, 0.046756744384765625, 0.05847930908203125, 0.07020187377929688, 0.0819244384765625, 0.09364700317382812, 0.10536956787109375, 0.11709213256835938, 0.128814697265625, 0.14053726196289062, 0.15225982666015625, 0.16398239135742188, 0.1757049560546875, 0.18742752075195312, 0.19915008544921875, 0.21087265014648438, 0.22259521484375, 0.23431777954101562, 0.24604034423828125, 0.2577629089355469, 0.2694854736328125, 0.2812080383300781, 0.29293060302734375, 0.3046531677246094, 0.316375732421875, 0.3280982971191406, 0.33982086181640625, 0.3515434265136719, 0.3632659912109375, 0.3749885559082031, 0.38671112060546875, 0.3984336853027344, 0.41015625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 15.0, 23.0, 45.0, 45.0, 81.0, 147.0, 250.0, 543.0, 1119.0, 2638.0, 8344.0, 44778.0, 3008414.0, 1086484.0, 30774.0, 6609.0, 2135.0, 862.0, 412.0, 232.0, 105.0, 67.0, 42.0, 28.0, 22.0, 16.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9650344848632812, -0.9373931884765625, -0.9097518920898438, -0.882110595703125, -0.8544692993164062, -0.8268280029296875, -0.7991867065429688, -0.77154541015625, -0.7439041137695312, -0.7162628173828125, -0.6886215209960938, -0.660980224609375, -0.6333389282226562, -0.6056976318359375, -0.5780563354492188, -0.5504150390625, -0.5227737426757812, -0.4951324462890625, -0.46749114990234375, -0.439849853515625, -0.41220855712890625, -0.3845672607421875, -0.35692596435546875, -0.32928466796875, -0.30164337158203125, -0.2740020751953125, -0.24636077880859375, -0.218719482421875, -0.19107818603515625, -0.1634368896484375, -0.13579559326171875, -0.108154296875, -0.08051300048828125, -0.0528717041015625, -0.02523040771484375, 0.002410888671875, 0.03005218505859375, 0.0576934814453125, 0.08533477783203125, 0.11297607421875, 0.14061737060546875, 0.1682586669921875, 0.19589996337890625, 0.223541259765625, 0.25118255615234375, 0.2788238525390625, 0.30646514892578125, 0.3341064453125, 0.36174774169921875, 0.3893890380859375, 0.41703033447265625, 0.444671630859375, 0.47231292724609375, 0.4999542236328125, 0.5275955200195312, 0.55523681640625, 0.5828781127929688, 0.6105194091796875, 0.6381607055664062, 0.665802001953125, 0.6934432983398438, 0.7210845947265625, 0.7487258911132812, 0.7763671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 22.0, 16.0, 15.0, 49.0, 69.0, 157.0, 296.0, 574.0, 988.0, 877.0, 415.0, 241.0, 114.0, 66.0, 37.0, 27.0, 23.0, 15.0, 12.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.1618175506591797, -0.15530014038085938, -0.14878273010253906, -0.14226531982421875, -0.13574790954589844, -0.12923049926757812, -0.12271308898925781, -0.1161956787109375, -0.10967826843261719, -0.10316085815429688, -0.09664344787597656, -0.09012603759765625, -0.08360862731933594, -0.07709121704101562, -0.07057380676269531, -0.064056396484375, -0.05753898620605469, -0.051021575927734375, -0.04450416564941406, -0.03798675537109375, -0.03146934509277344, -0.024951934814453125, -0.018434524536132812, -0.0119171142578125, -0.0053997039794921875, 0.001117706298828125, 0.0076351165771484375, 0.01415252685546875, 0.020669937133789062, 0.027187347412109375, 0.03370475769042969, 0.04022216796875, 0.04673957824707031, 0.053256988525390625, 0.05977439880371094, 0.06629180908203125, 0.07280921936035156, 0.07932662963867188, 0.08584403991699219, 0.0923614501953125, 0.09887886047363281, 0.10539627075195312, 0.11191368103027344, 0.11843109130859375, 0.12494850158691406, 0.13146591186523438, 0.1379833221435547, 0.144500732421875, 0.1510181427001953, 0.15753555297851562, 0.16405296325683594, 0.17057037353515625, 0.17708778381347656, 0.18360519409179688, 0.1901226043701172, 0.1966400146484375, 0.2031574249267578, 0.20967483520507812, 0.21619224548339844, 0.22270965576171875, 0.22922706604003906, 0.23574447631835938, 0.2422618865966797, 0.248779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 10.0, 15.0, 13.0, 44.0, 52.0, 139.0, 189.0, 185.0, 136.0, 92.0, 58.0, 31.0, 15.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4539974927902222, -1.416054368019104, -1.3781112432479858, -1.3401682376861572, -1.302225112915039, -1.264281988143921, -1.2263388633728027, -1.1883957386016846, -1.1504526138305664, -1.1125094890594482, -1.07456636428833, -1.036623239517212, -0.9986801743507385, -0.9607371091842651, -0.922793984413147, -0.8848508596420288, -0.8469077944755554, -0.8089646697044373, -0.7710216045379639, -0.7330784797668457, -0.6951353549957275, -0.6571922302246094, -0.619249165058136, -0.5813060402870178, -0.5433629751205444, -0.5054198503494263, -0.4674767553806305, -0.4295336604118347, -0.39159053564071655, -0.3536474406719208, -0.315704345703125, -0.27776122093200684, -0.23981809616088867, -0.2018749862909317, -0.16393187642097473, -0.12598878145217896, -0.08804567158222198, -0.050102561712265015, -0.012159466743469238, 0.025783658027648926, 0.0637267529964447, 0.10166986286640167, 0.13961297273635864, 0.17755606770515442, 0.2154991775751114, 0.25344228744506836, 0.29138538241386414, 0.3293285071849823, 0.3672716021537781, 0.40521469712257385, 0.443157821893692, 0.4811009168624878, 0.519044041633606, 0.5569871664047241, 0.5949302315711975, 0.6328733563423157, 0.6708164215087891, 0.7087595462799072, 0.7467026114463806, 0.7846457362174988, 0.8225888609886169, 0.8605319261550903, 0.8984750509262085, 0.9364181756973267, 0.9743613004684448]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 9.0, 3.0, 10.0, 11.0, 11.0, 13.0, 10.0, 18.0, 12.0, 20.0, 21.0, 22.0, 29.0, 40.0, 46.0, 41.0, 42.0, 35.0, 39.0, 44.0, 41.0, 34.0, 41.0, 42.0, 45.0, 47.0, 35.0, 35.0, 26.0, 31.0, 23.0, 31.0, 18.0, 11.0, 9.0, 10.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3959617614746094, -0.3849647045135498, -0.37396761775016785, -0.3629705607891083, -0.3519735038280487, -0.34097644686698914, -0.3299793601036072, -0.3189823031425476, -0.30798524618148804, -0.29698818922042847, -0.2859911024570465, -0.27499404549598694, -0.26399698853492737, -0.2529999315738678, -0.24200284481048584, -0.23100578784942627, -0.2200087159872055, -0.20901164412498474, -0.19801458716392517, -0.1870175153017044, -0.17602045834064484, -0.16502338647842407, -0.1540263295173645, -0.14302925765514374, -0.13203218579292297, -0.1210351213812828, -0.11003805696964264, -0.09904098510742188, -0.0880439281463623, -0.07704685628414154, -0.06604979187250137, -0.055052727460861206, -0.044055670499801636, -0.03305860608816147, -0.022061539813876152, -0.011064473539590836, -6.740912795066833e-05, 0.010929655283689499, 0.021926723420619965, 0.03292378783226013, 0.0439208522439003, 0.054917916655540466, 0.06591498106718063, 0.0769120454788208, 0.08790911734104156, 0.09890617430210114, 0.1099032461643219, 0.12090031057596207, 0.13189737498760223, 0.142894446849823, 0.15389150381088257, 0.16488857567310333, 0.1758856326341629, 0.18688270449638367, 0.19787976145744324, 0.208876833319664, 0.21987390518188477, 0.23087097704410553, 0.2418680340051651, 0.25286510586738586, 0.26386216282844543, 0.274859219789505, 0.28585630655288696, 0.29685336351394653, 0.3078504204750061]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 15.0, 23.0, 32.0, 59.0, 102.0, 181.0, 339.0, 677.0, 1483.0, 4088.0, 14162.0, 80342.0, 663418.0, 242384.0, 29971.0, 6967.0, 2318.0, 942.0, 443.0, 218.0, 131.0, 96.0, 44.0, 34.0, 14.0, 14.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.1441783905029297, -0.13857650756835938, -0.13297462463378906, -0.12737274169921875, -0.12177085876464844, -0.11616897583007812, -0.11056709289550781, -0.1049652099609375, -0.09936332702636719, -0.09376144409179688, -0.08815956115722656, -0.08255767822265625, -0.07695579528808594, -0.07135391235351562, -0.06575202941894531, -0.060150146484375, -0.05454826354980469, -0.048946380615234375, -0.04334449768066406, -0.03774261474609375, -0.03214073181152344, -0.026538848876953125, -0.020936965942382812, -0.0153350830078125, -0.009733200073242188, -0.004131317138671875, 0.0014705657958984375, 0.00707244873046875, 0.012674331665039062, 0.018276214599609375, 0.023878097534179688, 0.02947998046875, 0.03508186340332031, 0.040683746337890625, 0.04628562927246094, 0.05188751220703125, 0.05748939514160156, 0.06309127807617188, 0.06869316101074219, 0.0742950439453125, 0.07989692687988281, 0.08549880981445312, 0.09110069274902344, 0.09670257568359375, 0.10230445861816406, 0.10790634155273438, 0.11350822448730469, 0.119110107421875, 0.12471199035644531, 0.13031387329101562, 0.13591575622558594, 0.14151763916015625, 0.14711952209472656, 0.15272140502929688, 0.1583232879638672, 0.1639251708984375, 0.1695270538330078, 0.17512893676757812, 0.18073081970214844, 0.18633270263671875, 0.19193458557128906, 0.19753646850585938, 0.2031383514404297, 0.208740234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 9.0, 7.0, 12.0, 11.0, 14.0, 9.0, 18.0, 30.0, 25.0, 38.0, 48.0, 53.0, 47.0, 54.0, 53.0, 63.0, 55.0, 58.0, 60.0, 43.0, 56.0, 38.0, 32.0, 36.0, 35.0, 28.0, 15.0, 10.0, 14.0, 4.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2773017883300781, -0.26773834228515625, -0.2581748962402344, -0.2486114501953125, -0.23904800415039062, -0.22948455810546875, -0.21992111206054688, -0.210357666015625, -0.20079421997070312, -0.19123077392578125, -0.18166732788085938, -0.1721038818359375, -0.16254043579101562, -0.15297698974609375, -0.14341354370117188, -0.13385009765625, -0.12428665161132812, -0.11472320556640625, -0.10515975952148438, -0.0955963134765625, -0.08603286743164062, -0.07646942138671875, -0.06690597534179688, -0.057342529296875, -0.047779083251953125, -0.03821563720703125, -0.028652191162109375, -0.0190887451171875, -0.009525299072265625, 3.814697265625e-05, 0.009601593017578125, 0.0191650390625, 0.028728485107421875, 0.03829193115234375, 0.047855377197265625, 0.0574188232421875, 0.06698226928710938, 0.07654571533203125, 0.08610916137695312, 0.095672607421875, 0.10523605346679688, 0.11479949951171875, 0.12436294555664062, 0.1339263916015625, 0.14348983764648438, 0.15305328369140625, 0.16261672973632812, 0.17218017578125, 0.18174362182617188, 0.19130706787109375, 0.20087051391601562, 0.2104339599609375, 0.21999740600585938, 0.22956085205078125, 0.23912429809570312, 0.248687744140625, 0.2582511901855469, 0.26781463623046875, 0.2773780822753906, 0.2869415283203125, 0.2965049743652344, 0.30606842041015625, 0.3156318664550781, 0.3251953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 25.0, 26.0, 53.0, 82.0, 100.0, 140.0, 183.0, 320.0, 514.0, 799.0, 1380.0, 2535.0, 5544.0, 14214.0, 47166.0, 210498.0, 534732.0, 166962.0, 39489.0, 12687.0, 5100.0, 2407.0, 1367.0, 763.0, 428.0, 310.0, 200.0, 142.0, 112.0, 66.0, 55.0, 25.0, 25.0, 19.0, 10.0, 12.0, 5.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0], "bins": [-0.11151123046875, -0.10853195190429688, -0.10555267333984375, -0.10257339477539062, -0.0995941162109375, -0.09661483764648438, -0.09363555908203125, -0.09065628051757812, -0.087677001953125, -0.08469772338867188, -0.08171844482421875, -0.07873916625976562, -0.0757598876953125, -0.07278060913085938, -0.06980133056640625, -0.06682205200195312, -0.0638427734375, -0.060863494873046875, -0.05788421630859375, -0.054904937744140625, -0.0519256591796875, -0.048946380615234375, -0.04596710205078125, -0.042987823486328125, -0.040008544921875, -0.037029266357421875, -0.03404998779296875, -0.031070709228515625, -0.0280914306640625, -0.025112152099609375, -0.02213287353515625, -0.019153594970703125, -0.01617431640625, -0.013195037841796875, -0.01021575927734375, -0.007236480712890625, -0.0042572021484375, -0.001277923583984375, 0.00170135498046875, 0.004680633544921875, 0.007659912109375, 0.010639190673828125, 0.01361846923828125, 0.016597747802734375, 0.0195770263671875, 0.022556304931640625, 0.02553558349609375, 0.028514862060546875, 0.031494140625, 0.034473419189453125, 0.03745269775390625, 0.040431976318359375, 0.0434112548828125, 0.046390533447265625, 0.04936981201171875, 0.052349090576171875, 0.055328369140625, 0.058307647705078125, 0.06128692626953125, 0.06426620483398438, 0.0672454833984375, 0.07022476196289062, 0.07320404052734375, 0.07618331909179688, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 7.0, 10.0, 19.0, 18.0, 27.0, 25.0, 28.0, 40.0, 36.0, 35.0, 37.0, 45.0, 59.0, 48.0, 53.0, 55.0, 52.0, 47.0, 51.0, 39.0, 39.0, 38.0, 31.0, 23.0, 18.0, 23.0, 10.0, 18.0, 8.0, 5.0, 10.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4663810729980469, -0.45058441162109375, -0.4347877502441406, -0.4189910888671875, -0.4031944274902344, -0.38739776611328125, -0.3716011047363281, -0.355804443359375, -0.3400077819824219, -0.32421112060546875, -0.3084144592285156, -0.2926177978515625, -0.2768211364746094, -0.26102447509765625, -0.24522781372070312, -0.22943115234375, -0.21363449096679688, -0.19783782958984375, -0.18204116821289062, -0.1662445068359375, -0.15044784545898438, -0.13465118408203125, -0.11885452270507812, -0.103057861328125, -0.08726119995117188, -0.07146453857421875, -0.055667877197265625, -0.0398712158203125, -0.024074554443359375, -0.00827789306640625, 0.007518768310546875, 0.0233154296875, 0.039112091064453125, 0.05490875244140625, 0.07070541381835938, 0.0865020751953125, 0.10229873657226562, 0.11809539794921875, 0.13389205932617188, 0.149688720703125, 0.16548538208007812, 0.18128204345703125, 0.19707870483398438, 0.2128753662109375, 0.22867202758789062, 0.24446868896484375, 0.2602653503417969, 0.27606201171875, 0.2918586730957031, 0.30765533447265625, 0.3234519958496094, 0.3392486572265625, 0.3550453186035156, 0.37084197998046875, 0.3866386413574219, 0.402435302734375, 0.4182319641113281, 0.43402862548828125, 0.4498252868652344, 0.4656219482421875, 0.4814186096191406, 0.49721527099609375, 0.5130119323730469, 0.52880859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 17.0, 17.0, 28.0, 44.0, 52.0, 101.0, 162.0, 258.0, 478.0, 998.0, 2073.0, 4651.0, 12838.0, 45234.0, 230089.0, 557710.0, 144950.0, 31728.0, 9828.0, 3766.0, 1625.0, 833.0, 425.0, 216.0, 155.0, 86.0, 53.0, 36.0, 28.0, 10.0, 12.0, 14.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03021240234375, -0.029249191284179688, -0.028285980224609375, -0.027322769165039062, -0.02635955810546875, -0.025396347045898438, -0.024433135986328125, -0.023469924926757812, -0.0225067138671875, -0.021543502807617188, -0.020580291748046875, -0.019617080688476562, -0.01865386962890625, -0.017690658569335938, -0.016727447509765625, -0.015764236450195312, -0.014801025390625, -0.013837814331054688, -0.012874603271484375, -0.011911392211914062, -0.01094818115234375, -0.009984970092773438, -0.009021759033203125, -0.008058547973632812, -0.0070953369140625, -0.0061321258544921875, -0.005168914794921875, -0.0042057037353515625, -0.00324249267578125, -0.0022792816162109375, -0.001316070556640625, -0.0003528594970703125, 0.0006103515625, 0.0015735626220703125, 0.002536773681640625, 0.0034999847412109375, 0.00446319580078125, 0.0054264068603515625, 0.006389617919921875, 0.0073528289794921875, 0.0083160400390625, 0.009279251098632812, 0.010242462158203125, 0.011205673217773438, 0.01216888427734375, 0.013132095336914062, 0.014095306396484375, 0.015058517456054688, 0.016021728515625, 0.016984939575195312, 0.017948150634765625, 0.018911361694335938, 0.01987457275390625, 0.020837783813476562, 0.021800994873046875, 0.022764205932617188, 0.0237274169921875, 0.024690628051757812, 0.025653839111328125, 0.026617050170898438, 0.02758026123046875, 0.028543472290039062, 0.029506683349609375, 0.030469894409179688, 0.03143310546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 1.0, 5.0, 8.0, 7.0, 22.0, 12.0, 32.0, 38.0, 49.0, 65.0, 94.0, 112.0, 110.0, 110.0, 71.0, 69.0, 52.0, 31.0, 30.0, 20.0, 18.0, 7.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4781951904296875e-05, -1.4241784811019897e-05, -1.370161771774292e-05, -1.3161450624465942e-05, -1.2621283531188965e-05, -1.2081116437911987e-05, -1.154094934463501e-05, -1.1000782251358032e-05, -1.0460615158081055e-05, -9.920448064804077e-06, -9.3802809715271e-06, -8.840113878250122e-06, -8.299946784973145e-06, -7.759779691696167e-06, -7.2196125984191895e-06, -6.679445505142212e-06, -6.139278411865234e-06, -5.599111318588257e-06, -5.058944225311279e-06, -4.518777132034302e-06, -3.978610038757324e-06, -3.4384429454803467e-06, -2.898275852203369e-06, -2.3581087589263916e-06, -1.817941665649414e-06, -1.2777745723724365e-06, -7.37607479095459e-07, -1.9744038581848145e-07, 3.427267074584961e-07, 8.828938007354736e-07, 1.4230608940124512e-06, 1.9632279872894287e-06, 2.5033950805664062e-06, 3.043562173843384e-06, 3.5837292671203613e-06, 4.123896360397339e-06, 4.664063453674316e-06, 5.204230546951294e-06, 5.7443976402282715e-06, 6.284564733505249e-06, 6.8247318267822266e-06, 7.364898920059204e-06, 7.905066013336182e-06, 8.44523310661316e-06, 8.985400199890137e-06, 9.525567293167114e-06, 1.0065734386444092e-05, 1.060590147972107e-05, 1.1146068572998047e-05, 1.1686235666275024e-05, 1.2226402759552002e-05, 1.276656985282898e-05, 1.3306736946105957e-05, 1.3846904039382935e-05, 1.4387071132659912e-05, 1.492723822593689e-05, 1.5467405319213867e-05, 1.6007572412490845e-05, 1.6547739505767822e-05, 1.70879065990448e-05, 1.7628073692321777e-05, 1.8168240785598755e-05, 1.8708407878875732e-05, 1.924857497215271e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 15.0, 18.0, 37.0, 46.0, 84.0, 121.0, 160.0, 287.0, 466.0, 766.0, 1242.0, 2375.0, 4582.0, 8882.0, 19570.0, 46646.0, 123927.0, 304241.0, 314509.0, 130991.0, 49634.0, 20278.0, 9289.0, 4528.0, 2439.0, 1314.0, 780.0, 463.0, 302.0, 182.0, 112.0, 74.0, 57.0, 42.0, 27.0, 19.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017547607421875, -0.016921520233154297, -0.016295433044433594, -0.01566934585571289, -0.015043258666992188, -0.014417171478271484, -0.013791084289550781, -0.013164997100830078, -0.012538909912109375, -0.011912822723388672, -0.011286735534667969, -0.010660648345947266, -0.010034561157226562, -0.00940847396850586, -0.008782386779785156, -0.008156299591064453, -0.00753021240234375, -0.006904125213623047, -0.006278038024902344, -0.005651950836181641, -0.0050258636474609375, -0.004399776458740234, -0.0037736892700195312, -0.003147602081298828, -0.002521514892578125, -0.0018954277038574219, -0.0012693405151367188, -0.0006432533264160156, -1.71661376953125e-05, 0.0006089210510253906, 0.0012350082397460938, 0.0018610954284667969, 0.0024871826171875, 0.003113269805908203, 0.0037393569946289062, 0.004365444183349609, 0.0049915313720703125, 0.005617618560791016, 0.006243705749511719, 0.006869792938232422, 0.007495880126953125, 0.008121967315673828, 0.008748054504394531, 0.009374141693115234, 0.010000228881835938, 0.01062631607055664, 0.011252403259277344, 0.011878490447998047, 0.01250457763671875, 0.013130664825439453, 0.013756752014160156, 0.01438283920288086, 0.015008926391601562, 0.015635013580322266, 0.01626110076904297, 0.016887187957763672, 0.017513275146484375, 0.018139362335205078, 0.01876544952392578, 0.019391536712646484, 0.020017623901367188, 0.02064371109008789, 0.021269798278808594, 0.021895885467529297, 0.02252197265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 18.0, 14.0, 20.0, 23.0, 31.0, 35.0, 40.0, 59.0, 54.0, 77.0, 79.0, 51.0, 69.0, 74.0, 52.0, 48.0, 51.0, 24.0, 38.0, 30.0, 24.0, 12.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00891876220703125, -0.008684635162353516, -0.008450508117675781, -0.008216381072998047, -0.007982254028320312, -0.007748126983642578, -0.007513999938964844, -0.007279872894287109, -0.007045745849609375, -0.006811618804931641, -0.006577491760253906, -0.006343364715576172, -0.0061092376708984375, -0.005875110626220703, -0.005640983581542969, -0.005406856536865234, -0.0051727294921875, -0.004938602447509766, -0.004704475402832031, -0.004470348358154297, -0.0042362213134765625, -0.004002094268798828, -0.0037679672241210938, -0.0035338401794433594, -0.003299713134765625, -0.0030655860900878906, -0.0028314590454101562, -0.002597332000732422, -0.0023632049560546875, -0.002129077911376953, -0.0018949508666992188, -0.0016608238220214844, -0.00142669677734375, -0.0011925697326660156, -0.0009584426879882812, -0.0007243156433105469, -0.0004901885986328125, -0.0002560615539550781, -2.193450927734375e-05, 0.00021219253540039062, 0.000446319580078125, 0.0006804466247558594, 0.0009145736694335938, 0.0011487007141113281, 0.0013828277587890625, 0.0016169548034667969, 0.0018510818481445312, 0.0020852088928222656, 0.0023193359375, 0.0025534629821777344, 0.0027875900268554688, 0.003021717071533203, 0.0032558441162109375, 0.003489971160888672, 0.0037240982055664062, 0.003958225250244141, 0.004192352294921875, 0.004426479339599609, 0.004660606384277344, 0.004894733428955078, 0.0051288604736328125, 0.005362987518310547, 0.005597114562988281, 0.005831241607666016, 0.00606536865234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 44.0, 51.0, 104.0, 159.0, 174.0, 157.0, 104.0, 61.0, 43.0, 19.0, 19.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.8640743494033813, -0.8442875146865845, -0.8245007395744324, -0.8047139048576355, -0.7849271297454834, -0.7651402950286865, -0.7453534603118896, -0.7255666255950928, -0.7057798504829407, -0.6859930157661438, -0.6662062406539917, -0.6464194059371948, -0.626632571220398, -0.6068457961082458, -0.587058961391449, -0.5672721862792969, -0.5474853515625, -0.5276985168457031, -0.507911741733551, -0.48812490701675415, -0.46833810210227966, -0.4485512971878052, -0.4287644624710083, -0.4089776575565338, -0.3891908526420593, -0.36940404772758484, -0.34961724281311035, -0.3298304080963135, -0.310043603181839, -0.2902567982673645, -0.2704699635505676, -0.25068315863609314, -0.23089641332626343, -0.21110960841178894, -0.19132278859615326, -0.17153596878051758, -0.1517491638660431, -0.1319623589515686, -0.11217553913593292, -0.09238871932029724, -0.07260191440582275, -0.05281510204076767, -0.033028289675712585, -0.013241477310657501, 0.006545335054397583, 0.026332147419452667, 0.04611895978450775, 0.06590577960014343, 0.08569258451461792, 0.105479396879673, 0.1252662092447281, 0.14505302906036377, 0.16483983397483826, 0.18462663888931274, 0.20441345870494843, 0.2242002785205841, 0.2439870834350586, 0.2637738883495331, 0.28356069326400757, 0.30334752798080444, 0.32313433289527893, 0.3429211378097534, 0.3627079725265503, 0.3824947774410248, 0.40228158235549927]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 10.0, 6.0, 3.0, 10.0, 7.0, 16.0, 11.0, 15.0, 15.0, 19.0, 27.0, 28.0, 35.0, 46.0, 42.0, 60.0, 53.0, 41.0, 50.0, 43.0, 62.0, 53.0, 57.0, 43.0, 48.0, 32.0, 43.0, 33.0, 22.0, 17.0, 12.0, 14.0, 8.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2526215612888336, -0.24417267739772797, -0.23572379350662231, -0.22727490961551666, -0.218826025724411, -0.21037714183330536, -0.2019282579421997, -0.19347938895225525, -0.1850304901599884, -0.17658160626888275, -0.1681327223777771, -0.15968383848667145, -0.1512349545955658, -0.14278607070446014, -0.1343371868133545, -0.12588831782341003, -0.11743943393230438, -0.10899055004119873, -0.10054166615009308, -0.09209278225898743, -0.08364389836788177, -0.07519501447677612, -0.06674613803625107, -0.058297254145145416, -0.049848370254039764, -0.04139948636293411, -0.03295060247182846, -0.024501722306013107, -0.016052838414907455, -0.007603954523801804, 0.0008449256420135498, 0.009293809533119202, 0.017742693424224854, 0.026191577315330505, 0.03464046120643616, 0.04308934137225151, 0.05153822526335716, 0.059987109154462814, 0.06843598932027817, 0.07688487321138382, 0.08533375710248947, 0.09378264099359512, 0.10223152488470078, 0.11068040132522583, 0.11912928521633148, 0.12757816910743713, 0.13602705299854279, 0.14447593688964844, 0.1529248207807541, 0.16137370467185974, 0.1698225885629654, 0.17827147245407104, 0.1867203563451767, 0.19516924023628235, 0.2036181092262268, 0.21206700801849365, 0.2205158770084381, 0.22896476089954376, 0.23741364479064941, 0.24586252868175507, 0.2543114125728607, 0.2627602815628052, 0.271209180355072, 0.2796580493450165, 0.2881069481372833]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 11.0, 18.0, 23.0, 28.0, 50.0, 69.0, 88.0, 118.0, 202.0, 273.0, 448.0, 699.0, 1246.0, 2173.0, 4392.0, 8942.0, 21255.0, 56364.0, 244036.0, 559658.0, 92269.0, 30941.0, 12612.0, 5724.0, 2887.0, 1552.0, 834.0, 548.0, 308.0, 229.0, 160.0, 107.0, 76.0, 50.0, 32.0, 26.0, 24.0, 23.0, 12.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.196044921875, -0.19031333923339844, -0.18458175659179688, -0.1788501739501953, -0.17311859130859375, -0.1673870086669922, -0.16165542602539062, -0.15592384338378906, -0.1501922607421875, -0.14446067810058594, -0.13872909545898438, -0.1329975128173828, -0.12726593017578125, -0.12153434753417969, -0.11580276489257812, -0.11007118225097656, -0.104339599609375, -0.09860801696777344, -0.09287643432617188, -0.08714485168457031, -0.08141326904296875, -0.07568168640136719, -0.06995010375976562, -0.06421852111816406, -0.0584869384765625, -0.05275535583496094, -0.047023773193359375, -0.04129219055175781, -0.03556060791015625, -0.029829025268554688, -0.024097442626953125, -0.018365859985351562, -0.01263427734375, -0.0069026947021484375, -0.001171112060546875, 0.0045604705810546875, 0.01029205322265625, 0.016023635864257812, 0.021755218505859375, 0.027486801147460938, 0.0332183837890625, 0.03894996643066406, 0.044681549072265625, 0.05041313171386719, 0.05614471435546875, 0.06187629699707031, 0.06760787963867188, 0.07333946228027344, 0.079071044921875, 0.08480262756347656, 0.09053421020507812, 0.09626579284667969, 0.10199737548828125, 0.10772895812988281, 0.11346054077148438, 0.11919212341308594, 0.1249237060546875, 0.13065528869628906, 0.13638687133789062, 0.1421184539794922, 0.14785003662109375, 0.1535816192626953, 0.15931320190429688, 0.16504478454589844, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 10.0, 18.0, 17.0, 18.0, 28.0, 34.0, 54.0, 50.0, 66.0, 47.0, 56.0, 66.0, 50.0, 58.0, 60.0, 63.0, 50.0, 29.0, 44.0, 24.0, 34.0, 18.0, 14.0, 13.0, 5.0, 6.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5216445922851562, -0.5027618408203125, -0.48387908935546875, -0.464996337890625, -0.44611358642578125, -0.4272308349609375, -0.40834808349609375, -0.38946533203125, -0.37058258056640625, -0.3516998291015625, -0.33281707763671875, -0.313934326171875, -0.29505157470703125, -0.2761688232421875, -0.25728607177734375, -0.2384033203125, -0.21952056884765625, -0.2006378173828125, -0.18175506591796875, -0.162872314453125, -0.14398956298828125, -0.1251068115234375, -0.10622406005859375, -0.08734130859375, -0.06845855712890625, -0.0495758056640625, -0.03069305419921875, -0.011810302734375, 0.00707244873046875, 0.0259552001953125, 0.04483795166015625, 0.063720703125, 0.08260345458984375, 0.1014862060546875, 0.12036895751953125, 0.139251708984375, 0.15813446044921875, 0.1770172119140625, 0.19589996337890625, 0.21478271484375, 0.23366546630859375, 0.2525482177734375, 0.27143096923828125, 0.290313720703125, 0.30919647216796875, 0.3280792236328125, 0.34696197509765625, 0.3658447265625, 0.38472747802734375, 0.4036102294921875, 0.42249298095703125, 0.441375732421875, 0.46025848388671875, 0.4791412353515625, 0.49802398681640625, 0.51690673828125, 0.5357894897460938, 0.5546722412109375, 0.5735549926757812, 0.592437744140625, 0.6113204956054688, 0.6302032470703125, 0.6490859985351562, 0.66796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 9.0, 8.0, 8.0, 12.0, 10.0, 22.0, 17.0, 20.0, 37.0, 49.0, 66.0, 80.0, 139.0, 404.0, 2014.0, 46598.0, 970749.0, 25869.0, 1553.0, 382.0, 140.0, 93.0, 49.0, 42.0, 34.0, 34.0, 15.0, 20.0, 24.0, 16.0, 8.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7824478149414062, -0.7597198486328125, -0.7369918823242188, -0.714263916015625, -0.6915359497070312, -0.6688079833984375, -0.6460800170898438, -0.62335205078125, -0.6006240844726562, -0.5778961181640625, -0.5551681518554688, -0.532440185546875, -0.5097122192382812, -0.4869842529296875, -0.46425628662109375, -0.4415283203125, -0.41880035400390625, -0.3960723876953125, -0.37334442138671875, -0.350616455078125, -0.32788848876953125, -0.3051605224609375, -0.28243255615234375, -0.25970458984375, -0.23697662353515625, -0.2142486572265625, -0.19152069091796875, -0.168792724609375, -0.14606475830078125, -0.1233367919921875, -0.10060882568359375, -0.077880859375, -0.05515289306640625, -0.0324249267578125, -0.00969696044921875, 0.013031005859375, 0.03575897216796875, 0.0584869384765625, 0.08121490478515625, 0.10394287109375, 0.12667083740234375, 0.1493988037109375, 0.17212677001953125, 0.194854736328125, 0.21758270263671875, 0.2403106689453125, 0.26303863525390625, 0.2857666015625, 0.30849456787109375, 0.3312225341796875, 0.35395050048828125, 0.376678466796875, 0.39940643310546875, 0.4221343994140625, 0.44486236572265625, 0.46759033203125, 0.49031829833984375, 0.5130462646484375, 0.5357742309570312, 0.558502197265625, 0.5812301635742188, 0.6039581298828125, 0.6266860961914062, 0.6494140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 13.0, 5.0, 10.0, 6.0, 15.0, 12.0, 14.0, 23.0, 28.0, 39.0, 34.0, 47.0, 45.0, 51.0, 64.0, 60.0, 53.0, 54.0, 57.0, 51.0, 44.0, 53.0, 39.0, 26.0, 22.0, 25.0, 19.0, 24.0, 13.0, 12.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.59356689453125, -0.5743408203125, -0.55511474609375, -0.535888671875, -0.51666259765625, -0.4974365234375, -0.47821044921875, -0.458984375, -0.43975830078125, -0.4205322265625, -0.40130615234375, -0.382080078125, -0.36285400390625, -0.3436279296875, -0.32440185546875, -0.30517578125, -0.28594970703125, -0.2667236328125, -0.24749755859375, -0.228271484375, -0.20904541015625, -0.1898193359375, -0.17059326171875, -0.1513671875, -0.13214111328125, -0.1129150390625, -0.09368896484375, -0.074462890625, -0.05523681640625, -0.0360107421875, -0.01678466796875, 0.00244140625, 0.02166748046875, 0.0408935546875, 0.06011962890625, 0.079345703125, 0.09857177734375, 0.1177978515625, 0.13702392578125, 0.15625, 0.17547607421875, 0.1947021484375, 0.21392822265625, 0.233154296875, 0.25238037109375, 0.2716064453125, 0.29083251953125, 0.31005859375, 0.32928466796875, 0.3485107421875, 0.36773681640625, 0.386962890625, 0.40618896484375, 0.4254150390625, 0.44464111328125, 0.4638671875, 0.48309326171875, 0.5023193359375, 0.52154541015625, 0.540771484375, 0.55999755859375, 0.5792236328125, 0.59844970703125, 0.61767578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 7.0, 8.0, 15.0, 25.0, 45.0, 99.0, 212.0, 552.0, 1684.0, 9674.0, 318866.0, 702227.0, 12258.0, 1840.0, 566.0, 261.0, 87.0, 58.0, 19.0, 21.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14550018310546875, -0.1389007568359375, -0.13230133056640625, -0.125701904296875, -0.11910247802734375, -0.1125030517578125, -0.10590362548828125, -0.09930419921875, -0.09270477294921875, -0.0861053466796875, -0.07950592041015625, -0.072906494140625, -0.06630706787109375, -0.0597076416015625, -0.05310821533203125, -0.0465087890625, -0.03990936279296875, -0.0333099365234375, -0.02671051025390625, -0.020111083984375, -0.01351165771484375, -0.0069122314453125, -0.00031280517578125, 0.00628662109375, 0.01288604736328125, 0.0194854736328125, 0.02608489990234375, 0.032684326171875, 0.03928375244140625, 0.0458831787109375, 0.05248260498046875, 0.05908203125, 0.06568145751953125, 0.0722808837890625, 0.07888031005859375, 0.085479736328125, 0.09207916259765625, 0.0986785888671875, 0.10527801513671875, 0.11187744140625, 0.11847686767578125, 0.1250762939453125, 0.13167572021484375, 0.138275146484375, 0.14487457275390625, 0.1514739990234375, 0.15807342529296875, 0.1646728515625, 0.17127227783203125, 0.1778717041015625, 0.18447113037109375, 0.191070556640625, 0.19766998291015625, 0.2042694091796875, 0.21086883544921875, 0.21746826171875, 0.22406768798828125, 0.2306671142578125, 0.23726654052734375, 0.243865966796875, 0.25046539306640625, 0.2570648193359375, 0.26366424560546875, 0.270263671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 2.0, 8.0, 15.0, 19.0, 20.0, 30.0, 41.0, 76.0, 212.0, 291.0, 98.0, 50.0, 41.0, 19.0, 16.0, 20.0, 14.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4497509002685547e-05, -2.3801811039447784e-05, -2.3106113076210022e-05, -2.241041511297226e-05, -2.1714717149734497e-05, -2.1019019186496735e-05, -2.0323321223258972e-05, -1.962762326002121e-05, -1.8931925296783447e-05, -1.8236227333545685e-05, -1.7540529370307922e-05, -1.684483140707016e-05, -1.6149133443832397e-05, -1.5453435480594635e-05, -1.4757737517356873e-05, -1.406203955411911e-05, -1.3366341590881348e-05, -1.2670643627643585e-05, -1.1974945664405823e-05, -1.127924770116806e-05, -1.0583549737930298e-05, -9.887851774692535e-06, -9.192153811454773e-06, -8.49645584821701e-06, -7.800757884979248e-06, -7.105059921741486e-06, -6.409361958503723e-06, -5.713663995265961e-06, -5.017966032028198e-06, -4.322268068790436e-06, -3.6265701055526733e-06, -2.930872142314911e-06, -2.2351741790771484e-06, -1.539476215839386e-06, -8.437782526016235e-07, -1.4808028936386108e-07, 5.476176738739014e-07, 1.2433156371116638e-06, 1.9390136003494263e-06, 2.6347115635871887e-06, 3.330409526824951e-06, 4.026107490062714e-06, 4.721805453300476e-06, 5.4175034165382385e-06, 6.113201379776001e-06, 6.8088993430137634e-06, 7.504597306251526e-06, 8.200295269489288e-06, 8.89599323272705e-06, 9.591691195964813e-06, 1.0287389159202576e-05, 1.0983087122440338e-05, 1.16787850856781e-05, 1.2374483048915863e-05, 1.3070181012153625e-05, 1.3765878975391388e-05, 1.446157693862915e-05, 1.5157274901866913e-05, 1.5852972865104675e-05, 1.6548670828342438e-05, 1.72443687915802e-05, 1.7940066754817963e-05, 1.8635764718055725e-05, 1.9331462681293488e-05, 2.002716064453125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 12.0, 18.0, 36.0, 42.0, 63.0, 72.0, 139.0, 195.0, 318.0, 559.0, 1172.0, 3501.0, 24299.0, 855156.0, 149600.0, 9192.0, 2107.0, 779.0, 470.0, 257.0, 179.0, 119.0, 77.0, 64.0, 43.0, 19.0, 18.0, 13.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.26708984375, -0.2606983184814453, -0.2543067932128906, -0.24791526794433594, -0.24152374267578125, -0.23513221740722656, -0.22874069213867188, -0.2223491668701172, -0.2159576416015625, -0.2095661163330078, -0.20317459106445312, -0.19678306579589844, -0.19039154052734375, -0.18400001525878906, -0.17760848999023438, -0.1712169647216797, -0.164825439453125, -0.1584339141845703, -0.15204238891601562, -0.14565086364746094, -0.13925933837890625, -0.13286781311035156, -0.12647628784179688, -0.12008476257324219, -0.1136932373046875, -0.10730171203613281, -0.10091018676757812, -0.09451866149902344, -0.08812713623046875, -0.08173561096191406, -0.07534408569335938, -0.06895256042480469, -0.06256103515625, -0.05616950988769531, -0.049777984619140625, -0.04338645935058594, -0.03699493408203125, -0.030603408813476562, -0.024211883544921875, -0.017820358276367188, -0.0114288330078125, -0.0050373077392578125, 0.001354217529296875, 0.0077457427978515625, 0.01413726806640625, 0.020528793334960938, 0.026920318603515625, 0.03331184387207031, 0.039703369140625, 0.04609489440917969, 0.052486419677734375, 0.05887794494628906, 0.06526947021484375, 0.07166099548339844, 0.07805252075195312, 0.08444404602050781, 0.0908355712890625, 0.09722709655761719, 0.10361862182617188, 0.11001014709472656, 0.11640167236328125, 0.12279319763183594, 0.12918472290039062, 0.1355762481689453, 0.1419677734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 48.0, 66.0, 114.0, 311.0, 107.0, 64.0, 47.0, 32.0, 28.0, 21.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0455322265625, -0.04398965835571289, -0.04244709014892578, -0.04090452194213867, -0.03936195373535156, -0.03781938552856445, -0.036276817321777344, -0.034734249114990234, -0.033191680908203125, -0.031649112701416016, -0.030106544494628906, -0.028563976287841797, -0.027021408081054688, -0.025478839874267578, -0.02393627166748047, -0.02239370346069336, -0.02085113525390625, -0.01930856704711914, -0.01776599884033203, -0.016223430633544922, -0.014680862426757812, -0.013138294219970703, -0.011595726013183594, -0.010053157806396484, -0.008510589599609375, -0.006968021392822266, -0.005425453186035156, -0.003882884979248047, -0.0023403167724609375, -0.0007977485656738281, 0.0007448196411132812, 0.0022873878479003906, 0.0038299560546875, 0.005372524261474609, 0.006915092468261719, 0.008457660675048828, 0.010000228881835938, 0.011542797088623047, 0.013085365295410156, 0.014627933502197266, 0.016170501708984375, 0.017713069915771484, 0.019255638122558594, 0.020798206329345703, 0.022340774536132812, 0.023883342742919922, 0.02542591094970703, 0.02696847915649414, 0.02851104736328125, 0.03005361557006836, 0.03159618377685547, 0.03313875198364258, 0.03468132019042969, 0.0362238883972168, 0.037766456604003906, 0.039309024810791016, 0.040851593017578125, 0.042394161224365234, 0.043936729431152344, 0.04547929763793945, 0.04702186584472656, 0.04856443405151367, 0.05010700225830078, 0.05164957046508789, 0.053192138671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 11.0, 19.0, 35.0, 85.0, 199.0, 253.0, 203.0, 92.0, 53.0, 25.0, 11.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.837075710296631, -2.7774691581726074, -2.717862606048584, -2.6582562923431396, -2.598649740219116, -2.5390431880950928, -2.4794368743896484, -2.419830322265625, -2.3602237701416016, -2.300617218017578, -2.2410106658935547, -2.1814043521881104, -2.121797800064087, -2.0621912479400635, -2.002584934234619, -1.9429783821105957, -1.8833718299865723, -1.8237652778625488, -1.764158844947815, -1.704552412033081, -1.6449458599090576, -1.5853393077850342, -1.5257328748703003, -1.4661264419555664, -1.406519889831543, -1.3469133377075195, -1.2873069047927856, -1.2277004718780518, -1.1680939197540283, -1.1084873676300049, -1.048880934715271, -0.9892744421958923, -0.9296679496765137, -0.870061457157135, -0.8104549646377563, -0.7508484721183777, -0.691241979598999, -0.6316354870796204, -0.5720289945602417, -0.512422502040863, -0.4528160095214844, -0.3932095170021057, -0.33360302448272705, -0.2739965319633484, -0.21439003944396973, -0.15478354692459106, -0.0951770544052124, -0.03557056188583374, 0.024035930633544922, 0.08364242315292358, 0.14324891567230225, 0.2028554081916809, 0.26246190071105957, 0.32206839323043823, 0.3816748857498169, 0.44128137826919556, 0.5008878707885742, 0.5604943633079529, 0.6201008558273315, 0.6797073483467102, 0.7393138408660889, 0.7989203333854675, 0.8585268259048462, 0.9181333184242249, 0.9777398109436035]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 6.0, 12.0, 13.0, 13.0, 30.0, 16.0, 18.0, 26.0, 30.0, 27.0, 35.0, 32.0, 28.0, 37.0, 41.0, 37.0, 48.0, 40.0, 42.0, 55.0, 45.0, 37.0, 31.0, 32.0, 34.0, 30.0, 21.0, 19.0, 23.0, 17.0, 21.0, 12.0, 9.0, 15.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7865099310874939, -0.7614437937736511, -0.7363776564598083, -0.7113115191459656, -0.6862453818321228, -0.66117924451828, -0.6361130475997925, -0.6110469102859497, -0.5859807729721069, -0.5609146356582642, -0.5358484983444214, -0.5107823610305786, -0.48571622371673584, -0.46065008640289307, -0.4355839192867279, -0.41051778197288513, -0.38545167446136475, -0.360385537147522, -0.3353193998336792, -0.3102532625198364, -0.28518712520599365, -0.2601209878921509, -0.23505482077598572, -0.20998868346214294, -0.18492254614830017, -0.1598564088344574, -0.13479027152061462, -0.10972411930561066, -0.08465798199176788, -0.05959184467792511, -0.03452569246292114, -0.00945955514907837, 0.01560664176940918, 0.04067278280854225, 0.06573892384767532, 0.0908050686120987, 0.11587120592594147, 0.14093734323978424, 0.1660034954547882, 0.19106963276863098, 0.21613577008247375, 0.24120190739631653, 0.2662680447101593, 0.29133421182632446, 0.31640034914016724, 0.34146648645401, 0.3665326237678528, 0.39159876108169556, 0.41666489839553833, 0.4417310357093811, 0.4667971730232239, 0.49186331033706665, 0.5169294476509094, 0.5419955849647522, 0.5670617818832397, 0.5921279191970825, 0.6171940565109253, 0.6422601938247681, 0.6673263311386108, 0.6923924684524536, 0.7174586057662964, 0.7425247430801392, 0.7675908803939819, 0.7926570177078247, 0.8177231550216675]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 5.0, 11.0, 22.0, 18.0, 27.0, 37.0, 55.0, 81.0, 117.0, 172.0, 257.0, 393.0, 598.0, 1036.0, 2005.0, 4166.0, 14365.0, 147184.0, 3508166.0, 478432.0, 25545.0, 5891.0, 2398.0, 1238.0, 743.0, 417.0, 270.0, 196.0, 122.0, 88.0, 68.0, 47.0, 19.0, 24.0, 10.0, 10.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.6587905883789062, -0.6349639892578125, -0.6111373901367188, -0.587310791015625, -0.5634841918945312, -0.5396575927734375, -0.5158309936523438, -0.49200439453125, -0.46817779541015625, -0.4443511962890625, -0.42052459716796875, -0.396697998046875, -0.37287139892578125, -0.3490447998046875, -0.32521820068359375, -0.3013916015625, -0.27756500244140625, -0.2537384033203125, -0.22991180419921875, -0.206085205078125, -0.18225860595703125, -0.1584320068359375, -0.13460540771484375, -0.11077880859375, -0.08695220947265625, -0.0631256103515625, -0.03929901123046875, -0.015472412109375, 0.00835418701171875, 0.0321807861328125, 0.05600738525390625, 0.079833984375, 0.10366058349609375, 0.1274871826171875, 0.15131378173828125, 0.175140380859375, 0.19896697998046875, 0.2227935791015625, 0.24662017822265625, 0.27044677734375, 0.29427337646484375, 0.3180999755859375, 0.34192657470703125, 0.365753173828125, 0.38957977294921875, 0.4134063720703125, 0.43723297119140625, 0.4610595703125, 0.48488616943359375, 0.5087127685546875, 0.5325393676757812, 0.556365966796875, 0.5801925659179688, 0.6040191650390625, 0.6278457641601562, 0.65167236328125, 0.6754989624023438, 0.6993255615234375, 0.7231521606445312, 0.746978759765625, 0.7708053588867188, 0.7946319580078125, 0.8184585571289062, 0.84228515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 11.0, 5.0, 3.0, 8.0, 6.0, 20.0, 22.0, 18.0, 36.0, 33.0, 36.0, 40.0, 42.0, 56.0, 53.0, 63.0, 65.0, 70.0, 74.0, 51.0, 53.0, 55.0, 37.0, 47.0, 25.0, 13.0, 18.0, 10.0, 8.0, 10.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3595390319824219, -0.34871673583984375, -0.3378944396972656, -0.3270721435546875, -0.3162498474121094, -0.30542755126953125, -0.2946052551269531, -0.283782958984375, -0.2729606628417969, -0.26213836669921875, -0.2513160705566406, -0.2404937744140625, -0.22967147827148438, -0.21884918212890625, -0.20802688598632812, -0.19720458984375, -0.18638229370117188, -0.17555999755859375, -0.16473770141601562, -0.1539154052734375, -0.14309310913085938, -0.13227081298828125, -0.12144851684570312, -0.110626220703125, -0.09980392456054688, -0.08898162841796875, -0.07815933227539062, -0.0673370361328125, -0.056514739990234375, -0.04569244384765625, -0.034870147705078125, -0.0240478515625, -0.013225555419921875, -0.00240325927734375, 0.008419036865234375, 0.0192413330078125, 0.030063629150390625, 0.04088592529296875, 0.051708221435546875, 0.062530517578125, 0.07335281372070312, 0.08417510986328125, 0.09499740600585938, 0.1058197021484375, 0.11664199829101562, 0.12746429443359375, 0.13828659057617188, 0.14910888671875, 0.15993118286132812, 0.17075347900390625, 0.18157577514648438, 0.1923980712890625, 0.20322036743164062, 0.21404266357421875, 0.22486495971679688, 0.235687255859375, 0.24650955200195312, 0.25733184814453125, 0.2681541442871094, 0.2789764404296875, 0.2897987365722656, 0.30062103271484375, 0.3114433288574219, 0.322265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 14.0, 21.0, 28.0, 28.0, 60.0, 116.0, 174.0, 354.0, 801.0, 2048.0, 6818.0, 41918.0, 3486077.0, 627117.0, 21514.0, 4472.0, 1479.0, 618.0, 235.0, 146.0, 84.0, 59.0, 23.0, 17.0, 11.0, 9.0, 12.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.076171875, -1.046966552734375, -1.01776123046875, -0.988555908203125, -0.9593505859375, -0.930145263671875, -0.90093994140625, -0.871734619140625, -0.842529296875, -0.813323974609375, -0.78411865234375, -0.754913330078125, -0.7257080078125, -0.696502685546875, -0.66729736328125, -0.638092041015625, -0.60888671875, -0.579681396484375, -0.55047607421875, -0.521270751953125, -0.4920654296875, -0.462860107421875, -0.43365478515625, -0.404449462890625, -0.375244140625, -0.346038818359375, -0.31683349609375, -0.287628173828125, -0.2584228515625, -0.229217529296875, -0.20001220703125, -0.170806884765625, -0.1416015625, -0.112396240234375, -0.08319091796875, -0.053985595703125, -0.0247802734375, 0.004425048828125, 0.03363037109375, 0.062835693359375, 0.092041015625, 0.121246337890625, 0.15045166015625, 0.179656982421875, 0.2088623046875, 0.238067626953125, 0.26727294921875, 0.296478271484375, 0.32568359375, 0.354888916015625, 0.38409423828125, 0.413299560546875, 0.4425048828125, 0.471710205078125, 0.50091552734375, 0.530120849609375, 0.559326171875, 0.588531494140625, 0.61773681640625, 0.646942138671875, 0.6761474609375, 0.705352783203125, 0.73455810546875, 0.763763427734375, 0.79296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 13.0, 13.0, 19.0, 21.0, 32.0, 62.0, 141.0, 290.0, 764.0, 1202.0, 791.0, 330.0, 155.0, 85.0, 39.0, 28.0, 35.0, 10.0, 9.0, 11.0, 1.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.1463298797607422, -0.13921737670898438, -0.13210487365722656, -0.12499237060546875, -0.11787986755371094, -0.11076736450195312, -0.10365486145019531, -0.0965423583984375, -0.08942985534667969, -0.08231735229492188, -0.07520484924316406, -0.06809234619140625, -0.06097984313964844, -0.053867340087890625, -0.04675483703613281, -0.039642333984375, -0.03252983093261719, -0.025417327880859375, -0.018304824829101562, -0.01119232177734375, -0.0040798187255859375, 0.003032684326171875, 0.010145187377929688, 0.0172576904296875, 0.024370193481445312, 0.031482696533203125, 0.03859519958496094, 0.04570770263671875, 0.05282020568847656, 0.059932708740234375, 0.06704521179199219, 0.07415771484375, 0.08127021789550781, 0.08838272094726562, 0.09549522399902344, 0.10260772705078125, 0.10972023010253906, 0.11683273315429688, 0.12394523620605469, 0.1310577392578125, 0.1381702423095703, 0.14528274536132812, 0.15239524841308594, 0.15950775146484375, 0.16662025451660156, 0.17373275756835938, 0.1808452606201172, 0.187957763671875, 0.1950702667236328, 0.20218276977539062, 0.20929527282714844, 0.21640777587890625, 0.22352027893066406, 0.23063278198242188, 0.2377452850341797, 0.2448577880859375, 0.2519702911376953, 0.2590827941894531, 0.26619529724121094, 0.27330780029296875, 0.28042030334472656, 0.2875328063964844, 0.2946453094482422, 0.3017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 12.0, 37.0, 76.0, 108.0, 170.0, 216.0, 152.0, 95.0, 48.0, 36.0, 14.0, 15.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3474003076553345, -1.3131623268127441, -1.2789243459701538, -1.2446863651275635, -1.2104483842849731, -1.1762104034423828, -1.1419724225997925, -1.1077344417572021, -1.0734963417053223, -1.039258360862732, -1.0050203800201416, -0.9707823991775513, -0.9365444183349609, -0.9023064374923706, -0.8680683970451355, -0.8338304162025452, -0.7995924949645996, -0.7653545141220093, -0.731116533279419, -0.6968785524368286, -0.6626405715942383, -0.628402590751648, -0.5941645503044128, -0.5599265694618225, -0.5256885886192322, -0.49145060777664185, -0.4572126269340515, -0.4229746162891388, -0.38873663544654846, -0.35449865460395813, -0.3202606439590454, -0.2860226631164551, -0.2517847418785095, -0.2175467610359192, -0.18330876529216766, -0.14907076954841614, -0.1148327887058258, -0.08059480786323547, -0.04635681211948395, -0.012118816375732422, 0.02211916446685791, 0.05635715276002884, 0.09059514105319977, 0.1248331293463707, 0.15907111763954163, 0.19330909848213196, 0.22754709422588348, 0.261785089969635, 0.29602307081222534, 0.3302610516548157, 0.364499032497406, 0.3987370431423187, 0.43297502398490906, 0.4672130048274994, 0.5014510154724121, 0.5356889963150024, 0.5699269771575928, 0.6041649580001831, 0.6384029388427734, 0.6726409196853638, 0.7068789005279541, 0.7411168813705444, 0.7753549218177795, 0.8095929026603699, 0.8438308835029602]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 12.0, 17.0, 12.0, 11.0, 26.0, 20.0, 22.0, 27.0, 26.0, 28.0, 33.0, 38.0, 44.0, 33.0, 43.0, 51.0, 39.0, 52.0, 44.0, 42.0, 51.0, 30.0, 32.0, 45.0, 45.0, 25.0, 20.0, 23.0, 21.0, 20.0, 14.0, 14.0, 5.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3229515254497528, -0.31225916743278503, -0.3015667796134949, -0.2908744215965271, -0.2801820635795593, -0.26948967576026917, -0.2587973177433014, -0.24810494482517242, -0.23741257190704346, -0.2267201989889145, -0.21602782607078552, -0.20533546805381775, -0.19464309513568878, -0.18395072221755981, -0.17325836420059204, -0.16256599128246307, -0.1518736183643341, -0.14118124544620514, -0.13048887252807617, -0.1197965145111084, -0.10910414159297943, -0.09841176867485046, -0.0877194032073021, -0.07702703773975372, -0.06633466482162476, -0.05564229562878609, -0.04494992643594742, -0.03425755724310875, -0.02356518805027008, -0.012872818857431412, -0.002180449664592743, 0.008511915802955627, 0.019204288721084595, 0.029896657913923264, 0.04058902710676193, 0.0512813962996006, 0.06197376549243927, 0.07266613841056824, 0.08335850387811661, 0.09405086934566498, 0.10474324226379395, 0.11543561518192291, 0.12612798810005188, 0.13682034611701965, 0.14751271903514862, 0.1582050919532776, 0.16889744997024536, 0.17958982288837433, 0.1902821958065033, 0.20097456872463226, 0.21166694164276123, 0.222359299659729, 0.23305167257785797, 0.24374404549598694, 0.2544364035129547, 0.2651287913322449, 0.27582114934921265, 0.2865135073661804, 0.2972058951854706, 0.30789825320243835, 0.3185906410217285, 0.3292829990386963, 0.33997535705566406, 0.35066771507263184, 0.361360102891922]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 9.0, 9.0, 19.0, 21.0, 25.0, 34.0, 57.0, 116.0, 186.0, 384.0, 750.0, 1617.0, 3582.0, 9799.0, 36458.0, 391295.0, 539358.0, 45711.0, 11466.0, 4125.0, 1749.0, 838.0, 388.0, 217.0, 139.0, 69.0, 39.0, 33.0, 19.0, 14.0, 9.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.25806427001953125, -0.2502593994140625, -0.24245452880859375, -0.234649658203125, -0.22684478759765625, -0.2190399169921875, -0.21123504638671875, -0.20343017578125, -0.19562530517578125, -0.1878204345703125, -0.18001556396484375, -0.172210693359375, -0.16440582275390625, -0.1566009521484375, -0.14879608154296875, -0.1409912109375, -0.13318634033203125, -0.1253814697265625, -0.11757659912109375, -0.109771728515625, -0.10196685791015625, -0.0941619873046875, -0.08635711669921875, -0.07855224609375, -0.07074737548828125, -0.0629425048828125, -0.05513763427734375, -0.047332763671875, -0.03952789306640625, -0.0317230224609375, -0.02391815185546875, -0.01611328125, -0.00830841064453125, -0.0005035400390625, 0.00730133056640625, 0.015106201171875, 0.02291107177734375, 0.0307159423828125, 0.03852081298828125, 0.04632568359375, 0.05413055419921875, 0.0619354248046875, 0.06974029541015625, 0.077545166015625, 0.08535003662109375, 0.0931549072265625, 0.10095977783203125, 0.1087646484375, 0.11656951904296875, 0.1243743896484375, 0.13217926025390625, 0.139984130859375, 0.14778900146484375, 0.1555938720703125, 0.16339874267578125, 0.17120361328125, 0.17900848388671875, 0.1868133544921875, 0.19461822509765625, 0.202423095703125, 0.21022796630859375, 0.2180328369140625, 0.22583770751953125, 0.233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 5.0, 12.0, 22.0, 18.0, 20.0, 20.0, 19.0, 31.0, 34.0, 39.0, 32.0, 46.0, 37.0, 42.0, 52.0, 41.0, 46.0, 53.0, 50.0, 31.0, 29.0, 45.0, 35.0, 39.0, 37.0, 15.0, 22.0, 23.0, 15.0, 17.0, 13.0, 15.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22100448608398438, -0.21361541748046875, -0.20622634887695312, -0.1988372802734375, -0.19144821166992188, -0.18405914306640625, -0.17667007446289062, -0.169281005859375, -0.16189193725585938, -0.15450286865234375, -0.14711380004882812, -0.1397247314453125, -0.13233566284179688, -0.12494659423828125, -0.11755752563476562, -0.11016845703125, -0.10277938842773438, -0.09539031982421875, -0.08800125122070312, -0.0806121826171875, -0.07322311401367188, -0.06583404541015625, -0.058444976806640625, -0.051055908203125, -0.043666839599609375, -0.03627777099609375, -0.028888702392578125, -0.0214996337890625, -0.014110565185546875, -0.00672149658203125, 0.000667572021484375, 0.008056640625, 0.015445709228515625, 0.02283477783203125, 0.030223846435546875, 0.0376129150390625, 0.045001983642578125, 0.05239105224609375, 0.059780120849609375, 0.067169189453125, 0.07455825805664062, 0.08194732666015625, 0.08933639526367188, 0.0967254638671875, 0.10411453247070312, 0.11150360107421875, 0.11889266967773438, 0.12628173828125, 0.13367080688476562, 0.14105987548828125, 0.14844894409179688, 0.1558380126953125, 0.16322708129882812, 0.17061614990234375, 0.17800521850585938, 0.185394287109375, 0.19278335571289062, 0.20017242431640625, 0.20756149291992188, 0.2149505615234375, 0.22233963012695312, 0.22972869873046875, 0.23711776733398438, 0.2445068359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 20.0, 28.0, 37.0, 68.0, 85.0, 120.0, 170.0, 279.0, 448.0, 691.0, 1181.0, 1945.0, 3568.0, 6779.0, 14572.0, 35874.0, 114657.0, 422093.0, 312213.0, 81087.0, 27549.0, 11791.0, 5752.0, 3030.0, 1722.0, 1043.0, 618.0, 391.0, 225.0, 150.0, 128.0, 75.0, 53.0, 30.0, 16.0, 14.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09893798828125, -0.09583282470703125, -0.0927276611328125, -0.08962249755859375, -0.086517333984375, -0.08341217041015625, -0.0803070068359375, -0.07720184326171875, -0.0740966796875, -0.07099151611328125, -0.0678863525390625, -0.06478118896484375, -0.061676025390625, -0.05857086181640625, -0.0554656982421875, -0.05236053466796875, -0.04925537109375, -0.04615020751953125, -0.0430450439453125, -0.03993988037109375, -0.036834716796875, -0.03372955322265625, -0.0306243896484375, -0.02751922607421875, -0.0244140625, -0.02130889892578125, -0.0182037353515625, -0.01509857177734375, -0.011993408203125, -0.00888824462890625, -0.0057830810546875, -0.00267791748046875, 0.00042724609375, 0.00353240966796875, 0.0066375732421875, 0.00974273681640625, 0.012847900390625, 0.01595306396484375, 0.0190582275390625, 0.02216339111328125, 0.0252685546875, 0.02837371826171875, 0.0314788818359375, 0.03458404541015625, 0.037689208984375, 0.04079437255859375, 0.0438995361328125, 0.04700469970703125, 0.05010986328125, 0.05321502685546875, 0.0563201904296875, 0.05942535400390625, 0.062530517578125, 0.06563568115234375, 0.0687408447265625, 0.07184600830078125, 0.074951171875, 0.07805633544921875, 0.0811614990234375, 0.08426666259765625, 0.087371826171875, 0.09047698974609375, 0.0935821533203125, 0.09668731689453125, 0.09979248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 5.0, 5.0, 13.0, 22.0, 14.0, 29.0, 25.0, 31.0, 25.0, 28.0, 41.0, 46.0, 59.0, 49.0, 62.0, 52.0, 55.0, 48.0, 55.0, 41.0, 34.0, 32.0, 32.0, 32.0, 37.0, 23.0, 12.0, 15.0, 9.0, 13.0, 9.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5111312866210938, -0.4944305419921875, -0.47772979736328125, -0.461029052734375, -0.44432830810546875, -0.4276275634765625, -0.41092681884765625, -0.39422607421875, -0.37752532958984375, -0.3608245849609375, -0.34412384033203125, -0.327423095703125, -0.31072235107421875, -0.2940216064453125, -0.27732086181640625, -0.2606201171875, -0.24391937255859375, -0.2272186279296875, -0.21051788330078125, -0.193817138671875, -0.17711639404296875, -0.1604156494140625, -0.14371490478515625, -0.12701416015625, -0.11031341552734375, -0.0936126708984375, -0.07691192626953125, -0.060211181640625, -0.04351043701171875, -0.0268096923828125, -0.01010894775390625, 0.006591796875, 0.02329254150390625, 0.0399932861328125, 0.05669403076171875, 0.073394775390625, 0.09009552001953125, 0.1067962646484375, 0.12349700927734375, 0.14019775390625, 0.15689849853515625, 0.1735992431640625, 0.19029998779296875, 0.207000732421875, 0.22370147705078125, 0.2404022216796875, 0.25710296630859375, 0.2738037109375, 0.29050445556640625, 0.3072052001953125, 0.32390594482421875, 0.340606689453125, 0.35730743408203125, 0.3740081787109375, 0.39070892333984375, 0.40740966796875, 0.42411041259765625, 0.4408111572265625, 0.45751190185546875, 0.474212646484375, 0.49091339111328125, 0.5076141357421875, 0.5243148803710938, 0.541015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 5.0, 12.0, 10.0, 25.0, 27.0, 75.0, 99.0, 182.0, 334.0, 607.0, 1370.0, 3362.0, 9684.0, 35866.0, 181399.0, 567005.0, 194186.0, 37909.0, 10132.0, 3474.0, 1347.0, 643.0, 345.0, 188.0, 100.0, 53.0, 42.0, 22.0, 19.0, 12.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.023247480392456055, -0.02237081527709961, -0.021494150161743164, -0.02061748504638672, -0.019740819931030273, -0.018864154815673828, -0.017987489700317383, -0.017110824584960938, -0.016234159469604492, -0.015357494354248047, -0.014480829238891602, -0.013604164123535156, -0.012727499008178711, -0.011850833892822266, -0.01097416877746582, -0.010097503662109375, -0.00922083854675293, -0.008344173431396484, -0.007467508316040039, -0.006590843200683594, -0.0057141780853271484, -0.004837512969970703, -0.003960847854614258, -0.0030841827392578125, -0.002207517623901367, -0.0013308525085449219, -0.00045418739318847656, 0.00042247772216796875, 0.001299142837524414, 0.0021758079528808594, 0.0030524730682373047, 0.00392913818359375, 0.004805803298950195, 0.005682468414306641, 0.006559133529663086, 0.007435798645019531, 0.008312463760375977, 0.009189128875732422, 0.010065793991088867, 0.010942459106445312, 0.011819124221801758, 0.012695789337158203, 0.013572454452514648, 0.014449119567871094, 0.015325784683227539, 0.016202449798583984, 0.01707911491394043, 0.017955780029296875, 0.01883244514465332, 0.019709110260009766, 0.02058577537536621, 0.021462440490722656, 0.0223391056060791, 0.023215770721435547, 0.024092435836791992, 0.024969100952148438, 0.025845766067504883, 0.026722431182861328, 0.027599096298217773, 0.02847576141357422, 0.029352426528930664, 0.03022909164428711, 0.031105756759643555, 0.031982421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 10.0, 9.0, 16.0, 11.0, 27.0, 29.0, 36.0, 61.0, 42.0, 83.0, 82.0, 107.0, 83.0, 84.0, 67.0, 66.0, 41.0, 38.0, 21.0, 22.0, 18.0, 6.0, 8.0, 3.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0398216545581818e-05, -1.0007992386817932e-05, -9.617768228054047e-06, -9.227544069290161e-06, -8.837319910526276e-06, -8.44709575176239e-06, -8.056871592998505e-06, -7.666647434234619e-06, -7.276423275470734e-06, -6.886199116706848e-06, -6.495974957942963e-06, -6.105750799179077e-06, -5.715526640415192e-06, -5.325302481651306e-06, -4.935078322887421e-06, -4.544854164123535e-06, -4.15463000535965e-06, -3.764405846595764e-06, -3.3741816878318787e-06, -2.983957529067993e-06, -2.5937333703041077e-06, -2.203509211540222e-06, -1.8132850527763367e-06, -1.4230608940124512e-06, -1.0328367352485657e-06, -6.426125764846802e-07, -2.523884177207947e-07, 1.3783574104309082e-07, 5.280598998069763e-07, 9.182840585708618e-07, 1.3085082173347473e-06, 1.6987323760986328e-06, 2.0889565348625183e-06, 2.479180693626404e-06, 2.8694048523902893e-06, 3.259629011154175e-06, 3.6498531699180603e-06, 4.040077328681946e-06, 4.430301487445831e-06, 4.820525646209717e-06, 5.210749804973602e-06, 5.600973963737488e-06, 5.991198122501373e-06, 6.381422281265259e-06, 6.771646440029144e-06, 7.16187059879303e-06, 7.552094757556915e-06, 7.9423189163208e-06, 8.332543075084686e-06, 8.722767233848572e-06, 9.112991392612457e-06, 9.503215551376343e-06, 9.893439710140228e-06, 1.0283663868904114e-05, 1.0673888027668e-05, 1.1064112186431885e-05, 1.145433634519577e-05, 1.1844560503959656e-05, 1.2234784662723541e-05, 1.2625008821487427e-05, 1.3015232980251312e-05, 1.3405457139015198e-05, 1.3795681297779083e-05, 1.4185905456542969e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 9.0, 19.0, 29.0, 38.0, 62.0, 78.0, 104.0, 197.0, 279.0, 495.0, 903.0, 1738.0, 3275.0, 7195.0, 16942.0, 45026.0, 129020.0, 318710.0, 319082.0, 128580.0, 45373.0, 16915.0, 7134.0, 3276.0, 1751.0, 878.0, 533.0, 297.0, 205.0, 120.0, 83.0, 57.0, 41.0, 20.0, 26.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204010009765625, -0.019763469696044922, -0.019125938415527344, -0.018488407135009766, -0.017850875854492188, -0.01721334457397461, -0.01657581329345703, -0.015938282012939453, -0.015300750732421875, -0.014663219451904297, -0.014025688171386719, -0.01338815689086914, -0.012750625610351562, -0.012113094329833984, -0.011475563049316406, -0.010838031768798828, -0.01020050048828125, -0.009562969207763672, -0.008925437927246094, -0.008287906646728516, -0.0076503753662109375, -0.007012844085693359, -0.006375312805175781, -0.005737781524658203, -0.005100250244140625, -0.004462718963623047, -0.0038251876831054688, -0.0031876564025878906, -0.0025501251220703125, -0.0019125938415527344, -0.0012750625610351562, -0.0006375312805175781, 0.0, 0.0006375312805175781, 0.0012750625610351562, 0.0019125938415527344, 0.0025501251220703125, 0.0031876564025878906, 0.0038251876831054688, 0.004462718963623047, 0.005100250244140625, 0.005737781524658203, 0.006375312805175781, 0.007012844085693359, 0.0076503753662109375, 0.008287906646728516, 0.008925437927246094, 0.009562969207763672, 0.01020050048828125, 0.010838031768798828, 0.011475563049316406, 0.012113094329833984, 0.012750625610351562, 0.01338815689086914, 0.014025688171386719, 0.014663219451904297, 0.015300750732421875, 0.015938282012939453, 0.01657581329345703, 0.01721334457397461, 0.017850875854492188, 0.018488407135009766, 0.019125938415527344, 0.019763469696044922, 0.0204010009765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 4.0, 7.0, 8.0, 12.0, 18.0, 13.0, 18.0, 23.0, 13.0, 29.0, 31.0, 42.0, 44.0, 39.0, 55.0, 47.0, 53.0, 60.0, 49.0, 59.0, 27.0, 56.0, 39.0, 38.0, 23.0, 24.0, 31.0, 18.0, 16.0, 23.0, 15.0, 15.0, 7.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005664825439453125, -0.005479335784912109, -0.005293846130371094, -0.005108356475830078, -0.0049228668212890625, -0.004737377166748047, -0.004551887512207031, -0.004366397857666016, -0.004180908203125, -0.003995418548583984, -0.0038099288940429688, -0.003624439239501953, -0.0034389495849609375, -0.003253459930419922, -0.0030679702758789062, -0.0028824806213378906, -0.002696990966796875, -0.0025115013122558594, -0.0023260116577148438, -0.002140522003173828, -0.0019550323486328125, -0.0017695426940917969, -0.0015840530395507812, -0.0013985633850097656, -0.00121307373046875, -0.0010275840759277344, -0.0008420944213867188, -0.0006566047668457031, -0.0004711151123046875, -0.0002856254577636719, -0.00010013580322265625, 8.535385131835938e-05, 0.000270843505859375, 0.0004563331604003906, 0.0006418228149414062, 0.0008273124694824219, 0.0010128021240234375, 0.0011982917785644531, 0.0013837814331054688, 0.0015692710876464844, 0.0017547607421875, 0.0019402503967285156, 0.0021257400512695312, 0.002311229705810547, 0.0024967193603515625, 0.002682209014892578, 0.0028676986694335938, 0.0030531883239746094, 0.003238677978515625, 0.0034241676330566406, 0.0036096572875976562, 0.003795146942138672, 0.0039806365966796875, 0.004166126251220703, 0.004351615905761719, 0.004537105560302734, 0.00472259521484375, 0.004908084869384766, 0.005093574523925781, 0.005279064178466797, 0.0054645538330078125, 0.005650043487548828, 0.005835533142089844, 0.006021022796630859, 0.006206512451171875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 8.0, 13.0, 29.0, 49.0, 80.0, 137.0, 202.0, 185.0, 124.0, 74.0, 37.0, 16.0, 19.0, 11.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7547540664672852, -0.7331125736236572, -0.7114710807800293, -0.6898295879364014, -0.6681880950927734, -0.6465466022491455, -0.6249051094055176, -0.6032635569572449, -0.5816220641136169, -0.559980571269989, -0.5383390784263611, -0.5166975855827332, -0.49505606293678284, -0.4734145700931549, -0.451773077249527, -0.43013155460357666, -0.4084900915622711, -0.3868485987186432, -0.36520710587501526, -0.34356558322906494, -0.321924090385437, -0.3002825975418091, -0.27864110469818115, -0.2569996118545532, -0.2353581041097641, -0.21371661126613617, -0.19207510352134705, -0.17043361067771912, -0.1487921178340912, -0.12715061008930206, -0.10550911724567413, -0.08386760950088501, -0.06222611665725708, -0.04058461636304855, -0.018943119794130325, 0.002698376774787903, 0.02433987706899643, 0.045981377363204956, 0.06762287020683289, 0.08926437795162201, 0.11090587079524994, 0.13254736363887787, 0.154188871383667, 0.17583036422729492, 0.19747185707092285, 0.21911336481571198, 0.2407548576593399, 0.26239636540412903, 0.28403785824775696, 0.3056793510913849, 0.3273208439350128, 0.34896236658096313, 0.37060385942459106, 0.392245352268219, 0.4138868451118469, 0.43552833795547485, 0.4571698307991028, 0.4788113236427307, 0.5004528164863586, 0.5220943093299866, 0.5437358021736145, 0.5653773546218872, 0.5870188474655151, 0.6086603403091431, 0.630301833152771]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 13.0, 13.0, 10.0, 13.0, 16.0, 23.0, 20.0, 26.0, 21.0, 28.0, 41.0, 39.0, 40.0, 36.0, 38.0, 48.0, 36.0, 49.0, 45.0, 56.0, 44.0, 32.0, 43.0, 37.0, 47.0, 24.0, 20.0, 31.0, 21.0, 21.0, 14.0, 15.0, 8.0, 6.0, 5.0, 2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22479639947414398, -0.21756847202777863, -0.21034054458141327, -0.2031126171350479, -0.19588468968868256, -0.1886567622423172, -0.18142881989479065, -0.1742008924484253, -0.16697296500205994, -0.15974503755569458, -0.15251711010932922, -0.14528918266296387, -0.1380612552165985, -0.13083332777023315, -0.1236053928732872, -0.11637746542692184, -0.10914954543113708, -0.10192161798477173, -0.09469369053840637, -0.08746576309204102, -0.08023783564567566, -0.0730099081993103, -0.06578197330236435, -0.05855404585599899, -0.051326118409633636, -0.04409819096326828, -0.036870263516902924, -0.02964233234524727, -0.022414404898881912, -0.015186477452516556, -0.007958546280860901, -0.0007306188344955444, 0.006497308611869812, 0.013725236989557743, 0.020953165367245674, 0.02818109467625618, 0.035409022122621536, 0.04263694956898689, 0.04986488074064255, 0.057092808187007904, 0.06432073563337326, 0.07154866307973862, 0.07877659052610397, 0.08600452542304993, 0.09323245286941528, 0.10046038031578064, 0.107688307762146, 0.11491623520851135, 0.12214416265487671, 0.12937209010124207, 0.13660001754760742, 0.14382794499397278, 0.15105587244033813, 0.1582837998867035, 0.16551172733306885, 0.1727396547794342, 0.17996758222579956, 0.18719550967216492, 0.19442343711853027, 0.20165136456489563, 0.208879292011261, 0.21610721945762634, 0.2233351469039917, 0.23056307435035706, 0.2377910166978836]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 18.0, 8.0, 20.0, 31.0, 31.0, 45.0, 80.0, 112.0, 152.0, 240.0, 400.0, 767.0, 1277.0, 2590.0, 7216.0, 26726.0, 163875.0, 704753.0, 109247.0, 19914.0, 5934.0, 2303.0, 1104.0, 628.0, 356.0, 244.0, 157.0, 96.0, 50.0, 48.0, 35.0, 27.0, 19.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29833984375, -0.28745269775390625, -0.2765655517578125, -0.26567840576171875, -0.254791259765625, -0.24390411376953125, -0.2330169677734375, -0.22212982177734375, -0.21124267578125, -0.20035552978515625, -0.1894683837890625, -0.17858123779296875, -0.167694091796875, -0.15680694580078125, -0.1459197998046875, -0.13503265380859375, -0.1241455078125, -0.11325836181640625, -0.1023712158203125, -0.09148406982421875, -0.080596923828125, -0.06970977783203125, -0.0588226318359375, -0.04793548583984375, -0.03704833984375, -0.02616119384765625, -0.0152740478515625, -0.00438690185546875, 0.006500244140625, 0.01738739013671875, 0.0282745361328125, 0.03916168212890625, 0.050048828125, 0.06093597412109375, 0.0718231201171875, 0.08271026611328125, 0.093597412109375, 0.10448455810546875, 0.1153717041015625, 0.12625885009765625, 0.13714599609375, 0.14803314208984375, 0.1589202880859375, 0.16980743408203125, 0.180694580078125, 0.19158172607421875, 0.2024688720703125, 0.21335601806640625, 0.2242431640625, 0.23513031005859375, 0.2460174560546875, 0.25690460205078125, 0.267791748046875, 0.27867889404296875, 0.2895660400390625, 0.30045318603515625, 0.31134033203125, 0.32222747802734375, 0.3331146240234375, 0.34400177001953125, 0.354888916015625, 0.36577606201171875, 0.3766632080078125, 0.38755035400390625, 0.3984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 10.0, 14.0, 9.0, 16.0, 12.0, 29.0, 20.0, 38.0, 33.0, 52.0, 38.0, 50.0, 53.0, 51.0, 53.0, 40.0, 47.0, 58.0, 56.0, 48.0, 43.0, 37.0, 26.0, 35.0, 26.0, 21.0, 14.0, 17.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43991851806640625, -0.4242706298828125, -0.40862274169921875, -0.392974853515625, -0.37732696533203125, -0.3616790771484375, -0.34603118896484375, -0.33038330078125, -0.31473541259765625, -0.2990875244140625, -0.28343963623046875, -0.267791748046875, -0.25214385986328125, -0.2364959716796875, -0.22084808349609375, -0.2052001953125, -0.18955230712890625, -0.1739044189453125, -0.15825653076171875, -0.142608642578125, -0.12696075439453125, -0.1113128662109375, -0.09566497802734375, -0.08001708984375, -0.06436920166015625, -0.0487213134765625, -0.03307342529296875, -0.017425537109375, -0.00177764892578125, 0.0138702392578125, 0.02951812744140625, 0.045166015625, 0.06081390380859375, 0.0764617919921875, 0.09210968017578125, 0.107757568359375, 0.12340545654296875, 0.1390533447265625, 0.15470123291015625, 0.17034912109375, 0.18599700927734375, 0.2016448974609375, 0.21729278564453125, 0.232940673828125, 0.24858856201171875, 0.2642364501953125, 0.27988433837890625, 0.2955322265625, 0.31118011474609375, 0.3268280029296875, 0.34247589111328125, 0.358123779296875, 0.37377166748046875, 0.3894195556640625, 0.40506744384765625, 0.42071533203125, 0.43636322021484375, 0.4520111083984375, 0.46765899658203125, 0.483306884765625, 0.49895477294921875, 0.5146026611328125, 0.5302505493164062, 0.5458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 6.0, 15.0, 9.0, 11.0, 17.0, 29.0, 30.0, 43.0, 50.0, 112.0, 236.0, 646.0, 3289.0, 110254.0, 923446.0, 8400.0, 1210.0, 341.0, 138.0, 72.0, 39.0, 33.0, 26.0, 28.0, 13.0, 14.0, 9.0, 8.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3251953125, -1.2895736694335938, -1.2539520263671875, -1.2183303833007812, -1.182708740234375, -1.1470870971679688, -1.1114654541015625, -1.0758438110351562, -1.04022216796875, -1.0046005249023438, -0.9689788818359375, -0.9333572387695312, -0.897735595703125, -0.8621139526367188, -0.8264923095703125, -0.7908706665039062, -0.7552490234375, -0.7196273803710938, -0.6840057373046875, -0.6483840942382812, -0.612762451171875, -0.5771408081054688, -0.5415191650390625, -0.5058975219726562, -0.47027587890625, -0.43465423583984375, -0.3990325927734375, -0.36341094970703125, -0.327789306640625, -0.29216766357421875, -0.2565460205078125, -0.22092437744140625, -0.185302734375, -0.14968109130859375, -0.1140594482421875, -0.07843780517578125, -0.042816162109375, -0.00719451904296875, 0.0284271240234375, 0.06404876708984375, 0.09967041015625, 0.13529205322265625, 0.1709136962890625, 0.20653533935546875, 0.242156982421875, 0.27777862548828125, 0.3134002685546875, 0.34902191162109375, 0.3846435546875, 0.42026519775390625, 0.4558868408203125, 0.49150848388671875, 0.527130126953125, 0.5627517700195312, 0.5983734130859375, 0.6339950561523438, 0.66961669921875, 0.7052383422851562, 0.7408599853515625, 0.7764816284179688, 0.812103271484375, 0.8477249145507812, 0.8833465576171875, 0.9189682006835938, 0.95458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 30.0, 31.0, 35.0, 30.0, 56.0, 54.0, 42.0, 52.0, 58.0, 63.0, 68.0, 63.0, 61.0, 55.0, 43.0, 24.0, 30.0, 27.0, 26.0, 18.0, 12.0, 11.0, 10.0, 11.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73046875, -0.7108688354492188, -0.6912689208984375, -0.6716690063476562, -0.652069091796875, -0.6324691772460938, -0.6128692626953125, -0.5932693481445312, -0.57366943359375, -0.5540695190429688, -0.5344696044921875, -0.5148696899414062, -0.495269775390625, -0.47566986083984375, -0.4560699462890625, -0.43647003173828125, -0.4168701171875, -0.39727020263671875, -0.3776702880859375, -0.35807037353515625, -0.338470458984375, -0.31887054443359375, -0.2992706298828125, -0.27967071533203125, -0.26007080078125, -0.24047088623046875, -0.2208709716796875, -0.20127105712890625, -0.181671142578125, -0.16207122802734375, -0.1424713134765625, -0.12287139892578125, -0.103271484375, -0.08367156982421875, -0.0640716552734375, -0.04447174072265625, -0.024871826171875, -0.00527191162109375, 0.0143280029296875, 0.03392791748046875, 0.05352783203125, 0.07312774658203125, 0.0927276611328125, 0.11232757568359375, 0.131927490234375, 0.15152740478515625, 0.1711273193359375, 0.19072723388671875, 0.2103271484375, 0.22992706298828125, 0.2495269775390625, 0.26912689208984375, 0.288726806640625, 0.30832672119140625, 0.3279266357421875, 0.34752655029296875, 0.36712646484375, 0.38672637939453125, 0.4063262939453125, 0.42592620849609375, 0.445526123046875, 0.46512603759765625, 0.4847259521484375, 0.5043258666992188, 0.52392578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 23.0, 21.0, 46.0, 63.0, 100.0, 177.0, 366.0, 776.0, 2459.0, 9830.0, 60643.0, 791727.0, 158488.0, 17575.0, 3980.0, 1181.0, 472.0, 204.0, 117.0, 71.0, 47.0, 29.0, 25.0, 14.0, 19.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1466064453125, -0.14225387573242188, -0.13790130615234375, -0.13354873657226562, -0.1291961669921875, -0.12484359741210938, -0.12049102783203125, -0.11613845825195312, -0.111785888671875, -0.10743331909179688, -0.10308074951171875, -0.09872817993164062, -0.0943756103515625, -0.09002304077148438, -0.08567047119140625, -0.08131790161132812, -0.07696533203125, -0.07261276245117188, -0.06826019287109375, -0.06390762329101562, -0.0595550537109375, -0.055202484130859375, -0.05084991455078125, -0.046497344970703125, -0.042144775390625, -0.037792205810546875, -0.03343963623046875, -0.029087066650390625, -0.0247344970703125, -0.020381927490234375, -0.01602935791015625, -0.011676788330078125, -0.00732421875, -0.002971649169921875, 0.00138092041015625, 0.005733489990234375, 0.0100860595703125, 0.014438629150390625, 0.01879119873046875, 0.023143768310546875, 0.027496337890625, 0.031848907470703125, 0.03620147705078125, 0.040554046630859375, 0.0449066162109375, 0.049259185791015625, 0.05361175537109375, 0.057964324951171875, 0.06231689453125, 0.06666946411132812, 0.07102203369140625, 0.07537460327148438, 0.0797271728515625, 0.08407974243164062, 0.08843231201171875, 0.09278488159179688, 0.097137451171875, 0.10149002075195312, 0.10584259033203125, 0.11019515991210938, 0.1145477294921875, 0.11890029907226562, 0.12325286865234375, 0.12760543823242188, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 10.0, 12.0, 23.0, 31.0, 41.0, 54.0, 72.0, 127.0, 144.0, 127.0, 100.0, 68.0, 46.0, 35.0, 23.0, 15.0, 18.0, 7.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7202459275722504e-05, -1.66427344083786e-05, -1.60830095410347e-05, -1.5523284673690796e-05, -1.4963559806346893e-05, -1.440383493900299e-05, -1.3844110071659088e-05, -1.3284385204315186e-05, -1.2724660336971283e-05, -1.216493546962738e-05, -1.1605210602283478e-05, -1.1045485734939575e-05, -1.0485760867595673e-05, -9.92603600025177e-06, -9.366311132907867e-06, -8.806586265563965e-06, -8.246861398220062e-06, -7.68713653087616e-06, -7.127411663532257e-06, -6.5676867961883545e-06, -6.007961928844452e-06, -5.448237061500549e-06, -4.888512194156647e-06, -4.328787326812744e-06, -3.7690624594688416e-06, -3.209337592124939e-06, -2.6496127247810364e-06, -2.089887857437134e-06, -1.5301629900932312e-06, -9.704381227493286e-07, -4.10713255405426e-07, 1.4901161193847656e-07, 7.087364792823792e-07, 1.2684613466262817e-06, 1.8281862139701843e-06, 2.387911081314087e-06, 2.9476359486579895e-06, 3.507360816001892e-06, 4.067085683345795e-06, 4.626810550689697e-06, 5.1865354180336e-06, 5.7462602853775024e-06, 6.305985152721405e-06, 6.865710020065308e-06, 7.42543488740921e-06, 7.985159754753113e-06, 8.544884622097015e-06, 9.104609489440918e-06, 9.66433435678482e-06, 1.0224059224128723e-05, 1.0783784091472626e-05, 1.1343508958816528e-05, 1.1903233826160431e-05, 1.2462958693504333e-05, 1.3022683560848236e-05, 1.3582408428192139e-05, 1.4142133295536041e-05, 1.4701858162879944e-05, 1.5261583030223846e-05, 1.582130789756775e-05, 1.638103276491165e-05, 1.6940757632255554e-05, 1.7500482499599457e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 16.0, 27.0, 44.0, 47.0, 63.0, 114.0, 168.0, 267.0, 492.0, 1093.0, 3180.0, 16029.0, 311102.0, 684747.0, 24267.0, 4068.0, 1328.0, 590.0, 329.0, 219.0, 134.0, 78.0, 58.0, 34.0, 12.0, 12.0, 4.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.224609375, -0.21871376037597656, -0.21281814575195312, -0.2069225311279297, -0.20102691650390625, -0.1951313018798828, -0.18923568725585938, -0.18334007263183594, -0.1774444580078125, -0.17154884338378906, -0.16565322875976562, -0.1597576141357422, -0.15386199951171875, -0.1479663848876953, -0.14207077026367188, -0.13617515563964844, -0.130279541015625, -0.12438392639160156, -0.11848831176757812, -0.11259269714355469, -0.10669708251953125, -0.10080146789550781, -0.09490585327148438, -0.08901023864746094, -0.0831146240234375, -0.07721900939941406, -0.07132339477539062, -0.06542778015136719, -0.05953216552734375, -0.05363655090332031, -0.047740936279296875, -0.04184532165527344, -0.03594970703125, -0.030054092407226562, -0.024158477783203125, -0.018262863159179688, -0.01236724853515625, -0.0064716339111328125, -0.000576019287109375, 0.0053195953369140625, 0.0112152099609375, 0.017110824584960938, 0.023006439208984375, 0.028902053833007812, 0.03479766845703125, 0.04069328308105469, 0.046588897705078125, 0.05248451232910156, 0.058380126953125, 0.06427574157714844, 0.07017135620117188, 0.07606697082519531, 0.08196258544921875, 0.08785820007324219, 0.09375381469726562, 0.09964942932128906, 0.1055450439453125, 0.11144065856933594, 0.11733627319335938, 0.12323188781738281, 0.12912750244140625, 0.1350231170654297, 0.14091873168945312, 0.14681434631347656, 0.1527099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 17.0, 19.0, 16.0, 22.0, 53.0, 72.0, 121.0, 192.0, 161.0, 110.0, 67.0, 51.0, 24.0, 19.0, 13.0, 16.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.051023006439208984, -0.04897594451904297, -0.04692888259887695, -0.04488182067871094, -0.04283475875854492, -0.040787696838378906, -0.03874063491821289, -0.036693572998046875, -0.03464651107788086, -0.032599449157714844, -0.030552387237548828, -0.028505325317382812, -0.026458263397216797, -0.02441120147705078, -0.022364139556884766, -0.02031707763671875, -0.018270015716552734, -0.01622295379638672, -0.014175891876220703, -0.012128829956054688, -0.010081768035888672, -0.008034706115722656, -0.005987644195556641, -0.003940582275390625, -0.0018935203552246094, 0.00015354156494140625, 0.002200603485107422, 0.0042476654052734375, 0.006294727325439453, 0.008341789245605469, 0.010388851165771484, 0.0124359130859375, 0.014482975006103516, 0.01653003692626953, 0.018577098846435547, 0.020624160766601562, 0.022671222686767578, 0.024718284606933594, 0.02676534652709961, 0.028812408447265625, 0.03085947036743164, 0.032906532287597656, 0.03495359420776367, 0.03700065612792969, 0.0390477180480957, 0.04109477996826172, 0.043141841888427734, 0.04518890380859375, 0.047235965728759766, 0.04928302764892578, 0.0513300895690918, 0.05337715148925781, 0.05542421340942383, 0.057471275329589844, 0.05951833724975586, 0.061565399169921875, 0.06361246109008789, 0.0656595230102539, 0.06770658493041992, 0.06975364685058594, 0.07180070877075195, 0.07384777069091797, 0.07589483261108398, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 14.0, 28.0, 24.0, 63.0, 90.0, 151.0, 158.0, 169.0, 114.0, 77.0, 36.0, 28.0, 15.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4249154329299927, -1.3880575895309448, -1.351199746131897, -1.3143419027328491, -1.2774841785430908, -1.240626335144043, -1.2037684917449951, -1.1669106483459473, -1.1300528049468994, -1.0931949615478516, -1.0563371181488037, -1.0194792747497559, -0.9826214909553528, -0.9457636475563049, -0.9089058637619019, -0.872048020362854, -0.8351901769638062, -0.7983323335647583, -0.7614744901657104, -0.7246167063713074, -0.6877588629722595, -0.6509010195732117, -0.6140432357788086, -0.5771853923797607, -0.5403275489807129, -0.503469705581665, -0.4666118919849396, -0.4297540783882141, -0.39289623498916626, -0.3560383915901184, -0.31918057799339294, -0.2823227643966675, -0.24546504020690918, -0.20860721170902252, -0.17174938321113586, -0.1348915547132492, -0.09803372621536255, -0.06117589771747589, -0.024318069219589233, 0.01253974437713623, 0.04939758777618408, 0.08625541627407074, 0.1231132447719574, 0.15997107326984406, 0.1968289017677307, 0.23368673026561737, 0.27054455876350403, 0.3074023723602295, 0.34426021575927734, 0.3811180591583252, 0.41797587275505066, 0.4548336863517761, 0.491691529750824, 0.5285493731498718, 0.5654071569442749, 0.6022650003433228, 0.6391228437423706, 0.6759806871414185, 0.7128385305404663, 0.7496963143348694, 0.7865541577339172, 0.8234120011329651, 0.8602697849273682, 0.897127628326416, 0.9339854717254639]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 13.0, 20.0, 12.0, 15.0, 13.0, 14.0, 21.0, 35.0, 37.0, 23.0, 30.0, 29.0, 38.0, 39.0, 41.0, 41.0, 42.0, 36.0, 36.0, 43.0, 34.0, 35.0, 44.0, 37.0, 30.0, 26.0, 32.0, 33.0, 19.0, 13.0, 18.0, 15.0, 21.0, 6.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8621527552604675, -0.8366901874542236, -0.8112276196479797, -0.7857650518417358, -0.7603024840354919, -0.734839916229248, -0.7093773484230042, -0.6839147806167603, -0.6584522128105164, -0.6329896450042725, -0.6075270771980286, -0.5820645093917847, -0.5566019415855408, -0.5311393737792969, -0.505676805973053, -0.4802142381668091, -0.4547517001628876, -0.4292891323566437, -0.4038265645503998, -0.3783639967441559, -0.352901428937912, -0.3274388909339905, -0.3019763231277466, -0.2765137553215027, -0.2510511875152588, -0.2255886197090149, -0.200126051902771, -0.1746634840965271, -0.1492009162902832, -0.1237383633852005, -0.0982757955789566, -0.07281322777271271, -0.04735064506530762, -0.02188807912170887, 0.0035744868218898773, 0.029037050902843475, 0.05449961870908737, 0.07996217906475067, 0.10542474687099457, 0.13088731467723846, 0.15634988248348236, 0.18181245028972626, 0.20727501809597015, 0.23273757100105286, 0.25820013880729675, 0.28366270661354065, 0.30912527441978455, 0.33458784222602844, 0.36005041003227234, 0.38551297783851624, 0.41097554564476013, 0.43643811345100403, 0.4619006812572479, 0.48736321926116943, 0.5128257870674133, 0.5382883548736572, 0.5637509226799011, 0.589213490486145, 0.6146760582923889, 0.6401386260986328, 0.6656011939048767, 0.6910637617111206, 0.7165263295173645, 0.7419888973236084, 0.7674514651298523]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 3.0, 5.0, 8.0, 8.0, 13.0, 23.0, 35.0, 34.0, 42.0, 85.0, 127.0, 216.0, 316.0, 538.0, 1035.0, 2078.0, 5484.0, 34678.0, 1549681.0, 2533678.0, 53223.0, 7802.0, 2492.0, 1086.0, 581.0, 345.0, 229.0, 131.0, 93.0, 61.0, 49.0, 22.0, 24.0, 13.0, 11.0, 10.0, 11.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.890625, -0.8666000366210938, -0.8425750732421875, -0.8185501098632812, -0.794525146484375, -0.7705001831054688, -0.7464752197265625, -0.7224502563476562, -0.69842529296875, -0.6744003295898438, -0.6503753662109375, -0.6263504028320312, -0.602325439453125, -0.5783004760742188, -0.5542755126953125, -0.5302505493164062, -0.5062255859375, -0.48220062255859375, -0.4581756591796875, -0.43415069580078125, -0.410125732421875, -0.38610076904296875, -0.3620758056640625, -0.33805084228515625, -0.31402587890625, -0.29000091552734375, -0.2659759521484375, -0.24195098876953125, -0.217926025390625, -0.19390106201171875, -0.1698760986328125, -0.14585113525390625, -0.121826171875, -0.09780120849609375, -0.0737762451171875, -0.04975128173828125, -0.025726318359375, -0.00170135498046875, 0.0223236083984375, 0.04634857177734375, 0.07037353515625, 0.09439849853515625, 0.1184234619140625, 0.14244842529296875, 0.166473388671875, 0.19049835205078125, 0.2145233154296875, 0.23854827880859375, 0.2625732421875, 0.28659820556640625, 0.3106231689453125, 0.33464813232421875, 0.358673095703125, 0.38269805908203125, 0.4067230224609375, 0.43074798583984375, 0.45477294921875, 0.47879791259765625, 0.5028228759765625, 0.5268478393554688, 0.550872802734375, 0.5748977661132812, 0.5989227294921875, 0.6229476928710938, 0.64697265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 11.0, 14.0, 18.0, 18.0, 27.0, 17.0, 26.0, 35.0, 43.0, 41.0, 46.0, 35.0, 64.0, 69.0, 60.0, 53.0, 51.0, 66.0, 34.0, 50.0, 33.0, 33.0, 28.0, 28.0, 21.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.413330078125, -0.4033489227294922, -0.3933677673339844, -0.38338661193847656, -0.37340545654296875, -0.36342430114746094, -0.3534431457519531, -0.3434619903564453, -0.3334808349609375, -0.3234996795654297, -0.3135185241699219, -0.30353736877441406, -0.29355621337890625, -0.28357505798339844, -0.2735939025878906, -0.2636127471923828, -0.253631591796875, -0.2436504364013672, -0.23366928100585938, -0.22368812561035156, -0.21370697021484375, -0.20372581481933594, -0.19374465942382812, -0.1837635040283203, -0.1737823486328125, -0.1638011932373047, -0.15382003784179688, -0.14383888244628906, -0.13385772705078125, -0.12387657165527344, -0.11389541625976562, -0.10391426086425781, -0.09393310546875, -0.08395195007324219, -0.07397079467773438, -0.06398963928222656, -0.05400848388671875, -0.04402732849121094, -0.034046173095703125, -0.024065017700195312, -0.0140838623046875, -0.0041027069091796875, 0.005878448486328125, 0.015859603881835938, 0.02584075927734375, 0.03582191467285156, 0.045803070068359375, 0.05578422546386719, 0.065765380859375, 0.07574653625488281, 0.08572769165039062, 0.09570884704589844, 0.10569000244140625, 0.11567115783691406, 0.12565231323242188, 0.1356334686279297, 0.1456146240234375, 0.1555957794189453, 0.16557693481445312, 0.17555809020996094, 0.18553924560546875, 0.19552040100097656, 0.20550155639648438, 0.2154827117919922, 0.2254638671875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 13.0, 16.0, 21.0, 42.0, 54.0, 138.0, 259.0, 469.0, 1027.0, 2764.0, 9440.0, 67206.0, 3656740.0, 426244.0, 22098.0, 4744.0, 1601.0, 619.0, 330.0, 178.0, 98.0, 63.0, 30.0, 19.0, 19.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8544921875, -0.8299026489257812, -0.8053131103515625, -0.7807235717773438, -0.756134033203125, -0.7315444946289062, -0.7069549560546875, -0.6823654174804688, -0.65777587890625, -0.6331863403320312, -0.6085968017578125, -0.5840072631835938, -0.559417724609375, -0.5348281860351562, -0.5102386474609375, -0.48564910888671875, -0.4610595703125, -0.43647003173828125, -0.4118804931640625, -0.38729095458984375, -0.362701416015625, -0.33811187744140625, -0.3135223388671875, -0.28893280029296875, -0.26434326171875, -0.23975372314453125, -0.2151641845703125, -0.19057464599609375, -0.165985107421875, -0.14139556884765625, -0.1168060302734375, -0.09221649169921875, -0.067626953125, -0.04303741455078125, -0.0184478759765625, 0.00614166259765625, 0.030731201171875, 0.05532073974609375, 0.0799102783203125, 0.10449981689453125, 0.12908935546875, 0.15367889404296875, 0.1782684326171875, 0.20285797119140625, 0.227447509765625, 0.25203704833984375, 0.2766265869140625, 0.30121612548828125, 0.3258056640625, 0.35039520263671875, 0.3749847412109375, 0.39957427978515625, 0.424163818359375, 0.44875335693359375, 0.4733428955078125, 0.49793243408203125, 0.52252197265625, 0.5471115112304688, 0.5717010498046875, 0.5962905883789062, 0.620880126953125, 0.6454696655273438, 0.6700592041015625, 0.6946487426757812, 0.71923828125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 8.0, 6.0, 3.0, 11.0, 12.0, 15.0, 33.0, 22.0, 44.0, 94.0, 142.0, 341.0, 593.0, 906.0, 779.0, 498.0, 239.0, 128.0, 72.0, 42.0, 24.0, 14.0, 15.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1684112548828125, -0.162750244140625, -0.1570892333984375, -0.15142822265625, -0.1457672119140625, -0.140106201171875, -0.1344451904296875, -0.1287841796875, -0.1231231689453125, -0.117462158203125, -0.1118011474609375, -0.10614013671875, -0.1004791259765625, -0.094818115234375, -0.0891571044921875, -0.08349609375, -0.0778350830078125, -0.072174072265625, -0.0665130615234375, -0.06085205078125, -0.0551910400390625, -0.049530029296875, -0.0438690185546875, -0.0382080078125, -0.0325469970703125, -0.026885986328125, -0.0212249755859375, -0.01556396484375, -0.0099029541015625, -0.004241943359375, 0.0014190673828125, 0.007080078125, 0.0127410888671875, 0.018402099609375, 0.0240631103515625, 0.02972412109375, 0.0353851318359375, 0.041046142578125, 0.0467071533203125, 0.0523681640625, 0.0580291748046875, 0.063690185546875, 0.0693511962890625, 0.07501220703125, 0.0806732177734375, 0.086334228515625, 0.0919952392578125, 0.09765625, 0.1033172607421875, 0.108978271484375, 0.1146392822265625, 0.12030029296875, 0.1259613037109375, 0.131622314453125, 0.1372833251953125, 0.1429443359375, 0.1486053466796875, 0.154266357421875, 0.1599273681640625, 0.16558837890625, 0.1712493896484375, 0.176910400390625, 0.1825714111328125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 13.0, 13.0, 23.0, 22.0, 35.0, 43.0, 62.0, 81.0, 117.0, 100.0, 107.0, 87.0, 86.0, 65.0, 35.0, 34.0, 21.0, 11.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6039164662361145, -0.5869348645210266, -0.5699533224105835, -0.5529717206954956, -0.5359901785850525, -0.5190085768699646, -0.5020270347595215, -0.4850454330444336, -0.4680638313293457, -0.4510822594165802, -0.4341006875038147, -0.4171190857887268, -0.4001375138759613, -0.3831559419631958, -0.3661743700504303, -0.3491927981376648, -0.3322112262248993, -0.3152296543121338, -0.2982480823993683, -0.2812665104866028, -0.2642849087715149, -0.2473033368587494, -0.2303217649459839, -0.21334019303321838, -0.1963586062192917, -0.17937703430652618, -0.1623954474925995, -0.14541387557983398, -0.12843230366706848, -0.11145071685314178, -0.09446914494037628, -0.07748756557703018, -0.06050598621368408, -0.04352440685033798, -0.02654283121228218, -0.00956125557422638, 0.0074203237891197205, 0.02440190315246582, 0.04138347506523132, 0.05836505442857742, 0.07534663379192352, 0.09232821315526962, 0.10930979251861572, 0.12629136443138123, 0.14327293634414673, 0.16025452315807343, 0.17723609507083893, 0.19421768188476562, 0.21119925379753113, 0.22818082571029663, 0.24516241252422333, 0.26214396953582764, 0.2791255712509155, 0.29610714316368103, 0.31308871507644653, 0.33007028698921204, 0.34705185890197754, 0.36403343081474304, 0.38101500272750854, 0.39799660444259644, 0.41497817635536194, 0.43195974826812744, 0.44894132018089294, 0.46592289209365845, 0.48290449380874634]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 5.0, 13.0, 11.0, 22.0, 20.0, 23.0, 26.0, 31.0, 33.0, 32.0, 26.0, 34.0, 24.0, 38.0, 49.0, 40.0, 41.0, 48.0, 37.0, 44.0, 36.0, 35.0, 40.0, 24.0, 22.0, 28.0, 28.0, 28.0, 20.0, 18.0, 15.0, 14.0, 12.0, 19.0, 6.0, 8.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23238198459148407, -0.22363820672035217, -0.21489444375038147, -0.20615066587924957, -0.19740688800811768, -0.18866312503814697, -0.17991934716701508, -0.17117556929588318, -0.16243180632591248, -0.15368802845478058, -0.14494426548480988, -0.13620048761367798, -0.12745672464370728, -0.11871294677257538, -0.10996916890144348, -0.10122539848089218, -0.09248162806034088, -0.08373785763978958, -0.07499408721923828, -0.06625030934810638, -0.057506538927555084, -0.048762768507003784, -0.040018994361162186, -0.03127522021532059, -0.022531449794769287, -0.013787677511572838, -0.0050439052283763885, 0.0036998670548200607, 0.01244363933801651, 0.02118740975856781, 0.02993118390440941, 0.03867495805025101, 0.04741871356964111, 0.05616248399019241, 0.06490625441074371, 0.07365003228187561, 0.08239380270242691, 0.09113757312297821, 0.09988135099411011, 0.10862512141466141, 0.11736889183521271, 0.1261126697063446, 0.1348564326763153, 0.1436002105474472, 0.1523439884185791, 0.1610877513885498, 0.1698315292596817, 0.1785753071308136, 0.1873190701007843, 0.1960628479719162, 0.2048066109418869, 0.2135503888130188, 0.2222941517829895, 0.2310379296541214, 0.2397817075252533, 0.248525470495224, 0.2572692632675171, 0.2660130262374878, 0.2747568190097809, 0.2835005819797516, 0.2922443449497223, 0.3009881377220154, 0.3097319006919861, 0.3184756636619568, 0.3272194266319275]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 13.0, 20.0, 27.0, 39.0, 73.0, 84.0, 118.0, 214.0, 312.0, 460.0, 759.0, 1270.0, 2170.0, 4156.0, 9171.0, 24218.0, 98379.0, 586832.0, 248921.0, 43965.0, 14166.0, 5990.0, 2918.0, 1600.0, 933.0, 591.0, 389.0, 262.0, 170.0, 106.0, 62.0, 45.0, 36.0, 20.0, 15.0, 9.0, 5.0, 12.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.13955307006835938, -0.13469696044921875, -0.12984085083007812, -0.1249847412109375, -0.12012863159179688, -0.11527252197265625, -0.11041641235351562, -0.105560302734375, -0.10070419311523438, -0.09584808349609375, -0.09099197387695312, -0.0861358642578125, -0.08127975463867188, -0.07642364501953125, -0.07156753540039062, -0.06671142578125, -0.061855316162109375, -0.05699920654296875, -0.052143096923828125, -0.0472869873046875, -0.042430877685546875, -0.03757476806640625, -0.032718658447265625, -0.027862548828125, -0.023006439208984375, -0.01815032958984375, -0.013294219970703125, -0.0084381103515625, -0.003582000732421875, 0.00127410888671875, 0.006130218505859375, 0.010986328125, 0.015842437744140625, 0.02069854736328125, 0.025554656982421875, 0.0304107666015625, 0.035266876220703125, 0.04012298583984375, 0.044979095458984375, 0.049835205078125, 0.054691314697265625, 0.05954742431640625, 0.06440353393554688, 0.0692596435546875, 0.07411575317382812, 0.07897186279296875, 0.08382797241210938, 0.08868408203125, 0.09354019165039062, 0.09839630126953125, 0.10325241088867188, 0.1081085205078125, 0.11296463012695312, 0.11782073974609375, 0.12267684936523438, 0.127532958984375, 0.13238906860351562, 0.13724517822265625, 0.14210128784179688, 0.1469573974609375, 0.15181350708007812, 0.15666961669921875, 0.16152572631835938, 0.1663818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 10.0, 13.0, 16.0, 15.0, 23.0, 27.0, 22.0, 37.0, 26.0, 33.0, 33.0, 37.0, 40.0, 42.0, 50.0, 47.0, 46.0, 47.0, 54.0, 46.0, 35.0, 41.0, 31.0, 33.0, 25.0, 32.0, 17.0, 19.0, 13.0, 17.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163330078125, -0.15766334533691406, -0.15199661254882812, -0.1463298797607422, -0.14066314697265625, -0.1349964141845703, -0.12932968139648438, -0.12366294860839844, -0.1179962158203125, -0.11232948303222656, -0.10666275024414062, -0.10099601745605469, -0.09532928466796875, -0.08966255187988281, -0.08399581909179688, -0.07832908630371094, -0.072662353515625, -0.06699562072753906, -0.061328887939453125, -0.05566215515136719, -0.04999542236328125, -0.04432868957519531, -0.038661956787109375, -0.03299522399902344, -0.0273284912109375, -0.021661758422851562, -0.015995025634765625, -0.010328292846679688, -0.00466156005859375, 0.0010051727294921875, 0.006671905517578125, 0.012338638305664062, 0.01800537109375, 0.023672103881835938, 0.029338836669921875, 0.03500556945800781, 0.04067230224609375, 0.04633903503417969, 0.052005767822265625, 0.05767250061035156, 0.0633392333984375, 0.06900596618652344, 0.07467269897460938, 0.08033943176269531, 0.08600616455078125, 0.09167289733886719, 0.09733963012695312, 0.10300636291503906, 0.108673095703125, 0.11433982849121094, 0.12000656127929688, 0.1256732940673828, 0.13134002685546875, 0.1370067596435547, 0.14267349243164062, 0.14834022521972656, 0.1540069580078125, 0.15967369079589844, 0.16534042358398438, 0.1710071563720703, 0.17667388916015625, 0.1823406219482422, 0.18800735473632812, 0.19367408752441406, 0.1993408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 18.0, 29.0, 36.0, 57.0, 64.0, 122.0, 171.0, 243.0, 386.0, 551.0, 914.0, 1617.0, 2973.0, 5527.0, 11247.0, 24351.0, 59996.0, 167231.0, 394070.0, 235657.0, 81571.0, 32087.0, 14017.0, 6841.0, 3598.0, 2021.0, 1147.0, 668.0, 437.0, 303.0, 168.0, 112.0, 85.0, 61.0, 52.0, 35.0, 17.0, 9.0, 9.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0687255859375, -0.06668376922607422, -0.06464195251464844, -0.06260013580322266, -0.060558319091796875, -0.058516502380371094, -0.05647468566894531, -0.05443286895751953, -0.05239105224609375, -0.05034923553466797, -0.04830741882324219, -0.046265602111816406, -0.044223785400390625, -0.042181968688964844, -0.04014015197753906, -0.03809833526611328, -0.0360565185546875, -0.03401470184326172, -0.03197288513183594, -0.029931068420410156, -0.027889251708984375, -0.025847434997558594, -0.023805618286132812, -0.02176380157470703, -0.01972198486328125, -0.01768016815185547, -0.015638351440429688, -0.013596534729003906, -0.011554718017578125, -0.009512901306152344, -0.0074710845947265625, -0.005429267883300781, -0.003387451171875, -0.0013456344604492188, 0.0006961822509765625, 0.0027379989624023438, 0.004779815673828125, 0.006821632385253906, 0.008863449096679688, 0.010905265808105469, 0.01294708251953125, 0.014988899230957031, 0.017030715942382812, 0.019072532653808594, 0.021114349365234375, 0.023156166076660156, 0.025197982788085938, 0.02723979949951172, 0.0292816162109375, 0.03132343292236328, 0.03336524963378906, 0.035407066345214844, 0.037448883056640625, 0.039490699768066406, 0.04153251647949219, 0.04357433319091797, 0.04561614990234375, 0.04765796661376953, 0.04969978332519531, 0.051741600036621094, 0.053783416748046875, 0.055825233459472656, 0.05786705017089844, 0.05990886688232422, 0.06195068359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 9.0, 28.0, 8.0, 17.0, 22.0, 27.0, 15.0, 25.0, 37.0, 37.0, 35.0, 45.0, 40.0, 44.0, 39.0, 34.0, 64.0, 46.0, 37.0, 41.0, 29.0, 45.0, 36.0, 35.0, 21.0, 21.0, 14.0, 18.0, 17.0, 18.0, 16.0, 11.0, 13.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.3994140625, -0.387939453125, -0.37646484375, -0.364990234375, -0.353515625, -0.342041015625, -0.33056640625, -0.319091796875, -0.3076171875, -0.296142578125, -0.28466796875, -0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 8.0, 13.0, 12.0, 20.0, 25.0, 43.0, 74.0, 108.0, 191.0, 301.0, 527.0, 1107.0, 2395.0, 6390.0, 21525.0, 109799.0, 570345.0, 273751.0, 44278.0, 10650.0, 3658.0, 1579.0, 773.0, 376.0, 214.0, 126.0, 88.0, 59.0, 31.0, 32.0, 15.0, 8.0, 10.0, 2.0, 6.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.030818462371826172, -0.029746055603027344, -0.028673648834228516, -0.027601242065429688, -0.02652883529663086, -0.02545642852783203, -0.024384021759033203, -0.023311614990234375, -0.022239208221435547, -0.02116680145263672, -0.02009439468383789, -0.019021987915039062, -0.017949581146240234, -0.016877174377441406, -0.015804767608642578, -0.01473236083984375, -0.013659954071044922, -0.012587547302246094, -0.011515140533447266, -0.010442733764648438, -0.00937032699584961, -0.008297920227050781, -0.007225513458251953, -0.006153106689453125, -0.005080699920654297, -0.004008293151855469, -0.0029358863830566406, -0.0018634796142578125, -0.0007910728454589844, 0.00028133392333984375, 0.0013537406921386719, 0.0024261474609375, 0.003498554229736328, 0.004570960998535156, 0.005643367767333984, 0.0067157745361328125, 0.007788181304931641, 0.008860588073730469, 0.009932994842529297, 0.011005401611328125, 0.012077808380126953, 0.013150215148925781, 0.01422262191772461, 0.015295028686523438, 0.016367435455322266, 0.017439842224121094, 0.018512248992919922, 0.01958465576171875, 0.020657062530517578, 0.021729469299316406, 0.022801876068115234, 0.023874282836914062, 0.02494668960571289, 0.02601909637451172, 0.027091503143310547, 0.028163909912109375, 0.029236316680908203, 0.03030872344970703, 0.03138113021850586, 0.03245353698730469, 0.033525943756103516, 0.034598350524902344, 0.03567075729370117, 0.0367431640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 16.0, 25.0, 27.0, 31.0, 53.0, 65.0, 77.0, 99.0, 91.0, 105.0, 85.0, 56.0, 60.0, 40.0, 24.0, 27.0, 11.0, 16.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0347925126552582e-05, -9.90740954875946e-06, -9.466893970966339e-06, -9.026378393173218e-06, -8.585862815380096e-06, -8.145347237586975e-06, -7.704831659793854e-06, -7.264316082000732e-06, -6.823800504207611e-06, -6.38328492641449e-06, -5.942769348621368e-06, -5.502253770828247e-06, -5.061738193035126e-06, -4.621222615242004e-06, -4.180707037448883e-06, -3.7401914596557617e-06, -3.2996758818626404e-06, -2.859160304069519e-06, -2.4186447262763977e-06, -1.9781291484832764e-06, -1.537613570690155e-06, -1.0970979928970337e-06, -6.565824151039124e-07, -2.1606683731079102e-07, 2.2444874048233032e-07, 6.649643182754517e-07, 1.105479896068573e-06, 1.5459954738616943e-06, 1.9865110516548157e-06, 2.427026629447937e-06, 2.8675422072410583e-06, 3.3080577850341797e-06, 3.748573362827301e-06, 4.189088940620422e-06, 4.629604518413544e-06, 5.070120096206665e-06, 5.510635673999786e-06, 5.951151251792908e-06, 6.391666829586029e-06, 6.83218240737915e-06, 7.272697985172272e-06, 7.713213562965393e-06, 8.153729140758514e-06, 8.594244718551636e-06, 9.034760296344757e-06, 9.475275874137878e-06, 9.915791451931e-06, 1.0356307029724121e-05, 1.0796822607517242e-05, 1.1237338185310364e-05, 1.1677853763103485e-05, 1.2118369340896606e-05, 1.2558884918689728e-05, 1.2999400496482849e-05, 1.343991607427597e-05, 1.3880431652069092e-05, 1.4320947229862213e-05, 1.4761462807655334e-05, 1.5201978385448456e-05, 1.5642493963241577e-05, 1.60830095410347e-05, 1.652352511882782e-05, 1.696404069662094e-05, 1.7404556274414062e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 11.0, 13.0, 24.0, 24.0, 52.0, 77.0, 129.0, 216.0, 391.0, 614.0, 1201.0, 2307.0, 4991.0, 11319.0, 27877.0, 75350.0, 209710.0, 380238.0, 209781.0, 75007.0, 27908.0, 11228.0, 4973.0, 2362.0, 1213.0, 630.0, 358.0, 215.0, 124.0, 79.0, 47.0, 20.0, 24.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0277862548828125, -0.02700352668762207, -0.02622079849243164, -0.02543807029724121, -0.02465534210205078, -0.02387261390686035, -0.023089885711669922, -0.022307157516479492, -0.021524429321289062, -0.020741701126098633, -0.019958972930908203, -0.019176244735717773, -0.018393516540527344, -0.017610788345336914, -0.016828060150146484, -0.016045331954956055, -0.015262603759765625, -0.014479875564575195, -0.013697147369384766, -0.012914419174194336, -0.012131690979003906, -0.011348962783813477, -0.010566234588623047, -0.009783506393432617, -0.009000778198242188, -0.008218050003051758, -0.007435321807861328, -0.0066525936126708984, -0.005869865417480469, -0.005087137222290039, -0.004304409027099609, -0.0035216808319091797, -0.00273895263671875, -0.0019562244415283203, -0.0011734962463378906, -0.00039076805114746094, 0.00039196014404296875, 0.0011746883392333984, 0.001957416534423828, 0.002740144729614258, 0.0035228729248046875, 0.004305601119995117, 0.005088329315185547, 0.0058710575103759766, 0.006653785705566406, 0.007436513900756836, 0.008219242095947266, 0.009001970291137695, 0.009784698486328125, 0.010567426681518555, 0.011350154876708984, 0.012132883071899414, 0.012915611267089844, 0.013698339462280273, 0.014481067657470703, 0.015263795852661133, 0.016046524047851562, 0.016829252243041992, 0.017611980438232422, 0.01839470863342285, 0.01917743682861328, 0.01996016502380371, 0.02074289321899414, 0.02152562141418457, 0.022308349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 9.0, 15.0, 14.0, 25.0, 21.0, 22.0, 26.0, 38.0, 33.0, 61.0, 58.0, 56.0, 59.0, 56.0, 66.0, 63.0, 48.0, 54.0, 44.0, 35.0, 32.0, 40.0, 33.0, 10.0, 9.0, 12.0, 12.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005947113037109375, -0.005723774433135986, -0.005500435829162598, -0.005277097225189209, -0.00505375862121582, -0.004830420017242432, -0.004607081413269043, -0.004383742809295654, -0.004160404205322266, -0.003937065601348877, -0.0037137269973754883, -0.0034903883934020996, -0.003267049789428711, -0.0030437111854553223, -0.0028203725814819336, -0.002597033977508545, -0.0023736953735351562, -0.0021503567695617676, -0.001927018165588379, -0.0017036795616149902, -0.0014803409576416016, -0.0012570023536682129, -0.0010336637496948242, -0.0008103251457214355, -0.0005869865417480469, -0.0003636479377746582, -0.00014030933380126953, 8.302927017211914e-05, 0.0003063678741455078, 0.0005297064781188965, 0.0007530450820922852, 0.0009763836860656738, 0.0011997222900390625, 0.0014230608940124512, 0.0016463994979858398, 0.0018697381019592285, 0.002093076705932617, 0.002316415309906006, 0.0025397539138793945, 0.002763092517852783, 0.002986431121826172, 0.0032097697257995605, 0.0034331083297729492, 0.003656446933746338, 0.0038797855377197266, 0.004103124141693115, 0.004326462745666504, 0.004549801349639893, 0.004773139953613281, 0.00499647855758667, 0.005219817161560059, 0.005443155765533447, 0.005666494369506836, 0.005889832973480225, 0.006113171577453613, 0.006336510181427002, 0.006559848785400391, 0.006783187389373779, 0.007006525993347168, 0.007229864597320557, 0.007453203201293945, 0.007676541805267334, 0.007899880409240723, 0.008123219013214111, 0.0083465576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 14.0, 14.0, 23.0, 36.0, 61.0, 63.0, 98.0, 109.0, 145.0, 129.0, 78.0, 75.0, 42.0, 45.0, 18.0, 14.0, 11.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.373170405626297, -0.3620213270187378, -0.3508722484111786, -0.3397231698036194, -0.32857412099838257, -0.31742504239082336, -0.30627596378326416, -0.29512688517570496, -0.28397780656814575, -0.27282872796058655, -0.26167964935302734, -0.2505306005477905, -0.23938152194023132, -0.22823244333267212, -0.21708336472511292, -0.2059342861175537, -0.1947852373123169, -0.1836361587047577, -0.17248709499835968, -0.16133801639080048, -0.15018895268440247, -0.13903987407684326, -0.12789079546928406, -0.11674172431230545, -0.10559265315532684, -0.09444358199834824, -0.08329451084136963, -0.07214543223381042, -0.06099636107683182, -0.04984728991985321, -0.038698211312294006, -0.0275491401553154, -0.016400068998336792, -0.005250995978713036, 0.005898077040910721, 0.017047151923179626, 0.028196223080158234, 0.03934529423713684, 0.050494372844696045, 0.06164344400167465, 0.07279251515865326, 0.08394158631563187, 0.09509065747261047, 0.10623973608016968, 0.11738880723714828, 0.1285378783941269, 0.1396869570016861, 0.1508360207080841, 0.1619850993156433, 0.17313417792320251, 0.18428324162960052, 0.19543232023715973, 0.20658138394355774, 0.21773046255111694, 0.22887954115867615, 0.24002861976623535, 0.25117766857147217, 0.26232674717903137, 0.2734758257865906, 0.2846248745918274, 0.2957739531993866, 0.3069230318069458, 0.318072110414505, 0.3292211890220642, 0.3403702676296234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 13.0, 9.0, 14.0, 22.0, 21.0, 35.0, 31.0, 42.0, 33.0, 42.0, 42.0, 48.0, 54.0, 54.0, 62.0, 52.0, 48.0, 49.0, 44.0, 38.0, 35.0, 40.0, 30.0, 33.0, 17.0, 14.0, 12.0, 18.0, 15.0, 5.0, 5.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.22568418085575104, -0.21931801736354828, -0.2129518687725067, -0.20658570528030396, -0.2002195417881012, -0.19385339319705963, -0.18748722970485687, -0.1811210811138153, -0.17475491762161255, -0.1683887541294098, -0.16202260553836823, -0.15565644204616547, -0.1492902785539627, -0.14292412996292114, -0.13655796647071838, -0.13019180297851562, -0.12382564693689346, -0.1174594908952713, -0.11109332740306854, -0.10472717136144638, -0.09836101531982422, -0.09199485182762146, -0.0856286957859993, -0.07926253974437714, -0.07289637625217438, -0.06653022021055222, -0.060164060443639755, -0.053797900676727295, -0.04743174463510513, -0.04106558486819267, -0.03469942510128021, -0.02833326905965805, -0.02196711301803589, -0.015600955113768578, -0.009234796278178692, -0.002868637442588806, 0.003497520461678505, 0.009863678365945816, 0.016229838132858276, 0.022595994174480438, 0.0289621539413929, 0.03532831370830536, 0.04169446974992752, 0.04806062951683998, 0.05442678928375244, 0.0607929453253746, 0.06715910136699677, 0.07352526485919952, 0.07989142090082169, 0.08625757694244385, 0.0926237404346466, 0.09898989647626877, 0.10535605251789093, 0.11172221601009369, 0.11808837205171585, 0.12445452809333801, 0.13082069158554077, 0.13718685507774353, 0.1435530036687851, 0.14991916716098785, 0.1562853306531906, 0.16265147924423218, 0.16901764273643494, 0.1753838062286377, 0.18174995481967926]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 17.0, 14.0, 17.0, 21.0, 40.0, 68.0, 79.0, 135.0, 229.0, 315.0, 435.0, 766.0, 1268.0, 2184.0, 3842.0, 7524.0, 15444.0, 36895.0, 110461.0, 471382.0, 277656.0, 68769.0, 25994.0, 11590.0, 5701.0, 3065.0, 1735.0, 1045.0, 644.0, 411.0, 275.0, 170.0, 107.0, 85.0, 50.0, 31.0, 19.0, 19.0, 15.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27685546875, -0.2678680419921875, -0.258880615234375, -0.2498931884765625, -0.24090576171875, -0.2319183349609375, -0.222930908203125, -0.2139434814453125, -0.2049560546875, -0.1959686279296875, -0.186981201171875, -0.1779937744140625, -0.16900634765625, -0.1600189208984375, -0.151031494140625, -0.1420440673828125, -0.133056640625, -0.1240692138671875, -0.115081787109375, -0.1060943603515625, -0.09710693359375, -0.0881195068359375, -0.079132080078125, -0.0701446533203125, -0.0611572265625, -0.0521697998046875, -0.043182373046875, -0.0341949462890625, -0.02520751953125, -0.0162200927734375, -0.007232666015625, 0.0017547607421875, 0.0107421875, 0.0197296142578125, 0.028717041015625, 0.0377044677734375, 0.04669189453125, 0.0556793212890625, 0.064666748046875, 0.0736541748046875, 0.0826416015625, 0.0916290283203125, 0.100616455078125, 0.1096038818359375, 0.11859130859375, 0.1275787353515625, 0.136566162109375, 0.1455535888671875, 0.154541015625, 0.1635284423828125, 0.172515869140625, 0.1815032958984375, 0.19049072265625, 0.1994781494140625, 0.208465576171875, 0.2174530029296875, 0.2264404296875, 0.2354278564453125, 0.244415283203125, 0.2534027099609375, 0.26239013671875, 0.2713775634765625, 0.280364990234375, 0.2893524169921875, 0.29833984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 12.0, 8.0, 15.0, 21.0, 20.0, 24.0, 24.0, 23.0, 37.0, 41.0, 44.0, 44.0, 46.0, 44.0, 41.0, 52.0, 58.0, 64.0, 41.0, 52.0, 28.0, 43.0, 37.0, 25.0, 27.0, 22.0, 16.0, 18.0, 16.0, 8.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4253082275390625, -0.413360595703125, -0.4014129638671875, -0.38946533203125, -0.3775177001953125, -0.365570068359375, -0.3536224365234375, -0.3416748046875, -0.3297271728515625, -0.317779541015625, -0.3058319091796875, -0.29388427734375, -0.2819366455078125, -0.269989013671875, -0.2580413818359375, -0.24609375, -0.2341461181640625, -0.222198486328125, -0.2102508544921875, -0.19830322265625, -0.1863555908203125, -0.174407958984375, -0.1624603271484375, -0.1505126953125, -0.1385650634765625, -0.126617431640625, -0.1146697998046875, -0.10272216796875, -0.0907745361328125, -0.078826904296875, -0.0668792724609375, -0.054931640625, -0.0429840087890625, -0.031036376953125, -0.0190887451171875, -0.00714111328125, 0.0048065185546875, 0.016754150390625, 0.0287017822265625, 0.0406494140625, 0.0525970458984375, 0.064544677734375, 0.0764923095703125, 0.08843994140625, 0.1003875732421875, 0.112335205078125, 0.1242828369140625, 0.13623046875, 0.1481781005859375, 0.160125732421875, 0.1720733642578125, 0.18402099609375, 0.1959686279296875, 0.207916259765625, 0.2198638916015625, 0.2318115234375, 0.2437591552734375, 0.255706787109375, 0.2676544189453125, 0.27960205078125, 0.2915496826171875, 0.303497314453125, 0.3154449462890625, 0.327392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 15.0, 15.0, 18.0, 21.0, 27.0, 42.0, 76.0, 101.0, 161.0, 368.0, 782.0, 2165.0, 8315.0, 42808.0, 537312.0, 409296.0, 36514.0, 7090.0, 2018.0, 665.0, 300.0, 147.0, 113.0, 64.0, 33.0, 18.0, 20.0, 14.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489990234375, -0.4724617004394531, -0.45493316650390625, -0.4374046325683594, -0.4198760986328125, -0.4023475646972656, -0.38481903076171875, -0.3672904968261719, -0.349761962890625, -0.3322334289550781, -0.31470489501953125, -0.2971763610839844, -0.2796478271484375, -0.2621192932128906, -0.24459075927734375, -0.22706222534179688, -0.20953369140625, -0.19200515747070312, -0.17447662353515625, -0.15694808959960938, -0.1394195556640625, -0.12189102172851562, -0.10436248779296875, -0.08683395385742188, -0.069305419921875, -0.051776885986328125, -0.03424835205078125, -0.016719818115234375, 0.0008087158203125, 0.018337249755859375, 0.03586578369140625, 0.053394317626953125, 0.0709228515625, 0.08845138549804688, 0.10597991943359375, 0.12350845336914062, 0.1410369873046875, 0.15856552124023438, 0.17609405517578125, 0.19362258911132812, 0.211151123046875, 0.22867965698242188, 0.24620819091796875, 0.2637367248535156, 0.2812652587890625, 0.2987937927246094, 0.31632232666015625, 0.3338508605957031, 0.35137939453125, 0.3689079284667969, 0.38643646240234375, 0.4039649963378906, 0.4214935302734375, 0.4390220642089844, 0.45655059814453125, 0.4740791320800781, 0.491607666015625, 0.5091361999511719, 0.5266647338867188, 0.5441932678222656, 0.5617218017578125, 0.5792503356933594, 0.5967788696289062, 0.6143074035644531, 0.6318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 9.0, 12.0, 11.0, 12.0, 11.0, 22.0, 20.0, 26.0, 41.0, 36.0, 48.0, 48.0, 41.0, 50.0, 43.0, 65.0, 54.0, 51.0, 57.0, 48.0, 51.0, 35.0, 30.0, 29.0, 33.0, 23.0, 12.0, 15.0, 9.0, 13.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.4971504211425781, -0.48258209228515625, -0.4680137634277344, -0.4534454345703125, -0.4388771057128906, -0.42430877685546875, -0.4097404479980469, -0.395172119140625, -0.3806037902832031, -0.36603546142578125, -0.3514671325683594, -0.3368988037109375, -0.3223304748535156, -0.30776214599609375, -0.2931938171386719, -0.27862548828125, -0.2640571594238281, -0.24948883056640625, -0.23492050170898438, -0.2203521728515625, -0.20578384399414062, -0.19121551513671875, -0.17664718627929688, -0.162078857421875, -0.14751052856445312, -0.13294219970703125, -0.11837387084960938, -0.1038055419921875, -0.08923721313476562, -0.07466888427734375, -0.060100555419921875, -0.0455322265625, -0.030963897705078125, -0.01639556884765625, -0.001827239990234375, 0.0127410888671875, 0.027309417724609375, 0.04187774658203125, 0.056446075439453125, 0.071014404296875, 0.08558273315429688, 0.10015106201171875, 0.11471939086914062, 0.1292877197265625, 0.14385604858398438, 0.15842437744140625, 0.17299270629882812, 0.18756103515625, 0.20212936401367188, 0.21669769287109375, 0.23126602172851562, 0.2458343505859375, 0.2604026794433594, 0.27497100830078125, 0.2895393371582031, 0.304107666015625, 0.3186759948730469, 0.33324432373046875, 0.3478126525878906, 0.3623809814453125, 0.3769493103027344, 0.39151763916015625, 0.4060859680175781, 0.420654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 17.0, 33.0, 57.0, 155.0, 397.0, 1425.0, 8287.0, 141495.0, 853355.0, 38279.0, 3683.0, 804.0, 263.0, 119.0, 47.0, 41.0, 13.0, 7.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.17731857299804688, -0.17165374755859375, -0.16598892211914062, -0.1603240966796875, -0.15465927124023438, -0.14899444580078125, -0.14332962036132812, -0.137664794921875, -0.13199996948242188, -0.12633514404296875, -0.12067031860351562, -0.1150054931640625, -0.10934066772460938, -0.10367584228515625, -0.09801101684570312, -0.09234619140625, -0.08668136596679688, -0.08101654052734375, -0.07535171508789062, -0.0696868896484375, -0.06402206420898438, -0.05835723876953125, -0.052692413330078125, -0.047027587890625, -0.041362762451171875, -0.03569793701171875, -0.030033111572265625, -0.0243682861328125, -0.018703460693359375, -0.01303863525390625, -0.007373809814453125, -0.001708984375, 0.003955841064453125, 0.00962066650390625, 0.015285491943359375, 0.0209503173828125, 0.026615142822265625, 0.03227996826171875, 0.037944793701171875, 0.043609619140625, 0.049274444580078125, 0.05493927001953125, 0.060604095458984375, 0.0662689208984375, 0.07193374633789062, 0.07759857177734375, 0.08326339721679688, 0.08892822265625, 0.09459304809570312, 0.10025787353515625, 0.10592269897460938, 0.1115875244140625, 0.11725234985351562, 0.12291717529296875, 0.12858200073242188, 0.134246826171875, 0.13991165161132812, 0.14557647705078125, 0.15124130249023438, 0.1569061279296875, 0.16257095336914062, 0.16823577880859375, 0.17390060424804688, 0.1795654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 30.0, 27.0, 69.0, 79.0, 102.0, 191.0, 155.0, 88.0, 70.0, 39.0, 30.0, 19.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2024305760860443e-05, -1.1472031474113464e-05, -1.0919757187366486e-05, -1.0367482900619507e-05, -9.815208613872528e-06, -9.26293432712555e-06, -8.71066004037857e-06, -8.158385753631592e-06, -7.606111466884613e-06, -7.053837180137634e-06, -6.5015628933906555e-06, -5.949288606643677e-06, -5.397014319896698e-06, -4.844740033149719e-06, -4.2924657464027405e-06, -3.7401914596557617e-06, -3.187917172908783e-06, -2.635642886161804e-06, -2.0833685994148254e-06, -1.5310943126678467e-06, -9.78820025920868e-07, -4.2654573917388916e-07, 1.257285475730896e-07, 6.780028343200684e-07, 1.2302771210670471e-06, 1.7825514078140259e-06, 2.3348256945610046e-06, 2.8870999813079834e-06, 3.439374268054962e-06, 3.991648554801941e-06, 4.54392284154892e-06, 5.0961971282958984e-06, 5.648471415042877e-06, 6.200745701789856e-06, 6.753019988536835e-06, 7.3052942752838135e-06, 7.857568562030792e-06, 8.409842848777771e-06, 8.96211713552475e-06, 9.514391422271729e-06, 1.0066665709018707e-05, 1.0618939995765686e-05, 1.1171214282512665e-05, 1.1723488569259644e-05, 1.2275762856006622e-05, 1.2828037142753601e-05, 1.338031142950058e-05, 1.3932585716247559e-05, 1.4484860002994537e-05, 1.5037134289741516e-05, 1.5589408576488495e-05, 1.6141682863235474e-05, 1.6693957149982452e-05, 1.724623143672943e-05, 1.779850572347641e-05, 1.835078001022339e-05, 1.8903054296970367e-05, 1.9455328583717346e-05, 2.0007602870464325e-05, 2.0559877157211304e-05, 2.1112151443958282e-05, 2.166442573070526e-05, 2.221670001745224e-05, 2.276897430419922e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 21.0, 40.0, 60.0, 110.0, 210.0, 425.0, 826.0, 1726.0, 4588.0, 19135.0, 193150.0, 753078.0, 60098.0, 9558.0, 2974.0, 1238.0, 609.0, 338.0, 146.0, 75.0, 53.0, 29.0, 10.0, 15.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.151336669921875, -0.14678955078125, -0.142242431640625, -0.1376953125, -0.133148193359375, -0.12860107421875, -0.124053955078125, -0.1195068359375, -0.114959716796875, -0.11041259765625, -0.105865478515625, -0.101318359375, -0.096771240234375, -0.09222412109375, -0.087677001953125, -0.0831298828125, -0.078582763671875, -0.07403564453125, -0.069488525390625, -0.06494140625, -0.060394287109375, -0.05584716796875, -0.051300048828125, -0.0467529296875, -0.042205810546875, -0.03765869140625, -0.033111572265625, -0.028564453125, -0.024017333984375, -0.01947021484375, -0.014923095703125, -0.0103759765625, -0.005828857421875, -0.00128173828125, 0.003265380859375, 0.0078125, 0.012359619140625, 0.01690673828125, 0.021453857421875, 0.0260009765625, 0.030548095703125, 0.03509521484375, 0.039642333984375, 0.044189453125, 0.048736572265625, 0.05328369140625, 0.057830810546875, 0.0623779296875, 0.066925048828125, 0.07147216796875, 0.076019287109375, 0.08056640625, 0.085113525390625, 0.08966064453125, 0.094207763671875, 0.0987548828125, 0.103302001953125, 0.10784912109375, 0.112396240234375, 0.116943359375, 0.121490478515625, 0.12603759765625, 0.130584716796875, 0.1351318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 4.0, 10.0, 13.0, 10.0, 29.0, 51.0, 73.0, 104.0, 118.0, 178.0, 128.0, 95.0, 51.0, 41.0, 25.0, 18.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.062290191650390625, -0.06024932861328125, -0.058208465576171875, -0.0561676025390625, -0.054126739501953125, -0.05208587646484375, -0.050045013427734375, -0.048004150390625, -0.045963287353515625, -0.04392242431640625, -0.041881561279296875, -0.0398406982421875, -0.037799835205078125, -0.03575897216796875, -0.033718109130859375, -0.03167724609375, -0.029636383056640625, -0.02759552001953125, -0.025554656982421875, -0.0235137939453125, -0.021472930908203125, -0.01943206787109375, -0.017391204833984375, -0.015350341796875, -0.013309478759765625, -0.01126861572265625, -0.009227752685546875, -0.0071868896484375, -0.005146026611328125, -0.00310516357421875, -0.001064300537109375, 0.0009765625, 0.003017425537109375, 0.00505828857421875, 0.007099151611328125, 0.0091400146484375, 0.011180877685546875, 0.01322174072265625, 0.015262603759765625, 0.017303466796875, 0.019344329833984375, 0.02138519287109375, 0.023426055908203125, 0.0254669189453125, 0.027507781982421875, 0.02954864501953125, 0.031589508056640625, 0.03363037109375, 0.035671234130859375, 0.03771209716796875, 0.039752960205078125, 0.0417938232421875, 0.043834686279296875, 0.04587554931640625, 0.047916412353515625, 0.049957275390625, 0.051998138427734375, 0.05403900146484375, 0.056079864501953125, 0.0581207275390625, 0.060161590576171875, 0.06220245361328125, 0.06424331665039062, 0.0662841796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 112.0, 500.0, 333.0, 45.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33184677362442017, -0.2141825258731842, -0.09651826322078705, 0.021145999431610107, 0.13881024718284607, 0.25647449493408203, 0.3741387724876404, 0.49180299043655396, 0.6094672679901123, 0.7271315455436707, 0.8447957634925842, 0.9624600410461426, 1.0801242589950562, 1.1977884769439697, 1.3154528141021729, 1.4331170320510864, 1.55078125, 1.6684454679489136, 1.7861098051071167, 1.9037740230560303, 2.0214383602142334, 2.1391024589538574, 2.2567667961120605, 2.3744311332702637, 2.492095470428467, 2.60975980758667, 2.727423906326294, 2.845088243484497, 2.9627525806427, 3.080416679382324, 3.1980810165405273, 3.3157453536987305, 3.4334094524383545, 3.5510737895965576, 3.6687378883361816, 3.7864022254943848, 3.904066562652588, 4.021730899810791, 4.139394760131836, 4.257059097290039, 4.374723434448242, 4.492387771606445, 4.610052108764648, 4.727716445922852, 4.8453803062438965, 4.9630446434021, 5.080708980560303, 5.198373317718506, 5.316037654876709, 5.433701992034912, 5.551366329193115, 5.66903018951416, 5.786694526672363, 5.904358863830566, 6.0220232009887695, 6.139687538146973, 6.257351398468018, 6.375015735626221, 6.492680072784424, 6.610343933105469, 6.728008270263672, 6.845672607421875, 6.963336944580078, 7.081001281738281, 7.198665618896484]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 7.0, 2.0, 5.0, 9.0, 10.0, 24.0, 17.0, 14.0, 13.0, 21.0, 23.0, 26.0, 38.0, 26.0, 38.0, 33.0, 41.0, 48.0, 49.0, 40.0, 37.0, 36.0, 47.0, 42.0, 42.0, 37.0, 28.0, 25.0, 33.0, 34.0, 20.0, 24.0, 11.0, 18.0, 17.0, 13.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5970219373703003, -0.5782413482666016, -0.5594608187675476, -0.5406802296638489, -0.5218996405601501, -0.5031190514564514, -0.48433852195739746, -0.46555793285369873, -0.44677734375, -0.42799678444862366, -0.4092161953449249, -0.3904356360435486, -0.37165504693984985, -0.3528744876384735, -0.33409392833709717, -0.31531333923339844, -0.2965327799320221, -0.27775222063064575, -0.258971631526947, -0.24019107222557068, -0.22141048312187195, -0.2026299238204956, -0.18384934961795807, -0.16506877541542053, -0.146288201212883, -0.12750762701034546, -0.10872705280780792, -0.08994648605585098, -0.07116591185331345, -0.05238533765077591, -0.03360477089881897, -0.014824196696281433, 0.0039563775062561035, 0.02273694984614849, 0.04151752218604088, 0.060298092663288116, 0.07907866686582565, 0.09785924106836319, 0.11663980782032013, 0.13542038202285767, 0.1542009562253952, 0.17298153042793274, 0.19176210463047028, 0.2105426788330078, 0.22932323813438416, 0.24810382723808289, 0.26688438653945923, 0.28566497564315796, 0.3044455349445343, 0.32322609424591064, 0.3420066833496094, 0.3607872426509857, 0.37956783175468445, 0.3983483910560608, 0.4171289801597595, 0.43590953946113586, 0.4546900987625122, 0.47347065806388855, 0.4922512471675873, 0.5110318064689636, 0.5298123955726624, 0.5485929846763611, 0.567373514175415, 0.5861541032791138, 0.6049346923828125]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 7.0, 13.0, 16.0, 27.0, 31.0, 61.0, 100.0, 172.0, 319.0, 516.0, 973.0, 1792.0, 3760.0, 10696.0, 85813.0, 3086244.0, 961500.0, 29456.0, 6998.0, 2727.0, 1274.0, 713.0, 425.0, 251.0, 126.0, 90.0, 55.0, 50.0, 26.0, 21.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.4630126953125, -0.445068359375, -0.4271240234375, -0.4091796875, -0.3912353515625, -0.373291015625, -0.3553466796875, -0.33740234375, -0.3194580078125, -0.301513671875, -0.2835693359375, -0.265625, -0.2476806640625, -0.229736328125, -0.2117919921875, -0.19384765625, -0.1759033203125, -0.157958984375, -0.1400146484375, -0.1220703125, -0.1041259765625, -0.086181640625, -0.0682373046875, -0.05029296875, -0.0323486328125, -0.014404296875, 0.0035400390625, 0.021484375, 0.0394287109375, 0.057373046875, 0.0753173828125, 0.09326171875, 0.1112060546875, 0.129150390625, 0.1470947265625, 0.1650390625, 0.1829833984375, 0.200927734375, 0.2188720703125, 0.23681640625, 0.2547607421875, 0.272705078125, 0.2906494140625, 0.30859375, 0.3265380859375, 0.344482421875, 0.3624267578125, 0.38037109375, 0.3983154296875, 0.416259765625, 0.4342041015625, 0.4521484375, 0.4700927734375, 0.488037109375, 0.5059814453125, 0.52392578125, 0.5418701171875, 0.559814453125, 0.5777587890625, 0.595703125, 0.6136474609375, 0.631591796875, 0.6495361328125, 0.66748046875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 26.0, 30.0, 41.0, 34.0, 47.0, 61.0, 65.0, 68.0, 57.0, 67.0, 49.0, 47.0, 50.0, 50.0, 42.0, 37.0, 35.0, 32.0, 24.0, 16.0, 13.0, 8.0, 9.0, 15.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2706260681152344, -0.26317596435546875, -0.2557258605957031, -0.2482757568359375, -0.24082565307617188, -0.23337554931640625, -0.22592544555664062, -0.218475341796875, -0.21102523803710938, -0.20357513427734375, -0.19612503051757812, -0.1886749267578125, -0.18122482299804688, -0.17377471923828125, -0.16632461547851562, -0.15887451171875, -0.15142440795898438, -0.14397430419921875, -0.13652420043945312, -0.1290740966796875, -0.12162399291992188, -0.11417388916015625, -0.10672378540039062, -0.099273681640625, -0.09182357788085938, -0.08437347412109375, -0.07692337036132812, -0.0694732666015625, -0.062023162841796875, -0.05457305908203125, -0.047122955322265625, -0.0396728515625, -0.032222747802734375, -0.02477264404296875, -0.017322540283203125, -0.0098724365234375, -0.002422332763671875, 0.00502777099609375, 0.012477874755859375, 0.019927978515625, 0.027378082275390625, 0.03482818603515625, 0.042278289794921875, 0.0497283935546875, 0.057178497314453125, 0.06462860107421875, 0.07207870483398438, 0.07952880859375, 0.08697891235351562, 0.09442901611328125, 0.10187911987304688, 0.1093292236328125, 0.11677932739257812, 0.12422943115234375, 0.13167953491210938, 0.139129638671875, 0.14657974243164062, 0.15402984619140625, 0.16147994995117188, 0.1689300537109375, 0.17638015747070312, 0.18383026123046875, 0.19128036499023438, 0.19873046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 4.0, 6.0, 8.0, 6.0, 9.0, 8.0, 16.0, 23.0, 30.0, 38.0, 66.0, 92.0, 202.0, 407.0, 802.0, 1862.0, 4985.0, 17688.0, 124414.0, 3458518.0, 535635.0, 36028.0, 8119.0, 2907.0, 1196.0, 536.0, 270.0, 141.0, 79.0, 49.0, 38.0, 18.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.478515625, -0.4629364013671875, -0.447357177734375, -0.4317779541015625, -0.41619873046875, -0.4006195068359375, -0.385040283203125, -0.3694610595703125, -0.3538818359375, -0.3383026123046875, -0.322723388671875, -0.3071441650390625, -0.29156494140625, -0.2759857177734375, -0.260406494140625, -0.2448272705078125, -0.229248046875, -0.2136688232421875, -0.198089599609375, -0.1825103759765625, -0.16693115234375, -0.1513519287109375, -0.135772705078125, -0.1201934814453125, -0.1046142578125, -0.0890350341796875, -0.073455810546875, -0.0578765869140625, -0.04229736328125, -0.0267181396484375, -0.011138916015625, 0.0044403076171875, 0.02001953125, 0.0355987548828125, 0.051177978515625, 0.0667572021484375, 0.08233642578125, 0.0979156494140625, 0.113494873046875, 0.1290740966796875, 0.1446533203125, 0.1602325439453125, 0.175811767578125, 0.1913909912109375, 0.20697021484375, 0.2225494384765625, 0.238128662109375, 0.2537078857421875, 0.269287109375, 0.2848663330078125, 0.300445556640625, 0.3160247802734375, 0.33160400390625, 0.3471832275390625, 0.362762451171875, 0.3783416748046875, 0.3939208984375, 0.4095001220703125, 0.425079345703125, 0.4406585693359375, 0.45623779296875, 0.4718170166015625, 0.487396240234375, 0.5029754638671875, 0.5185546875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 12.0, 6.0, 19.0, 22.0, 38.0, 44.0, 69.0, 124.0, 188.0, 284.0, 484.0, 588.0, 653.0, 509.0, 355.0, 219.0, 131.0, 87.0, 56.0, 44.0, 26.0, 18.0, 14.0, 14.0, 7.0, 10.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.12042236328125, -0.11680030822753906, -0.11317825317382812, -0.10955619812011719, -0.10593414306640625, -0.10231208801269531, -0.09869003295898438, -0.09506797790527344, -0.0914459228515625, -0.08782386779785156, -0.08420181274414062, -0.08057975769042969, -0.07695770263671875, -0.07333564758300781, -0.06971359252929688, -0.06609153747558594, -0.062469482421875, -0.05884742736816406, -0.055225372314453125, -0.05160331726074219, -0.04798126220703125, -0.04435920715332031, -0.040737152099609375, -0.03711509704589844, -0.0334930419921875, -0.029870986938476562, -0.026248931884765625, -0.022626876831054688, -0.01900482177734375, -0.015382766723632812, -0.011760711669921875, -0.008138656616210938, -0.0045166015625, -0.0008945465087890625, 0.002727508544921875, 0.0063495635986328125, 0.00997161865234375, 0.013593673706054688, 0.017215728759765625, 0.020837783813476562, 0.0244598388671875, 0.028081893920898438, 0.031703948974609375, 0.03532600402832031, 0.03894805908203125, 0.04257011413574219, 0.046192169189453125, 0.04981422424316406, 0.053436279296875, 0.05705833435058594, 0.060680389404296875, 0.06430244445800781, 0.06792449951171875, 0.07154655456542969, 0.07516860961914062, 0.07879066467285156, 0.0824127197265625, 0.08603477478027344, 0.08965682983398438, 0.09327888488769531, 0.09690093994140625, 0.10052299499511719, 0.10414505004882812, 0.10776710510253906, 0.11138916015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 12.0, 3.0, 12.0, 13.0, 20.0, 21.0, 17.0, 23.0, 42.0, 36.0, 60.0, 67.0, 66.0, 67.0, 87.0, 72.0, 73.0, 50.0, 62.0, 43.0, 30.0, 25.0, 25.0, 21.0, 13.0, 4.0, 5.0, 7.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20238716900348663, -0.19300851225852966, -0.1836298406124115, -0.17425118386745453, -0.16487252712249756, -0.1554938554763794, -0.14611519873142242, -0.13673654198646545, -0.1273578703403473, -0.11797920614480972, -0.10860054939985275, -0.09922188520431519, -0.08984322845935822, -0.08046456426382065, -0.07108590006828308, -0.06170724332332611, -0.05232858657836914, -0.04294992610812187, -0.0335712656378746, -0.024192601442337036, -0.014813940972089767, -0.005435280501842499, 0.003943383693695068, 0.013322040438652039, 0.022700704634189606, 0.032079365104436874, 0.04145802557468414, 0.05083668977022171, 0.06021535024046898, 0.06959401071071625, 0.07897267490625381, 0.08835133165121078, 0.09773001074790955, 0.10710867494344711, 0.11648733168840408, 0.12586599588394165, 0.13524465262889862, 0.1446233093738556, 0.15400198101997375, 0.16338063776493073, 0.1727592945098877, 0.18213795125484467, 0.19151662290096283, 0.2008952796459198, 0.21027393639087677, 0.21965259313583374, 0.2290312647819519, 0.23840992152690887, 0.24778859317302704, 0.257167249917984, 0.2665459215641022, 0.27592456340789795, 0.2853032350540161, 0.2946819067001343, 0.30406057834625244, 0.3134392201900482, 0.3228178918361664, 0.33219656348228455, 0.3415752053260803, 0.3509538769721985, 0.36033254861831665, 0.3697111904621124, 0.3790898621082306, 0.38846850395202637, 0.39784717559814453]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 9.0, 9.0, 4.0, 12.0, 10.0, 18.0, 18.0, 19.0, 25.0, 30.0, 36.0, 30.0, 36.0, 33.0, 35.0, 34.0, 44.0, 40.0, 33.0, 41.0, 44.0, 51.0, 37.0, 32.0, 33.0, 37.0, 39.0, 39.0, 18.0, 19.0, 17.0, 19.0, 18.0, 25.0, 12.0, 13.0, 5.0, 8.0, 11.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2659854292869568, -0.25872915983200073, -0.2514728903770447, -0.24421659111976624, -0.23696032166481018, -0.22970405220985413, -0.22244776785373688, -0.21519148349761963, -0.20793521404266357, -0.20067894458770752, -0.19342266023159027, -0.18616637587547302, -0.17891010642051697, -0.1716538369655609, -0.16439755260944366, -0.15714126825332642, -0.14988499879837036, -0.1426287293434143, -0.13537244498729706, -0.1281161606311798, -0.12085989117622375, -0.1136036142706871, -0.10634733736515045, -0.0990910604596138, -0.09183478355407715, -0.0845785066485405, -0.07732222974300385, -0.0700659528374672, -0.06280967593193054, -0.05555339902639389, -0.04829712212085724, -0.04104084521532059, -0.033784568309783936, -0.026528291404247284, -0.019272014498710632, -0.01201573759317398, -0.004759460687637329, 0.0024968162178993225, 0.009753093123435974, 0.017009370028972626, 0.024265646934509277, 0.03152192384004593, 0.03877820074558258, 0.04603447765111923, 0.053290754556655884, 0.060547031462192535, 0.06780330836772919, 0.07505958527326584, 0.08231586217880249, 0.08957213908433914, 0.0968284159898758, 0.10408469289541245, 0.1113409698009491, 0.11859724670648575, 0.1258535236120224, 0.13310980796813965, 0.1403660774230957, 0.14762234687805176, 0.154878631234169, 0.16213491559028625, 0.1693911850452423, 0.17664745450019836, 0.1839037388563156, 0.19116002321243286, 0.19841629266738892]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 19.0, 18.0, 34.0, 52.0, 90.0, 129.0, 179.0, 304.0, 418.0, 773.0, 1115.0, 1853.0, 3273.0, 5801.0, 11487.0, 28428.0, 114740.0, 574439.0, 229119.0, 43601.0, 15247.0, 7480.0, 3943.0, 2185.0, 1382.0, 866.0, 543.0, 365.0, 225.0, 121.0, 95.0, 71.0, 51.0, 29.0, 20.0, 17.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08251953125, -0.07953834533691406, -0.07655715942382812, -0.07357597351074219, -0.07059478759765625, -0.06761360168457031, -0.06463241577148438, -0.06165122985839844, -0.0586700439453125, -0.05568885803222656, -0.052707672119140625, -0.04972648620605469, -0.04674530029296875, -0.04376411437988281, -0.040782928466796875, -0.03780174255371094, -0.034820556640625, -0.03183937072753906, -0.028858184814453125, -0.025876998901367188, -0.02289581298828125, -0.019914627075195312, -0.016933441162109375, -0.013952255249023438, -0.0109710693359375, -0.007989883422851562, -0.005008697509765625, -0.0020275115966796875, 0.00095367431640625, 0.0039348602294921875, 0.006916046142578125, 0.009897232055664062, 0.01287841796875, 0.015859603881835938, 0.018840789794921875, 0.021821975708007812, 0.02480316162109375, 0.027784347534179688, 0.030765533447265625, 0.03374671936035156, 0.0367279052734375, 0.03970909118652344, 0.042690277099609375, 0.04567146301269531, 0.04865264892578125, 0.05163383483886719, 0.054615020751953125, 0.05759620666503906, 0.060577392578125, 0.06355857849121094, 0.06653976440429688, 0.06952095031738281, 0.07250213623046875, 0.07548332214355469, 0.07846450805664062, 0.08144569396972656, 0.0844268798828125, 0.08740806579589844, 0.09038925170898438, 0.09337043762207031, 0.09635162353515625, 0.09933280944824219, 0.10231399536132812, 0.10529518127441406, 0.1082763671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 14.0, 15.0, 5.0, 5.0, 19.0, 21.0, 22.0, 26.0, 30.0, 35.0, 32.0, 46.0, 43.0, 41.0, 45.0, 41.0, 46.0, 35.0, 40.0, 41.0, 49.0, 41.0, 29.0, 28.0, 43.0, 44.0, 15.0, 22.0, 19.0, 17.0, 19.0, 18.0, 9.0, 13.0, 9.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.19140625, -0.1866168975830078, -0.18182754516601562, -0.17703819274902344, -0.17224884033203125, -0.16745948791503906, -0.16267013549804688, -0.1578807830810547, -0.1530914306640625, -0.1483020782470703, -0.14351272583007812, -0.13872337341308594, -0.13393402099609375, -0.12914466857910156, -0.12435531616210938, -0.11956596374511719, -0.114776611328125, -0.10998725891113281, -0.10519790649414062, -0.10040855407714844, -0.09561920166015625, -0.09082984924316406, -0.08604049682617188, -0.08125114440917969, -0.0764617919921875, -0.07167243957519531, -0.06688308715820312, -0.06209373474121094, -0.05730438232421875, -0.05251502990722656, -0.047725677490234375, -0.04293632507324219, -0.03814697265625, -0.03335762023925781, -0.028568267822265625, -0.023778915405273438, -0.01898956298828125, -0.014200210571289062, -0.009410858154296875, -0.0046215057373046875, 0.0001678466796875, 0.0049571990966796875, 0.009746551513671875, 0.014535903930664062, 0.01932525634765625, 0.024114608764648438, 0.028903961181640625, 0.03369331359863281, 0.038482666015625, 0.04327201843261719, 0.048061370849609375, 0.05285072326660156, 0.05764007568359375, 0.06242942810058594, 0.06721878051757812, 0.07200813293457031, 0.0767974853515625, 0.08158683776855469, 0.08637619018554688, 0.09116554260253906, 0.09595489501953125, 0.10074424743652344, 0.10553359985351562, 0.11032295227050781, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 13.0, 21.0, 22.0, 24.0, 57.0, 99.0, 171.0, 328.0, 565.0, 1197.0, 2599.0, 5967.0, 15438.0, 49752.0, 223505.0, 546030.0, 145001.0, 36168.0, 12377.0, 4911.0, 2184.0, 985.0, 497.0, 262.0, 161.0, 87.0, 47.0, 30.0, 25.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08016490936279297, -0.07768821716308594, -0.0752115249633789, -0.07273483276367188, -0.07025814056396484, -0.06778144836425781, -0.06530475616455078, -0.06282806396484375, -0.06035137176513672, -0.05787467956542969, -0.055397987365722656, -0.052921295166015625, -0.050444602966308594, -0.04796791076660156, -0.04549121856689453, -0.0430145263671875, -0.04053783416748047, -0.03806114196777344, -0.035584449768066406, -0.033107757568359375, -0.030631065368652344, -0.028154373168945312, -0.02567768096923828, -0.02320098876953125, -0.02072429656982422, -0.018247604370117188, -0.015770912170410156, -0.013294219970703125, -0.010817527770996094, -0.008340835571289062, -0.005864143371582031, -0.003387451171875, -0.0009107589721679688, 0.0015659332275390625, 0.004042625427246094, 0.006519317626953125, 0.008996009826660156, 0.011472702026367188, 0.013949394226074219, 0.01642608642578125, 0.01890277862548828, 0.021379470825195312, 0.023856163024902344, 0.026332855224609375, 0.028809547424316406, 0.03128623962402344, 0.03376293182373047, 0.0362396240234375, 0.03871631622314453, 0.04119300842285156, 0.043669700622558594, 0.046146392822265625, 0.048623085021972656, 0.05109977722167969, 0.05357646942138672, 0.05605316162109375, 0.05852985382080078, 0.06100654602050781, 0.06348323822021484, 0.06595993041992188, 0.0684366226196289, 0.07091331481933594, 0.07339000701904297, 0.07586669921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 10.0, 20.0, 22.0, 15.0, 32.0, 45.0, 30.0, 37.0, 35.0, 47.0, 44.0, 48.0, 56.0, 42.0, 54.0, 44.0, 35.0, 47.0, 34.0, 40.0, 31.0, 34.0, 31.0, 19.0, 24.0, 29.0, 10.0, 18.0, 4.0, 7.0, 4.0, 3.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3443489074707031, -0.33225250244140625, -0.3201560974121094, -0.3080596923828125, -0.2959632873535156, -0.28386688232421875, -0.2717704772949219, -0.259674072265625, -0.24757766723632812, -0.23548126220703125, -0.22338485717773438, -0.2112884521484375, -0.19919204711914062, -0.18709564208984375, -0.17499923706054688, -0.16290283203125, -0.15080642700195312, -0.13871002197265625, -0.12661361694335938, -0.1145172119140625, -0.10242080688476562, -0.09032440185546875, -0.07822799682617188, -0.066131591796875, -0.054035186767578125, -0.04193878173828125, -0.029842376708984375, -0.0177459716796875, -0.005649566650390625, 0.00644683837890625, 0.018543243408203125, 0.0306396484375, 0.042736053466796875, 0.05483245849609375, 0.06692886352539062, 0.0790252685546875, 0.09112167358398438, 0.10321807861328125, 0.11531448364257812, 0.127410888671875, 0.13950729370117188, 0.15160369873046875, 0.16370010375976562, 0.1757965087890625, 0.18789291381835938, 0.19998931884765625, 0.21208572387695312, 0.22418212890625, 0.23627853393554688, 0.24837493896484375, 0.2604713439941406, 0.2725677490234375, 0.2846641540527344, 0.29676055908203125, 0.3088569641113281, 0.320953369140625, 0.3330497741699219, 0.34514617919921875, 0.3572425842285156, 0.3693389892578125, 0.3814353942871094, 0.39353179931640625, 0.4056282043457031, 0.417724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 13.0, 16.0, 22.0, 22.0, 30.0, 38.0, 68.0, 129.0, 193.0, 344.0, 568.0, 1093.0, 2389.0, 5629.0, 16717.0, 75272.0, 487436.0, 380813.0, 54924.0, 13451.0, 4867.0, 2117.0, 1002.0, 567.0, 292.0, 180.0, 132.0, 63.0, 54.0, 33.0, 23.0, 13.0, 13.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035400390625, -0.03435659408569336, -0.03331279754638672, -0.03226900100708008, -0.031225204467773438, -0.030181407928466797, -0.029137611389160156, -0.028093814849853516, -0.027050018310546875, -0.026006221771240234, -0.024962425231933594, -0.023918628692626953, -0.022874832153320312, -0.021831035614013672, -0.02078723907470703, -0.01974344253540039, -0.01869964599609375, -0.01765584945678711, -0.01661205291748047, -0.015568256378173828, -0.014524459838867188, -0.013480663299560547, -0.012436866760253906, -0.011393070220947266, -0.010349273681640625, -0.009305477142333984, -0.008261680603027344, -0.007217884063720703, -0.0061740875244140625, -0.005130290985107422, -0.004086494445800781, -0.0030426979064941406, -0.0019989013671875, -0.0009551048278808594, 8.869171142578125e-05, 0.0011324882507324219, 0.0021762847900390625, 0.003220081329345703, 0.004263877868652344, 0.005307674407958984, 0.006351470947265625, 0.007395267486572266, 0.008439064025878906, 0.009482860565185547, 0.010526657104492188, 0.011570453643798828, 0.012614250183105469, 0.01365804672241211, 0.01470184326171875, 0.01574563980102539, 0.01678943634033203, 0.017833232879638672, 0.018877029418945312, 0.019920825958251953, 0.020964622497558594, 0.022008419036865234, 0.023052215576171875, 0.024096012115478516, 0.025139808654785156, 0.026183605194091797, 0.027227401733398438, 0.028271198272705078, 0.02931499481201172, 0.03035879135131836, 0.031402587890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 20.0, 22.0, 35.0, 46.0, 54.0, 106.0, 107.0, 117.0, 113.0, 92.0, 100.0, 53.0, 46.0, 19.0, 11.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1427327990531921e-05, -1.0814517736434937e-05, -1.0201707482337952e-05, -9.588897228240967e-06, -8.976086974143982e-06, -8.363276720046997e-06, -7.750466465950012e-06, -7.137656211853027e-06, -6.5248459577560425e-06, -5.912035703659058e-06, -5.299225449562073e-06, -4.686415195465088e-06, -4.073604941368103e-06, -3.460794687271118e-06, -2.8479844331741333e-06, -2.2351741790771484e-06, -1.6223639249801636e-06, -1.0095536708831787e-06, -3.9674341678619385e-07, 2.1606683731079102e-07, 8.288770914077759e-07, 1.4416873455047607e-06, 2.0544975996017456e-06, 2.6673078536987305e-06, 3.2801181077957153e-06, 3.8929283618927e-06, 4.505738615989685e-06, 5.11854887008667e-06, 5.731359124183655e-06, 6.34416937828064e-06, 6.9569796323776245e-06, 7.569789886474609e-06, 8.182600140571594e-06, 8.795410394668579e-06, 9.408220648765564e-06, 1.0021030902862549e-05, 1.0633841156959534e-05, 1.1246651411056519e-05, 1.1859461665153503e-05, 1.2472271919250488e-05, 1.3085082173347473e-05, 1.3697892427444458e-05, 1.4310702681541443e-05, 1.4923512935638428e-05, 1.5536323189735413e-05, 1.6149133443832397e-05, 1.6761943697929382e-05, 1.7374753952026367e-05, 1.7987564206123352e-05, 1.8600374460220337e-05, 1.9213184714317322e-05, 1.9825994968414307e-05, 2.043880522251129e-05, 2.1051615476608276e-05, 2.166442573070526e-05, 2.2277235984802246e-05, 2.289004623889923e-05, 2.3502856492996216e-05, 2.41156667470932e-05, 2.4728477001190186e-05, 2.534128725528717e-05, 2.5954097509384155e-05, 2.656690776348114e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 19.0, 19.0, 43.0, 44.0, 60.0, 89.0, 105.0, 199.0, 282.0, 348.0, 500.0, 744.0, 1144.0, 1693.0, 2571.0, 4011.0, 6581.0, 11892.0, 22024.0, 45239.0, 98604.0, 201733.0, 274090.0, 190721.0, 92569.0, 42840.0, 21263.0, 11322.0, 6342.0, 3860.0, 2412.0, 1595.0, 1064.0, 667.0, 478.0, 357.0, 262.0, 177.0, 137.0, 109.0, 86.0, 66.0, 38.0, 35.0, 31.0, 17.0, 15.0, 9.0, 6.0, 8.0, 7.0, 1.0, 0.0, 1.0], "bins": [-0.0149078369140625, -0.014448404312133789, -0.013988971710205078, -0.013529539108276367, -0.013070106506347656, -0.012610673904418945, -0.012151241302490234, -0.011691808700561523, -0.011232376098632812, -0.010772943496704102, -0.01031351089477539, -0.00985407829284668, -0.009394645690917969, -0.008935213088989258, -0.008475780487060547, -0.008016347885131836, -0.007556915283203125, -0.007097482681274414, -0.006638050079345703, -0.006178617477416992, -0.005719184875488281, -0.00525975227355957, -0.004800319671630859, -0.0043408870697021484, -0.0038814544677734375, -0.0034220218658447266, -0.0029625892639160156, -0.0025031566619873047, -0.0020437240600585938, -0.0015842914581298828, -0.0011248588562011719, -0.0006654262542724609, -0.00020599365234375, 0.00025343894958496094, 0.0007128715515136719, 0.0011723041534423828, 0.0016317367553710938, 0.0020911693572998047, 0.0025506019592285156, 0.0030100345611572266, 0.0034694671630859375, 0.0039288997650146484, 0.004388332366943359, 0.00484776496887207, 0.005307197570800781, 0.005766630172729492, 0.006226062774658203, 0.006685495376586914, 0.007144927978515625, 0.007604360580444336, 0.008063793182373047, 0.008523225784301758, 0.008982658386230469, 0.00944209098815918, 0.00990152359008789, 0.010360956192016602, 0.010820388793945312, 0.011279821395874023, 0.011739253997802734, 0.012198686599731445, 0.012658119201660156, 0.013117551803588867, 0.013576984405517578, 0.014036417007446289, 0.014495849609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 13.0, 16.0, 16.0, 23.0, 22.0, 39.0, 43.0, 59.0, 57.0, 67.0, 66.0, 67.0, 56.0, 65.0, 64.0, 41.0, 46.0, 35.0, 28.0, 29.0, 20.0, 19.0, 12.0, 9.0, 9.0, 12.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006160736083984375, -0.005951225757598877, -0.005741715431213379, -0.005532205104827881, -0.005322694778442383, -0.005113184452056885, -0.004903674125671387, -0.004694163799285889, -0.004484653472900391, -0.004275143146514893, -0.0040656328201293945, -0.0038561224937438965, -0.0036466121673583984, -0.0034371018409729004, -0.0032275915145874023, -0.0030180811882019043, -0.0028085708618164062, -0.002599060535430908, -0.00238955020904541, -0.002180039882659912, -0.001970529556274414, -0.001761019229888916, -0.001551508903503418, -0.00134199857711792, -0.0011324882507324219, -0.0009229779243469238, -0.0007134675979614258, -0.0005039572715759277, -0.0002944469451904297, -8.493661880493164e-05, 0.0001245737075805664, 0.00033408403396606445, 0.0005435943603515625, 0.0007531046867370605, 0.0009626150131225586, 0.0011721253395080566, 0.0013816356658935547, 0.0015911459922790527, 0.0018006563186645508, 0.002010166645050049, 0.002219676971435547, 0.002429187297821045, 0.002638697624206543, 0.002848207950592041, 0.003057718276977539, 0.003267228603363037, 0.003476738929748535, 0.003686249256134033, 0.0038957595825195312, 0.004105269908905029, 0.004314780235290527, 0.004524290561676025, 0.0047338008880615234, 0.0049433112144470215, 0.0051528215408325195, 0.005362331867218018, 0.005571842193603516, 0.005781352519989014, 0.005990862846374512, 0.00620037317276001, 0.006409883499145508, 0.006619393825531006, 0.006828904151916504, 0.007038414478302002, 0.0072479248046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 15.0, 39.0, 38.0, 34.0, 70.0, 73.0, 80.0, 93.0, 78.0, 96.0, 72.0, 75.0, 50.0, 34.0, 34.0, 20.0, 12.0, 13.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22945018112659454, -0.2225847691297531, -0.21571935713291168, -0.20885394513607025, -0.20198851823806763, -0.1951231062412262, -0.18825769424438477, -0.18139228224754333, -0.1745268702507019, -0.16766145825386047, -0.16079604625701904, -0.1539306342601776, -0.14706522226333618, -0.14019981026649475, -0.13333438336849213, -0.1264689713716507, -0.11960355937480927, -0.11273814737796783, -0.1058727353811264, -0.09900731593370438, -0.09214190393686295, -0.08527649194002151, -0.07841107249259949, -0.07154566049575806, -0.06468024849891663, -0.057814836502075195, -0.050949420779943466, -0.04408400505781174, -0.037218593060970306, -0.030353181064128876, -0.023487765341997147, -0.016622349619865417, -0.00975695252418518, -0.0028915386646986008, 0.003973875194787979, 0.010839289054274559, 0.01770470291376114, 0.02457011491060257, 0.0314355306327343, 0.03830094635486603, 0.04516635835170746, 0.05203177034854889, 0.05889718607068062, 0.06576260179281235, 0.07262801378965378, 0.07949342578649521, 0.08635884523391724, 0.09322425723075867, 0.1000896692276001, 0.10695508122444153, 0.11382049322128296, 0.12068591266870499, 0.12755131721496582, 0.13441672921180725, 0.14128215610980988, 0.1481475681066513, 0.15501298010349274, 0.16187839210033417, 0.1687438040971756, 0.17560921609401703, 0.18247464299201965, 0.18934005498886108, 0.19620546698570251, 0.20307087898254395, 0.20993629097938538]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 18.0, 9.0, 10.0, 10.0, 10.0, 30.0, 34.0, 25.0, 29.0, 36.0, 32.0, 36.0, 36.0, 36.0, 42.0, 37.0, 36.0, 40.0, 47.0, 36.0, 44.0, 36.0, 46.0, 35.0, 38.0, 31.0, 21.0, 17.0, 18.0, 17.0, 28.0, 15.0, 15.0, 8.0, 11.0, 6.0, 3.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16031111776828766, -0.15586137771606445, -0.15141162276268005, -0.14696188271045685, -0.14251214265823364, -0.13806240260601044, -0.13361266255378723, -0.12916290760040283, -0.12471316754817963, -0.12026342749595642, -0.11581367999315262, -0.11136393249034882, -0.10691419243812561, -0.1024644523859024, -0.0980147048830986, -0.0935649573802948, -0.0891152173280716, -0.08466547727584839, -0.08021572977304459, -0.07576598227024078, -0.07131624221801758, -0.06686650216579437, -0.06241675466299057, -0.057967010885477066, -0.05351726710796356, -0.04906752333045006, -0.044617779552936554, -0.04016803577542305, -0.035718291997909546, -0.03126854822039604, -0.026818804442882538, -0.022369060665369034, -0.017919331789016724, -0.01346958801150322, -0.009019844233989716, -0.0045701004564762115, -0.00012035667896270752, 0.0043293870985507965, 0.0087791308760643, 0.013228874653577805, 0.01767861843109131, 0.022128362208604813, 0.026578105986118317, 0.03102784976363182, 0.035477593541145325, 0.03992733731865883, 0.04437708109617233, 0.04882682487368584, 0.05327656865119934, 0.057726312428712845, 0.06217605620622635, 0.06662580370903015, 0.07107554376125336, 0.07552528381347656, 0.07997503131628036, 0.08442477881908417, 0.08887451887130737, 0.09332425892353058, 0.09777400642633438, 0.10222375392913818, 0.10667349398136139, 0.1111232340335846, 0.1155729815363884, 0.1200227290391922, 0.1244724690914154]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 14.0, 14.0, 17.0, 30.0, 37.0, 62.0, 100.0, 154.0, 268.0, 411.0, 744.0, 1389.0, 2810.0, 6139.0, 14752.0, 38698.0, 118393.0, 378727.0, 329570.0, 99067.0, 33253.0, 12937.0, 5363.0, 2515.0, 1335.0, 715.0, 382.0, 244.0, 135.0, 79.0, 50.0, 37.0, 32.0, 25.0, 12.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28386878967285156, -0.2755012512207031, -0.2671337127685547, -0.25876617431640625, -0.2503986358642578, -0.24203109741210938, -0.23366355895996094, -0.2252960205078125, -0.21692848205566406, -0.20856094360351562, -0.2001934051513672, -0.19182586669921875, -0.1834583282470703, -0.17509078979492188, -0.16672325134277344, -0.158355712890625, -0.14998817443847656, -0.14162063598632812, -0.1332530975341797, -0.12488555908203125, -0.11651802062988281, -0.10815048217773438, -0.09978294372558594, -0.0914154052734375, -0.08304786682128906, -0.07468032836914062, -0.06631278991699219, -0.05794525146484375, -0.04957771301269531, -0.041210174560546875, -0.03284263610839844, -0.02447509765625, -0.016107559204101562, -0.007740020751953125, 0.0006275177001953125, 0.00899505615234375, 0.017362594604492188, 0.025730133056640625, 0.03409767150878906, 0.0424652099609375, 0.05083274841308594, 0.059200286865234375, 0.06756782531738281, 0.07593536376953125, 0.08430290222167969, 0.09267044067382812, 0.10103797912597656, 0.109405517578125, 0.11777305603027344, 0.12614059448242188, 0.1345081329345703, 0.14287567138671875, 0.1512432098388672, 0.15961074829101562, 0.16797828674316406, 0.1763458251953125, 0.18471336364746094, 0.19308090209960938, 0.2014484405517578, 0.20981597900390625, 0.2181835174560547, 0.22655105590820312, 0.23491859436035156, 0.2432861328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 12.0, 3.0, 7.0, 13.0, 21.0, 13.0, 21.0, 27.0, 29.0, 27.0, 38.0, 23.0, 32.0, 38.0, 44.0, 40.0, 45.0, 37.0, 39.0, 51.0, 47.0, 37.0, 40.0, 41.0, 39.0, 33.0, 26.0, 32.0, 15.0, 13.0, 17.0, 19.0, 17.0, 10.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2841796875, -0.27631568908691406, -0.2684516906738281, -0.2605876922607422, -0.25272369384765625, -0.2448596954345703, -0.23699569702148438, -0.22913169860839844, -0.2212677001953125, -0.21340370178222656, -0.20553970336914062, -0.1976757049560547, -0.18981170654296875, -0.1819477081298828, -0.17408370971679688, -0.16621971130371094, -0.158355712890625, -0.15049171447753906, -0.14262771606445312, -0.1347637176513672, -0.12689971923828125, -0.11903572082519531, -0.11117172241210938, -0.10330772399902344, -0.0954437255859375, -0.08757972717285156, -0.07971572875976562, -0.07185173034667969, -0.06398773193359375, -0.05612373352050781, -0.048259735107421875, -0.04039573669433594, -0.03253173828125, -0.024667739868164062, -0.016803741455078125, -0.008939743041992188, -0.00107574462890625, 0.0067882537841796875, 0.014652252197265625, 0.022516250610351562, 0.0303802490234375, 0.03824424743652344, 0.046108245849609375, 0.05397224426269531, 0.06183624267578125, 0.06970024108886719, 0.07756423950195312, 0.08542823791503906, 0.093292236328125, 0.10115623474121094, 0.10902023315429688, 0.11688423156738281, 0.12474822998046875, 0.1326122283935547, 0.14047622680664062, 0.14834022521972656, 0.1562042236328125, 0.16406822204589844, 0.17193222045898438, 0.1797962188720703, 0.18766021728515625, 0.1955242156982422, 0.20338821411132812, 0.21125221252441406, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 22.0, 19.0, 31.0, 45.0, 56.0, 82.0, 112.0, 156.0, 246.0, 466.0, 871.0, 1654.0, 3908.0, 10491.0, 30112.0, 97532.0, 342546.0, 389966.0, 114590.0, 35145.0, 11808.0, 4508.0, 1867.0, 879.0, 480.0, 286.0, 173.0, 120.0, 86.0, 68.0, 43.0, 27.0, 31.0, 19.0, 13.0, 18.0, 6.0, 5.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.35302734375, -0.34323883056640625, -0.3334503173828125, -0.32366180419921875, -0.313873291015625, -0.30408477783203125, -0.2942962646484375, -0.28450775146484375, -0.27471923828125, -0.26493072509765625, -0.2551422119140625, -0.24535369873046875, -0.235565185546875, -0.22577667236328125, -0.2159881591796875, -0.20619964599609375, -0.1964111328125, -0.18662261962890625, -0.1768341064453125, -0.16704559326171875, -0.157257080078125, -0.14746856689453125, -0.1376800537109375, -0.12789154052734375, -0.11810302734375, -0.10831451416015625, -0.0985260009765625, -0.08873748779296875, -0.078948974609375, -0.06916046142578125, -0.0593719482421875, -0.04958343505859375, -0.039794921875, -0.03000640869140625, -0.0202178955078125, -0.01042938232421875, -0.000640869140625, 0.00914764404296875, 0.0189361572265625, 0.02872467041015625, 0.03851318359375, 0.04830169677734375, 0.0580902099609375, 0.06787872314453125, 0.077667236328125, 0.08745574951171875, 0.0972442626953125, 0.10703277587890625, 0.1168212890625, 0.12660980224609375, 0.1363983154296875, 0.14618682861328125, 0.155975341796875, 0.16576385498046875, 0.1755523681640625, 0.18534088134765625, 0.19512939453125, 0.20491790771484375, 0.2147064208984375, 0.22449493408203125, 0.234283447265625, 0.24407196044921875, 0.2538604736328125, 0.26364898681640625, 0.2734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 8.0, 7.0, 11.0, 17.0, 15.0, 21.0, 23.0, 23.0, 31.0, 43.0, 37.0, 35.0, 42.0, 49.0, 41.0, 53.0, 41.0, 46.0, 49.0, 40.0, 49.0, 40.0, 38.0, 28.0, 27.0, 24.0, 19.0, 28.0, 19.0, 16.0, 10.0, 10.0, 11.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3027076721191406, -0.29389190673828125, -0.2850761413574219, -0.2762603759765625, -0.2674446105957031, -0.25862884521484375, -0.24981307983398438, -0.240997314453125, -0.23218154907226562, -0.22336578369140625, -0.21455001831054688, -0.2057342529296875, -0.19691848754882812, -0.18810272216796875, -0.17928695678710938, -0.17047119140625, -0.16165542602539062, -0.15283966064453125, -0.14402389526367188, -0.1352081298828125, -0.12639236450195312, -0.11757659912109375, -0.10876083374023438, -0.099945068359375, -0.09112930297851562, -0.08231353759765625, -0.07349777221679688, -0.0646820068359375, -0.055866241455078125, -0.04705047607421875, -0.038234710693359375, -0.0294189453125, -0.020603179931640625, -0.01178741455078125, -0.002971649169921875, 0.0058441162109375, 0.014659881591796875, 0.02347564697265625, 0.032291412353515625, 0.041107177734375, 0.049922943115234375, 0.05873870849609375, 0.06755447387695312, 0.0763702392578125, 0.08518600463867188, 0.09400177001953125, 0.10281753540039062, 0.11163330078125, 0.12044906616210938, 0.12926483154296875, 0.13808059692382812, 0.1468963623046875, 0.15571212768554688, 0.16452789306640625, 0.17334365844726562, 0.182159423828125, 0.19097518920898438, 0.19979095458984375, 0.20860671997070312, 0.2174224853515625, 0.22623825073242188, 0.23505401611328125, 0.24386978149414062, 0.252685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 7.0, 10.0, 22.0, 46.0, 65.0, 127.0, 245.0, 622.0, 1580.0, 5052.0, 24667.0, 224744.0, 690497.0, 83476.0, 12304.0, 3158.0, 1045.0, 445.0, 181.0, 106.0, 51.0, 36.0, 17.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0909423828125, -0.08803653717041016, -0.08513069152832031, -0.08222484588623047, -0.07931900024414062, -0.07641315460205078, -0.07350730895996094, -0.0706014633178711, -0.06769561767578125, -0.0647897720336914, -0.06188392639160156, -0.05897808074951172, -0.056072235107421875, -0.05316638946533203, -0.05026054382324219, -0.047354698181152344, -0.0444488525390625, -0.041543006896972656, -0.03863716125488281, -0.03573131561279297, -0.032825469970703125, -0.02991962432861328, -0.027013778686523438, -0.024107933044433594, -0.02120208740234375, -0.018296241760253906, -0.015390396118164062, -0.012484550476074219, -0.009578704833984375, -0.006672859191894531, -0.0037670135498046875, -0.0008611679077148438, 0.002044677734375, 0.004950523376464844, 0.007856369018554688, 0.010762214660644531, 0.013668060302734375, 0.01657390594482422, 0.019479751586914062, 0.022385597229003906, 0.02529144287109375, 0.028197288513183594, 0.031103134155273438, 0.03400897979736328, 0.036914825439453125, 0.03982067108154297, 0.04272651672363281, 0.045632362365722656, 0.0485382080078125, 0.051444053649902344, 0.05434989929199219, 0.05725574493408203, 0.060161590576171875, 0.06306743621826172, 0.06597328186035156, 0.0688791275024414, 0.07178497314453125, 0.0746908187866211, 0.07759666442871094, 0.08050251007080078, 0.08340835571289062, 0.08631420135498047, 0.08922004699707031, 0.09212589263916016, 0.09503173828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 9.0, 16.0, 12.0, 31.0, 37.0, 54.0, 55.0, 89.0, 84.0, 128.0, 132.0, 79.0, 69.0, 39.0, 45.0, 36.0, 18.0, 16.0, 6.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.404254913330078e-06, -8.063390851020813e-06, -7.722526788711548e-06, -7.381662726402283e-06, -7.040798664093018e-06, -6.6999346017837524e-06, -6.359070539474487e-06, -6.018206477165222e-06, -5.677342414855957e-06, -5.336478352546692e-06, -4.995614290237427e-06, -4.654750227928162e-06, -4.3138861656188965e-06, -3.973022103309631e-06, -3.632158041000366e-06, -3.291293978691101e-06, -2.950429916381836e-06, -2.609565854072571e-06, -2.2687017917633057e-06, -1.9278377294540405e-06, -1.5869736671447754e-06, -1.2461096048355103e-06, -9.052455425262451e-07, -5.6438148021698e-07, -2.2351741790771484e-07, 1.1734664440155029e-07, 4.5821070671081543e-07, 7.990747690200806e-07, 1.1399388313293457e-06, 1.4808028936386108e-06, 1.821666955947876e-06, 2.162531018257141e-06, 2.5033950805664062e-06, 2.8442591428756714e-06, 3.1851232051849365e-06, 3.5259872674942017e-06, 3.866851329803467e-06, 4.207715392112732e-06, 4.548579454421997e-06, 4.889443516731262e-06, 5.230307579040527e-06, 5.5711716413497925e-06, 5.912035703659058e-06, 6.252899765968323e-06, 6.593763828277588e-06, 6.934627890586853e-06, 7.275491952896118e-06, 7.616356015205383e-06, 7.957220077514648e-06, 8.298084139823914e-06, 8.638948202133179e-06, 8.979812264442444e-06, 9.320676326751709e-06, 9.661540389060974e-06, 1.000240445137024e-05, 1.0343268513679504e-05, 1.068413257598877e-05, 1.1024996638298035e-05, 1.13658607006073e-05, 1.1706724762916565e-05, 1.204758882522583e-05, 1.2388452887535095e-05, 1.272931694984436e-05, 1.3070181012153625e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 18.0, 14.0, 27.0, 33.0, 56.0, 61.0, 97.0, 135.0, 191.0, 328.0, 480.0, 814.0, 1340.0, 2402.0, 4478.0, 8968.0, 21609.0, 67303.0, 276748.0, 486810.0, 117863.0, 32819.0, 12601.0, 5998.0, 3001.0, 1646.0, 915.0, 610.0, 382.0, 257.0, 162.0, 109.0, 83.0, 53.0, 36.0, 21.0, 23.0, 12.0, 3.0, 15.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.058563232421875, -0.0566864013671875, -0.0548095703125, -0.0529327392578125, -0.051055908203125, -0.0491790771484375, -0.04730224609375, -0.0454254150390625, -0.043548583984375, -0.0416717529296875, -0.039794921875, -0.0379180908203125, -0.036041259765625, -0.0341644287109375, -0.03228759765625, -0.0304107666015625, -0.028533935546875, -0.0266571044921875, -0.0247802734375, -0.0229034423828125, -0.021026611328125, -0.0191497802734375, -0.01727294921875, -0.0153961181640625, -0.013519287109375, -0.0116424560546875, -0.009765625, -0.0078887939453125, -0.006011962890625, -0.0041351318359375, -0.00225830078125, -0.0003814697265625, 0.001495361328125, 0.0033721923828125, 0.0052490234375, 0.0071258544921875, 0.009002685546875, 0.0108795166015625, 0.01275634765625, 0.0146331787109375, 0.016510009765625, 0.0183868408203125, 0.020263671875, 0.0221405029296875, 0.024017333984375, 0.0258941650390625, 0.02777099609375, 0.0296478271484375, 0.031524658203125, 0.0334014892578125, 0.0352783203125, 0.0371551513671875, 0.039031982421875, 0.0409088134765625, 0.04278564453125, 0.0446624755859375, 0.046539306640625, 0.0484161376953125, 0.05029296875, 0.0521697998046875, 0.054046630859375, 0.0559234619140625, 0.05780029296875, 0.0596771240234375, 0.061553955078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 7.0, 6.0, 4.0, 13.0, 21.0, 18.0, 16.0, 40.0, 65.0, 87.0, 98.0, 186.0, 118.0, 91.0, 77.0, 44.0, 35.0, 20.0, 14.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04608154296875, -0.04462718963623047, -0.04317283630371094, -0.041718482971191406, -0.040264129638671875, -0.038809776306152344, -0.03735542297363281, -0.03590106964111328, -0.03444671630859375, -0.03299236297607422, -0.03153800964355469, -0.030083656311035156, -0.028629302978515625, -0.027174949645996094, -0.025720596313476562, -0.02426624298095703, -0.0228118896484375, -0.02135753631591797, -0.019903182983398438, -0.018448829650878906, -0.016994476318359375, -0.015540122985839844, -0.014085769653320312, -0.012631416320800781, -0.01117706298828125, -0.009722709655761719, -0.008268356323242188, -0.006814002990722656, -0.005359649658203125, -0.0039052963256835938, -0.0024509429931640625, -0.0009965896606445312, 0.000457763671875, 0.0019121170043945312, 0.0033664703369140625, 0.004820823669433594, 0.006275177001953125, 0.007729530334472656, 0.009183883666992188, 0.010638236999511719, 0.01209259033203125, 0.013546943664550781, 0.015001296997070312, 0.016455650329589844, 0.017910003662109375, 0.019364356994628906, 0.020818710327148438, 0.02227306365966797, 0.0237274169921875, 0.02518177032470703, 0.026636123657226562, 0.028090476989746094, 0.029544830322265625, 0.030999183654785156, 0.03245353698730469, 0.03390789031982422, 0.03536224365234375, 0.03681659698486328, 0.03827095031738281, 0.039725303649902344, 0.041179656982421875, 0.042634010314941406, 0.04408836364746094, 0.04554271697998047, 0.0469970703125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 30.0, 44.0, 76.0, 147.0, 185.0, 146.0, 118.0, 82.0, 49.0, 38.0, 25.0, 8.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316740989685059, -0.8072460889816284, -0.7828181385993958, -0.7583901286125183, -0.7339621782302856, -0.7095341682434082, -0.6851061582565308, -0.6606782078742981, -0.6362502574920654, -0.611822247505188, -0.5873942971229553, -0.5629662871360779, -0.5385383367538452, -0.5141103267669678, -0.4896823465824127, -0.46525436639785767, -0.4408263564109802, -0.41639837622642517, -0.3919703960418701, -0.3675423860549927, -0.34311443567276, -0.31868642568588257, -0.2942584455013275, -0.26983046531677246, -0.2454024851322174, -0.22097450494766235, -0.1965465247631073, -0.17211852967739105, -0.147690549492836, -0.12326256930828094, -0.0988345742225647, -0.07440659403800964, -0.049978673458099365, -0.025550689548254013, -0.0011227056384086609, 0.02330528199672699, 0.04773326218128204, 0.0721612423658371, 0.09658923745155334, 0.1210172176361084, 0.14544519782066345, 0.1698731780052185, 0.19430115818977356, 0.2187291532754898, 0.24315713346004486, 0.2675850987434387, 0.29201310873031616, 0.3164410889148712, 0.34086906909942627, 0.3652970492839813, 0.3897250294685364, 0.4141530394554138, 0.4385809898376465, 0.4630089998245239, 0.487436980009079, 0.511864960193634, 0.5362929105758667, 0.5607209205627441, 0.5851488709449768, 0.6095768809318542, 0.6340048313140869, 0.6584328413009644, 0.6828608512878418, 0.7072888016700745, 0.7317168116569519]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 10.0, 19.0, 15.0, 21.0, 13.0, 27.0, 35.0, 34.0, 33.0, 34.0, 48.0, 26.0, 37.0, 30.0, 38.0, 46.0, 35.0, 45.0, 33.0, 35.0, 52.0, 34.0, 37.0, 29.0, 35.0, 27.0, 23.0, 21.0, 16.0, 19.0, 13.0, 15.0, 8.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5037117600440979, -0.4893195927143097, -0.4749274253845215, -0.4605352282524109, -0.4461430609226227, -0.4317508935928345, -0.4173586964607239, -0.40296652913093567, -0.38857436180114746, -0.37418219447135925, -0.35979002714157104, -0.34539783000946045, -0.33100566267967224, -0.31661349534988403, -0.30222129821777344, -0.28782913088798523, -0.273436963558197, -0.2590447962284088, -0.2446526139974594, -0.23026043176651, -0.2158682644367218, -0.2014760971069336, -0.1870839148759842, -0.1726917326450348, -0.15829956531524658, -0.14390739798545837, -0.12951521575450897, -0.11512304097414017, -0.10073086619377136, -0.08633869141340256, -0.07194651663303375, -0.05755434185266495, -0.043162137269973755, -0.02876996248960495, -0.014377787709236145, 1.4387071132659912e-05, 0.014406561851501465, 0.02879873663187027, 0.043190911412239075, 0.05758308619260788, 0.07197526097297668, 0.08636743575334549, 0.1007596105337143, 0.1151517853140831, 0.1295439600944519, 0.1439361274242401, 0.15832830965518951, 0.17272049188613892, 0.18711265921592712, 0.20150482654571533, 0.21589700877666473, 0.23028919100761414, 0.24468135833740234, 0.25907352566719055, 0.27346569299697876, 0.28785789012908936, 0.30225005745887756, 0.31664222478866577, 0.33103442192077637, 0.3454265892505646, 0.3598187565803528, 0.374210923910141, 0.3886030912399292, 0.4029952883720398, 0.417387455701828]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 3.0, 5.0, 9.0, 4.0, 9.0, 5.0, 15.0, 7.0, 17.0, 20.0, 40.0, 39.0, 59.0, 77.0, 118.0, 200.0, 285.0, 493.0, 818.0, 1713.0, 3983.0, 1035941.0, 3355.0, 1388.0, 705.0, 449.0, 257.0, 155.0, 115.0, 72.0, 59.0, 31.0, 32.0, 22.0, 16.0, 15.0, 8.0, 11.0, 11.0, 8.0, 7.0, 5.0, 1.0, 4.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7920936942100525, -0.7683619856834412, -0.7446303367614746, -0.7208986282348633, -0.6971669793128967, -0.6734352707862854, -0.6497036218643188, -0.6259719133377075, -0.6022402048110962, -0.5785084962844849, -0.5547768473625183, -0.531045138835907, -0.5073134899139404, -0.4835817813873291, -0.45985010266304016, -0.4361184239387512, -0.41238677501678467, -0.3886550962924957, -0.3649234175682068, -0.34119170904159546, -0.3174600601196289, -0.2937283515930176, -0.26999667286872864, -0.2462649941444397, -0.22253331542015076, -0.19880163669586182, -0.17506995797157288, -0.15133826434612274, -0.1276065856218338, -0.10387490689754486, -0.08014321327209473, -0.056411534547805786, -0.032679855823516846, -0.008948173373937607, 0.014783509075641632, 0.03851519525051117, 0.06224687397480011, 0.08597855269908905, 0.10971024632453918, 0.13344192504882812, 0.15717360377311707, 0.180905282497406, 0.20463696122169495, 0.22836865484714508, 0.2521003484725952, 0.27583199739456177, 0.2995637059211731, 0.32329538464546204, 0.347027063369751, 0.3707587420940399, 0.39449042081832886, 0.4182221293449402, 0.44195377826690674, 0.46568548679351807, 0.489417165517807, 0.513148844242096, 0.5368804931640625, 0.5606122016906738, 0.5843438506126404, 0.6080755591392517, 0.6318072080612183, 0.6555389165878296, 0.6792706251144409, 0.7030022740364075, 0.7267339825630188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 19.0, 20.0, 31.0, 38.0, 56.0, 93.0, 117.0, 178.0, 259.0, 468.0, 1034.0, 3502.0, 51455756.0, 5920.0, 1232.0, 577.0, 328.0, 216.0, 135.0, 101.0, 62.0, 50.0, 32.0, 28.0, 23.0, 12.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.387202262878418, -10.047842025756836, -9.70848274230957, -9.369122505187988, -9.029762268066406, -8.69040298461914, -8.351042747497559, -8.011682510375977, -7.6723222732543945, -7.332962512969971, -6.993602752685547, -6.654242515563965, -6.314882278442383, -5.975522518157959, -5.636162757873535, -5.296802520751953, -4.957442283630371, -4.618082523345947, -4.278722763061523, -3.9393625259399414, -3.6000025272369385, -3.2606425285339355, -2.9212825298309326, -2.5819225311279297, -2.2425625324249268, -1.9032025337219238, -1.563842535018921, -1.224482536315918, -0.885122537612915, -0.5457625389099121, -0.20640254020690918, 0.13295841217041016, 0.4723184108734131, 0.811678409576416, 1.151038408279419, 1.4903984069824219, 1.8297584056854248, 2.1691184043884277, 2.5084784030914307, 2.8478384017944336, 3.1871984004974365, 3.5265583992004395, 3.8659183979034424, 4.205278396606445, 4.544638633728027, 4.883998394012451, 5.223358154296875, 5.562718391418457, 5.902078628540039, 6.241438388824463, 6.580798149108887, 6.920158386230469, 7.259518623352051, 7.598878383636475, 7.938238143920898, 8.27759838104248, 8.616958618164062, 8.956317901611328, 9.29567813873291, 9.635038375854492, 9.974398612976074, 10.313758850097656, 10.653118133544922, 10.992478370666504]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 16.0, 18.0, 28.0, 42.0, 72.0, 64.0, 115.0, 163.0, 307.0, 431.0, 645.0, 1056.0, 1752.0, 2719.0, 4801.0, 7860.0, 13485.0, 24120.0, 43756.0, 79521.0, 146907.0, 264780.0, 444811.0, 2621232.0, 1655880.0, 421060.0, 248093.0, 137278.0, 74274.0, 40961.0, 22810.0, 12994.0, 7433.0, 4491.0, 2764.0, 1676.0, 1115.0, 692.0, 387.0, 288.0, 184.0, 129.0, 73.0, 54.0, 27.0, 19.0, 18.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7482833862304688, -0.7255706787109375, -0.7028579711914062, -0.680145263671875, -0.6574325561523438, -0.6347198486328125, -0.6120071411132812, -0.58929443359375, -0.5665817260742188, -0.5438690185546875, -0.5211563110351562, -0.498443603515625, -0.47573089599609375, -0.4530181884765625, -0.43030548095703125, -0.4075927734375, -0.38488006591796875, -0.3621673583984375, -0.33945465087890625, -0.316741943359375, -0.29402923583984375, -0.2713165283203125, -0.24860382080078125, -0.22589111328125, -0.20317840576171875, -0.1804656982421875, -0.15775299072265625, -0.135040283203125, -0.11232757568359375, -0.0896148681640625, -0.06690216064453125, -0.044189453125, -0.02147674560546875, 0.0012359619140625, 0.02394866943359375, 0.046661376953125, 0.06937408447265625, 0.0920867919921875, 0.11479949951171875, 0.13751220703125, 0.16022491455078125, 0.1829376220703125, 0.20565032958984375, 0.228363037109375, 0.25107574462890625, 0.2737884521484375, 0.29650115966796875, 0.3192138671875, 0.34192657470703125, 0.3646392822265625, 0.38735198974609375, 0.410064697265625, 0.43277740478515625, 0.4554901123046875, 0.47820281982421875, 0.50091552734375, 0.5236282348632812, 0.5463409423828125, 0.5690536499023438, 0.591766357421875, 0.6144790649414062, 0.6371917724609375, 0.6599044799804688, 0.6826171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 8.0, 12.0, 11.0, 20.0, 14.0, 23.0, 20.0, 15.0, 27.0, 37.0, 49.0, 45.0, 45.0, 50.0, 65.0, 240.0, 805.0, 115.0, 55.0, 46.0, 52.0, 42.0, 36.0, 33.0, 24.0, 22.0, 20.0, 22.0, 14.0, 14.0, 11.0, 5.0, 10.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.4049072265625, -5.247314453125, -5.0897216796875, -4.93212890625, -4.7745361328125, -4.616943359375, -4.4593505859375, -4.3017578125, -4.1441650390625, -3.986572265625, -3.8289794921875, -3.67138671875, -3.5137939453125, -3.356201171875, -3.1986083984375, -3.041015625, -2.8834228515625, -2.725830078125, -2.5682373046875, -2.41064453125, -2.2530517578125, -2.095458984375, -1.9378662109375, -1.7802734375, -1.6226806640625, -1.465087890625, -1.3074951171875, -1.14990234375, -0.9923095703125, -0.834716796875, -0.6771240234375, -0.51953125, -0.3619384765625, -0.204345703125, -0.0467529296875, 0.11083984375, 0.2684326171875, 0.426025390625, 0.5836181640625, 0.7412109375, 0.8988037109375, 1.056396484375, 1.2139892578125, 1.37158203125, 1.5291748046875, 1.686767578125, 1.8443603515625, 2.001953125, 2.1595458984375, 2.317138671875, 2.4747314453125, 2.63232421875, 2.7899169921875, 2.947509765625, 3.1051025390625, 3.2626953125, 3.4202880859375, 3.577880859375, 3.7354736328125, 3.89306640625, 4.0506591796875, 4.208251953125, 4.3658447265625, 4.5234375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 21.0, 41.0, 86.0, 91.0, 174.0, 285.0, 427.0, 683.0, 1020.0, 1738.0, 2672.0, 4442.0, 7084.0, 11442.0, 18563.0, 29475.0, 47676.0, 74988.0, 116299.0, 173113.0, 245073.0, 323822.0, 595413.0, 3293874.0, 398791.0, 297153.0, 220176.0, 152391.0, 100788.0, 64954.0, 41074.0, 25781.0, 15952.0, 9668.0, 6165.0, 3815.0, 2423.0, 1390.0, 916.0, 560.0, 354.0, 225.0, 112.0, 86.0, 47.0, 32.0, 16.0, 12.0, 10.0, 12.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.405517578125, -0.392578125, -0.379638671875, -0.36669921875, -0.353759765625, -0.3408203125, -0.327880859375, -0.31494140625, -0.302001953125, -0.2890625, -0.276123046875, -0.26318359375, -0.250244140625, -0.2373046875, -0.224365234375, -0.21142578125, -0.198486328125, -0.185546875, -0.172607421875, -0.15966796875, -0.146728515625, -0.1337890625, -0.120849609375, -0.10791015625, -0.094970703125, -0.08203125, -0.069091796875, -0.05615234375, -0.043212890625, -0.0302734375, -0.017333984375, -0.00439453125, 0.008544921875, 0.021484375, 0.034423828125, 0.04736328125, 0.060302734375, 0.0732421875, 0.086181640625, 0.09912109375, 0.112060546875, 0.125, 0.137939453125, 0.15087890625, 0.163818359375, 0.1767578125, 0.189697265625, 0.20263671875, 0.215576171875, 0.228515625, 0.241455078125, 0.25439453125, 0.267333984375, 0.2802734375, 0.293212890625, 0.30615234375, 0.319091796875, 0.33203125, 0.344970703125, 0.35791015625, 0.370849609375, 0.3837890625, 0.396728515625, 0.40966796875, 0.422607421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 13.0, 5.0, 14.0, 18.0, 13.0, 17.0, 20.0, 17.0, 20.0, 30.0, 30.0, 29.0, 37.0, 34.0, 41.0, 28.0, 40.0, 75.0, 438.0, 592.0, 73.0, 41.0, 28.0, 26.0, 33.0, 42.0, 20.0, 29.0, 26.0, 14.0, 17.0, 16.0, 23.0, 14.0, 10.0, 12.0, 14.0, 8.0, 4.0, 9.0, 9.0, 7.0, 4.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.076171875, -2.977264404296875, -2.87835693359375, -2.779449462890625, -2.6805419921875, -2.581634521484375, -2.48272705078125, -2.383819580078125, -2.284912109375, -2.186004638671875, -2.08709716796875, -1.988189697265625, -1.8892822265625, -1.790374755859375, -1.69146728515625, -1.592559814453125, -1.49365234375, -1.394744873046875, -1.29583740234375, -1.196929931640625, -1.0980224609375, -0.999114990234375, -0.90020751953125, -0.801300048828125, -0.702392578125, -0.603485107421875, -0.50457763671875, -0.405670166015625, -0.3067626953125, -0.207855224609375, -0.10894775390625, -0.010040283203125, 0.0888671875, 0.187774658203125, 0.28668212890625, 0.385589599609375, 0.4844970703125, 0.583404541015625, 0.68231201171875, 0.781219482421875, 0.880126953125, 0.979034423828125, 1.07794189453125, 1.176849365234375, 1.2757568359375, 1.374664306640625, 1.47357177734375, 1.572479248046875, 1.67138671875, 1.770294189453125, 1.86920166015625, 1.968109130859375, 2.0670166015625, 2.165924072265625, 2.26483154296875, 2.363739013671875, 2.462646484375, 2.561553955078125, 2.66046142578125, 2.759368896484375, 2.8582763671875, 2.957183837890625, 3.05609130859375, 3.154998779296875, 3.25390625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 18.0, 20.0, 25.0, 26.0, 34.0, 47.0, 71.0, 94.0, 113.0, 148.0, 213.0, 319.0, 486.0, 684.0, 931.0, 1494.0, 2473.0, 4143.0, 7615.0, 15149.0, 31358.0, 64539.0, 132790.0, 5544323.0, 298825.0, 93221.0, 45443.0, 21798.0, 10582.0, 5507.0, 3203.0, 1763.0, 1149.0, 774.0, 564.0, 422.0, 287.0, 251.0, 162.0, 114.0, 77.0, 50.0, 42.0, 22.0, 16.0, 12.0, 14.0, 4.0, 6.0, 6.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5313720703125, -1.484619140625, -1.4378662109375, -1.39111328125, -1.3443603515625, -1.297607421875, -1.2508544921875, -1.2041015625, -1.1573486328125, -1.110595703125, -1.0638427734375, -1.01708984375, -0.9703369140625, -0.923583984375, -0.8768310546875, -0.830078125, -0.7833251953125, -0.736572265625, -0.6898193359375, -0.64306640625, -0.5963134765625, -0.549560546875, -0.5028076171875, -0.4560546875, -0.4093017578125, -0.362548828125, -0.3157958984375, -0.26904296875, -0.2222900390625, -0.175537109375, -0.1287841796875, -0.08203125, -0.0352783203125, 0.011474609375, 0.0582275390625, 0.10498046875, 0.1517333984375, 0.198486328125, 0.2452392578125, 0.2919921875, 0.3387451171875, 0.385498046875, 0.4322509765625, 0.47900390625, 0.5257568359375, 0.572509765625, 0.6192626953125, 0.666015625, 0.7127685546875, 0.759521484375, 0.8062744140625, 0.85302734375, 0.8997802734375, 0.946533203125, 0.9932861328125, 1.0400390625, 1.0867919921875, 1.133544921875, 1.1802978515625, 1.22705078125, 1.2738037109375, 1.320556640625, 1.3673095703125, 1.4140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 16.0, 6.0, 8.0, 11.0, 26.0, 13.0, 36.0, 28.0, 25.0, 25.0, 30.0, 29.0, 49.0, 45.0, 49.0, 44.0, 340.0, 750.0, 69.0, 38.0, 40.0, 33.0, 47.0, 36.0, 31.0, 27.0, 24.0, 27.0, 18.0, 13.0, 15.0, 18.0, 9.0, 6.0, 6.0, 6.0, 4.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.06884765625, -3.9462890625, -3.82373046875, -3.701171875, -3.57861328125, -3.4560546875, -3.33349609375, -3.2109375, -3.08837890625, -2.9658203125, -2.84326171875, -2.720703125, -2.59814453125, -2.4755859375, -2.35302734375, -2.23046875, -2.10791015625, -1.9853515625, -1.86279296875, -1.740234375, -1.61767578125, -1.4951171875, -1.37255859375, -1.25, -1.12744140625, -1.0048828125, -0.88232421875, -0.759765625, -0.63720703125, -0.5146484375, -0.39208984375, -0.26953125, -0.14697265625, -0.0244140625, 0.09814453125, 0.220703125, 0.34326171875, 0.4658203125, 0.58837890625, 0.7109375, 0.83349609375, 0.9560546875, 1.07861328125, 1.201171875, 1.32373046875, 1.4462890625, 1.56884765625, 1.69140625, 1.81396484375, 1.9365234375, 2.05908203125, 2.181640625, 2.30419921875, 2.4267578125, 2.54931640625, 2.671875, 2.79443359375, 2.9169921875, 3.03955078125, 3.162109375, 3.28466796875, 3.4072265625, 3.52978515625, 3.65234375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 25.0, 35.0, 75.0, 162.0, 245.0, 216.0, 105.0, 47.0, 22.0, 21.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.026805877685547, -18.461204528808594, -17.89560317993164, -17.330001831054688, -16.764400482177734, -16.198801040649414, -15.633199691772461, -15.067598342895508, -14.501996994018555, -13.936395645141602, -13.370794296264648, -12.805193901062012, -12.239592552185059, -11.673991203308105, -11.108390808105469, -10.542789459228516, -9.977188110351562, -9.41158676147461, -8.845985412597656, -8.28038501739502, -7.714783668518066, -7.149182319641113, -6.583581447601318, -6.017980575561523, -5.45237922668457, -4.886777877807617, -4.321177005767822, -3.7555758953094482, -3.189974784851074, -2.6243736743927, -2.058772563934326, -1.4931714534759521, -0.9275722503662109, -0.3619711399078369, 0.2036299705505371, 0.7692310810089111, 1.3348321914672852, 1.9004333019256592, 2.466034412384033, 3.0316355228424072, 3.5972366333007812, 4.162837982177734, 4.728438854217529, 5.294039726257324, 5.859641075134277, 6.4252424240112305, 6.990843296051025, 7.55644416809082, 8.122045516967773, 8.687646865844727, 9.25324821472168, 9.818848609924316, 10.38444995880127, 10.950051307678223, 11.51565170288086, 12.081253051757812, 12.646854400634766, 13.212455749511719, 13.778057098388672, 14.343657493591309, 14.909258842468262, 15.474860191345215, 16.04046058654785, 16.606061935424805, 17.171663284301758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 10.0, 13.0, 9.0, 16.0, 17.0, 18.0, 33.0, 28.0, 29.0, 53.0, 51.0, 44.0, 55.0, 62.0, 67.0, 53.0, 53.0, 45.0, 44.0, 39.0, 42.0, 21.0, 37.0, 26.0, 18.0, 9.0, 14.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-12.745399475097656, -12.375323295593262, -12.005248069763184, -11.635171890258789, -11.265096664428711, -10.895020484924316, -10.524944305419922, -10.154869079589844, -9.784793853759766, -9.414717674255371, -9.044642448425293, -8.674566268920898, -8.30449104309082, -7.934414863586426, -7.5643391609191895, -7.194263458251953, -6.824187278747559, -6.454111576080322, -6.084035873413086, -5.713959693908691, -5.343884468078613, -4.973808288574219, -4.603732585906982, -4.233656883239746, -3.8635811805725098, -3.4935054779052734, -3.123429775238037, -2.7533538341522217, -2.3832781314849854, -2.013202428817749, -1.6431264877319336, -1.2730507850646973, -0.9029760360717773, -0.5329002737998962, -0.16282451152801514, 0.20725131034851074, 0.5773270130157471, 0.9474027156829834, 1.3174786567687988, 1.6875543594360352, 2.0576300621032715, 2.427705764770508, 2.797781467437744, 3.1678574085235596, 3.537933111190796, 3.9080088138580322, 4.278084754943848, 4.648160457611084, 5.01823616027832, 5.388311862945557, 5.758387565612793, 6.1284637451171875, 6.498538970947266, 6.86861515045166, 7.2386908531188965, 7.608766555786133, 7.978842258453369, 8.348917961120605, 8.718994140625, 9.089069366455078, 9.459145545959473, 9.82922077178955, 10.199296951293945, 10.569372177124023, 10.939448356628418]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 10.0, 8.0, 14.0, 37.0, 35.0, 52.0, 80.0, 90.0, 108.0, 193.0, 299.0, 434.0, 817.0, 1475.0, 2877.0, 6527.0, 16773.0, 73269.0, 3966963.0, 90873.0, 18738.0, 6967.0, 3383.0, 1743.0, 950.0, 543.0, 333.0, 199.0, 137.0, 94.0, 60.0, 43.0, 34.0, 23.0, 18.0, 12.0, 11.0, 9.0, 3.0, 9.0, 6.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15917396545410156, -0.15428543090820312, -0.1493968963623047, -0.14450836181640625, -0.1396198272705078, -0.13473129272460938, -0.12984275817871094, -0.1249542236328125, -0.12006568908691406, -0.11517715454101562, -0.11028861999511719, -0.10540008544921875, -0.10051155090332031, -0.09562301635742188, -0.09073448181152344, -0.085845947265625, -0.08095741271972656, -0.07606887817382812, -0.07118034362792969, -0.06629180908203125, -0.06140327453613281, -0.056514739990234375, -0.05162620544433594, -0.0467376708984375, -0.04184913635253906, -0.036960601806640625, -0.03207206726074219, -0.02718353271484375, -0.022294998168945312, -0.017406463623046875, -0.012517929077148438, -0.00762939453125, -0.0027408599853515625, 0.002147674560546875, 0.0070362091064453125, 0.01192474365234375, 0.016813278198242188, 0.021701812744140625, 0.026590347290039062, 0.0314788818359375, 0.03636741638183594, 0.041255950927734375, 0.04614448547363281, 0.05103302001953125, 0.05592155456542969, 0.060810089111328125, 0.06569862365722656, 0.070587158203125, 0.07547569274902344, 0.08036422729492188, 0.08525276184082031, 0.09014129638671875, 0.09502983093261719, 0.09991836547851562, 0.10480690002441406, 0.1096954345703125, 0.11458396911621094, 0.11947250366210938, 0.12436103820800781, 0.12924957275390625, 0.1341381072998047, 0.13902664184570312, 0.14391517639160156, 0.1488037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 31.0, 51.0, 182.0, 465.0, 56.0, 28.0, 14.0, 13.0, 10.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.046575069427490234, -0.04520702362060547, -0.0438389778137207, -0.04247093200683594, -0.04110288619995117, -0.039734840393066406, -0.03836679458618164, -0.036998748779296875, -0.03563070297241211, -0.034262657165527344, -0.03289461135864258, -0.03152656555175781, -0.030158519744873047, -0.02879047393798828, -0.027422428131103516, -0.02605438232421875, -0.024686336517333984, -0.02331829071044922, -0.021950244903564453, -0.020582199096679688, -0.019214153289794922, -0.017846107482910156, -0.01647806167602539, -0.015110015869140625, -0.01374197006225586, -0.012373924255371094, -0.011005878448486328, -0.009637832641601562, -0.008269786834716797, -0.006901741027832031, -0.005533695220947266, -0.0041656494140625, -0.0027976036071777344, -0.0014295578002929688, -6.151199340820312e-05, 0.0013065338134765625, 0.002674579620361328, 0.004042625427246094, 0.005410671234130859, 0.006778717041015625, 0.00814676284790039, 0.009514808654785156, 0.010882854461669922, 0.012250900268554688, 0.013618946075439453, 0.014986991882324219, 0.016355037689208984, 0.01772308349609375, 0.019091129302978516, 0.02045917510986328, 0.021827220916748047, 0.023195266723632812, 0.024563312530517578, 0.025931358337402344, 0.02729940414428711, 0.028667449951171875, 0.03003549575805664, 0.031403541564941406, 0.03277158737182617, 0.03413963317871094, 0.0355076789855957, 0.03687572479248047, 0.038243770599365234, 0.03961181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 3.0, 12.0, 14.0, 20.0, 34.0, 40.0, 54.0, 96.0, 156.0, 345.0, 787.0, 1811.0, 4880.0, 14697.0, 54042.0, 287101.0, 3206417.0, 514418.0, 78126.0, 20336.0, 6503.0, 2361.0, 973.0, 435.0, 228.0, 136.0, 65.0, 51.0, 31.0, 29.0, 16.0, 12.0, 8.0, 10.0, 6.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09147453308105469, -0.08803939819335938, -0.08460426330566406, -0.08116912841796875, -0.07773399353027344, -0.07429885864257812, -0.07086372375488281, -0.0674285888671875, -0.06399345397949219, -0.060558319091796875, -0.05712318420410156, -0.05368804931640625, -0.05025291442871094, -0.046817779541015625, -0.04338264465332031, -0.039947509765625, -0.03651237487792969, -0.033077239990234375, -0.029642105102539062, -0.02620697021484375, -0.022771835327148438, -0.019336700439453125, -0.015901565551757812, -0.0124664306640625, -0.009031295776367188, -0.005596160888671875, -0.0021610260009765625, 0.00127410888671875, 0.0047092437744140625, 0.008144378662109375, 0.011579513549804688, 0.0150146484375, 0.018449783325195312, 0.021884918212890625, 0.025320053100585938, 0.02875518798828125, 0.03219032287597656, 0.035625457763671875, 0.03906059265136719, 0.0424957275390625, 0.04593086242675781, 0.049365997314453125, 0.05280113220214844, 0.05623626708984375, 0.05967140197753906, 0.06310653686523438, 0.06654167175292969, 0.069976806640625, 0.07341194152832031, 0.07684707641601562, 0.08028221130371094, 0.08371734619140625, 0.08715248107910156, 0.09058761596679688, 0.09402275085449219, 0.0974578857421875, 0.10089302062988281, 0.10432815551757812, 0.10776329040527344, 0.11119842529296875, 0.11463356018066406, 0.11806869506835938, 0.12150382995605469, 0.12493896484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 13.0, 13.0, 11.0, 17.0, 16.0, 23.0, 34.0, 43.0, 50.0, 65.0, 81.0, 110.0, 183.0, 265.0, 599.0, 1066.0, 551.0, 281.0, 174.0, 111.0, 80.0, 55.0, 48.0, 36.0, 20.0, 25.0, 24.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030140399932861328, -0.029000282287597656, -0.027860164642333984, -0.026720046997070312, -0.02557992935180664, -0.02443981170654297, -0.023299694061279297, -0.022159576416015625, -0.021019458770751953, -0.01987934112548828, -0.01873922348022461, -0.017599105834960938, -0.016458988189697266, -0.015318870544433594, -0.014178752899169922, -0.01303863525390625, -0.011898517608642578, -0.010758399963378906, -0.009618282318115234, -0.008478164672851562, -0.007338047027587891, -0.006197929382324219, -0.005057811737060547, -0.003917694091796875, -0.002777576446533203, -0.0016374588012695312, -0.0004973411560058594, 0.0006427764892578125, 0.0017828941345214844, 0.0029230117797851562, 0.004063129425048828, 0.0052032470703125, 0.006343364715576172, 0.007483482360839844, 0.008623600006103516, 0.009763717651367188, 0.01090383529663086, 0.012043952941894531, 0.013184070587158203, 0.014324188232421875, 0.015464305877685547, 0.01660442352294922, 0.01774454116821289, 0.018884658813476562, 0.020024776458740234, 0.021164894104003906, 0.022305011749267578, 0.02344512939453125, 0.024585247039794922, 0.025725364685058594, 0.026865482330322266, 0.028005599975585938, 0.02914571762084961, 0.03028583526611328, 0.03142595291137695, 0.032566070556640625, 0.0337061882019043, 0.03484630584716797, 0.03598642349243164, 0.03712654113769531, 0.038266658782958984, 0.039406776428222656, 0.04054689407348633, 0.04168701171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 12.0, 28.0, 64.0, 149.0, 243.0, 254.0, 140.0, 60.0, 23.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22374887764453888, -0.21200014650821686, -0.20025141537189484, -0.18850268423557281, -0.1767539530992508, -0.16500522196292877, -0.15325647592544556, -0.14150774478912354, -0.1297590136528015, -0.11801028251647949, -0.10626155138015747, -0.09451282024383545, -0.08276408910751343, -0.0710153579711914, -0.05926661938428879, -0.047517888247966766, -0.03576916456222534, -0.02402043342590332, -0.01227170042693615, -0.0005229674279689789, 0.011225763708353043, 0.022974494844675064, 0.034723229706287384, 0.046471960842609406, 0.05822069197893143, 0.06996942311525345, 0.08171815425157547, 0.09346689283847809, 0.10521562397480011, 0.11696435511112213, 0.12871308624744415, 0.14046181738376617, 0.1522105634212494, 0.1639592945575714, 0.17570802569389343, 0.18745675683021545, 0.19920548796653748, 0.2109542191028595, 0.22270295023918152, 0.23445168137550354, 0.24620041251182556, 0.2579491436481476, 0.2696978747844696, 0.2814466059207916, 0.29319533705711365, 0.30494406819343567, 0.3166927993297577, 0.3284415304660797, 0.3401902914047241, 0.35193902254104614, 0.36368775367736816, 0.3754364848136902, 0.3871852159500122, 0.39893394708633423, 0.41068267822265625, 0.42243140935897827, 0.4341801404953003, 0.4459288716316223, 0.45767760276794434, 0.46942633390426636, 0.4811750650405884, 0.4929237961769104, 0.5046725273132324, 0.5164212584495544, 0.5281699895858765]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 9.0, 12.0, 14.0, 15.0, 20.0, 25.0, 35.0, 44.0, 39.0, 51.0, 51.0, 74.0, 64.0, 71.0, 71.0, 71.0, 56.0, 62.0, 32.0, 32.0, 22.0, 29.0, 19.0, 24.0, 9.0, 8.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17424196004867554, -0.16807514429092407, -0.1619083285331726, -0.15574151277542114, -0.14957469701766968, -0.14340786635875702, -0.13724105060100555, -0.1310742348432541, -0.12490741908550262, -0.11874060332775116, -0.1125737875699997, -0.10640696436166763, -0.10024014860391617, -0.0940733328461647, -0.08790650963783264, -0.08173969388008118, -0.07557287812232971, -0.06940606236457825, -0.06323924660682678, -0.05707242339849472, -0.050905607640743256, -0.04473879188299179, -0.03857197239995003, -0.032405152916908264, -0.0262383371591568, -0.020071519538760185, -0.013904701918363571, -0.007737884297966957, -0.001571066677570343, 0.004595750942826271, 0.010762568563222885, 0.01692938804626465, 0.023096203804016113, 0.029263021424412727, 0.03542983904480934, 0.041596658527851105, 0.04776347428560257, 0.053930290043354034, 0.0600971095263958, 0.06626392900943756, 0.07243074476718903, 0.07859756052494049, 0.08476437628269196, 0.09093119949102402, 0.09709801524877548, 0.10326483100652695, 0.10943165421485901, 0.11559846997261047, 0.12176528573036194, 0.1279321014881134, 0.13409891724586487, 0.14026573300361633, 0.1464325487613678, 0.15259937942028046, 0.15876619517803192, 0.1649330109357834, 0.17109982669353485, 0.17726664245128632, 0.18343345820903778, 0.18960027396678925, 0.1957671046257019, 0.20193392038345337, 0.20810073614120483, 0.2142675518989563, 0.22043436765670776]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 1.0, 6.0, 6.0, 13.0, 19.0, 34.0, 39.0, 54.0, 84.0, 128.0, 168.0, 206.0, 307.0, 426.0, 551.0, 837.0, 1209.0, 1629.0, 2324.0, 3583.0, 5382.0, 8550.0, 14316.0, 26646.0, 71387.0, 762478.0, 79506.0, 28038.0, 14664.0, 8820.0, 5510.0, 3593.0, 2429.0, 1660.0, 1107.0, 795.0, 551.0, 393.0, 308.0, 244.0, 167.0, 118.0, 90.0, 66.0, 28.0, 30.0, 24.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.10035037994384766, -0.09706306457519531, -0.09377574920654297, -0.09048843383789062, -0.08720111846923828, -0.08391380310058594, -0.0806264877319336, -0.07733917236328125, -0.0740518569946289, -0.07076454162597656, -0.06747722625732422, -0.06418991088867188, -0.06090259552001953, -0.05761528015136719, -0.054327964782714844, -0.0510406494140625, -0.047753334045410156, -0.04446601867675781, -0.04117870330810547, -0.037891387939453125, -0.03460407257080078, -0.03131675720214844, -0.028029441833496094, -0.02474212646484375, -0.021454811096191406, -0.018167495727539062, -0.014880180358886719, -0.011592864990234375, -0.008305549621582031, -0.0050182342529296875, -0.0017309188842773438, 0.001556396484375, 0.004843711853027344, 0.008131027221679688, 0.011418342590332031, 0.014705657958984375, 0.01799297332763672, 0.021280288696289062, 0.024567604064941406, 0.02785491943359375, 0.031142234802246094, 0.03442955017089844, 0.03771686553955078, 0.041004180908203125, 0.04429149627685547, 0.04757881164550781, 0.050866127014160156, 0.0541534423828125, 0.057440757751464844, 0.06072807312011719, 0.06401538848876953, 0.06730270385742188, 0.07059001922607422, 0.07387733459472656, 0.0771646499633789, 0.08045196533203125, 0.0837392807006836, 0.08702659606933594, 0.09031391143798828, 0.09360122680664062, 0.09688854217529297, 0.10017585754394531, 0.10346317291259766, 0.10675048828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 5.0, 9.0, 9.0, 6.0, 6.0, 6.0, 7.0, 17.0, 24.0, 27.0, 80.0, 361.0, 249.0, 52.0, 32.0, 15.0, 14.0, 11.0, 7.0, 8.0, 9.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.044189453125, -0.04288339614868164, -0.04157733917236328, -0.04027128219604492, -0.03896522521972656, -0.0376591682434082, -0.036353111267089844, -0.035047054290771484, -0.033740997314453125, -0.032434940338134766, -0.031128883361816406, -0.029822826385498047, -0.028516769409179688, -0.027210712432861328, -0.02590465545654297, -0.02459859848022461, -0.02329254150390625, -0.02198648452758789, -0.02068042755126953, -0.019374370574951172, -0.018068313598632812, -0.016762256622314453, -0.015456199645996094, -0.014150142669677734, -0.012844085693359375, -0.011538028717041016, -0.010231971740722656, -0.008925914764404297, -0.0076198577880859375, -0.006313800811767578, -0.005007743835449219, -0.0037016868591308594, -0.0023956298828125, -0.0010895729064941406, 0.00021648406982421875, 0.0015225410461425781, 0.0028285980224609375, 0.004134654998779297, 0.005440711975097656, 0.006746768951416016, 0.008052825927734375, 0.009358882904052734, 0.010664939880371094, 0.011970996856689453, 0.013277053833007812, 0.014583110809326172, 0.01588916778564453, 0.01719522476196289, 0.01850128173828125, 0.01980733871459961, 0.02111339569091797, 0.022419452667236328, 0.023725509643554688, 0.025031566619873047, 0.026337623596191406, 0.027643680572509766, 0.028949737548828125, 0.030255794525146484, 0.031561851501464844, 0.0328679084777832, 0.03417396545410156, 0.03548002243041992, 0.03678607940673828, 0.03809213638305664, 0.039398193359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 12.0, 10.0, 13.0, 12.0, 19.0, 13.0, 30.0, 49.0, 70.0, 80.0, 127.0, 196.0, 349.0, 654.0, 1382.0, 3186.0, 8582.0, 26079.0, 99762.0, 436684.0, 356226.0, 79939.0, 22210.0, 7318.0, 2765.0, 1207.0, 621.0, 330.0, 175.0, 130.0, 83.0, 49.0, 41.0, 38.0, 18.0, 16.0, 24.0, 17.0, 7.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10247802734375, -0.09916400909423828, -0.09584999084472656, -0.09253597259521484, -0.08922195434570312, -0.0859079360961914, -0.08259391784667969, -0.07927989959716797, -0.07596588134765625, -0.07265186309814453, -0.06933784484863281, -0.0660238265991211, -0.06270980834960938, -0.059395790100097656, -0.05608177185058594, -0.05276775360107422, -0.0494537353515625, -0.04613971710205078, -0.04282569885253906, -0.039511680603027344, -0.036197662353515625, -0.032883644104003906, -0.029569625854492188, -0.02625560760498047, -0.02294158935546875, -0.01962757110595703, -0.016313552856445312, -0.012999534606933594, -0.009685516357421875, -0.006371498107910156, -0.0030574798583984375, 0.00025653839111328125, 0.003570556640625, 0.006884574890136719, 0.010198593139648438, 0.013512611389160156, 0.016826629638671875, 0.020140647888183594, 0.023454666137695312, 0.02676868438720703, 0.03008270263671875, 0.03339672088623047, 0.03671073913574219, 0.040024757385253906, 0.043338775634765625, 0.046652793884277344, 0.04996681213378906, 0.05328083038330078, 0.0565948486328125, 0.05990886688232422, 0.06322288513183594, 0.06653690338134766, 0.06985092163085938, 0.0731649398803711, 0.07647895812988281, 0.07979297637939453, 0.08310699462890625, 0.08642101287841797, 0.08973503112792969, 0.0930490493774414, 0.09636306762695312, 0.09967708587646484, 0.10299110412597656, 0.10630512237548828, 0.109619140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 10.0, 12.0, 9.0, 6.0, 9.0, 16.0, 16.0, 18.0, 24.0, 23.0, 26.0, 38.0, 36.0, 33.0, 39.0, 33.0, 31.0, 28.0, 56.0, 42.0, 38.0, 42.0, 35.0, 42.0, 32.0, 36.0, 40.0, 31.0, 25.0, 24.0, 32.0, 19.0, 13.0, 7.0, 9.0, 16.0, 17.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.123260498046875, -0.11920166015625, -0.115142822265625, -0.111083984375, -0.107025146484375, -0.10296630859375, -0.098907470703125, -0.0948486328125, -0.090789794921875, -0.08673095703125, -0.082672119140625, -0.07861328125, -0.074554443359375, -0.07049560546875, -0.066436767578125, -0.0623779296875, -0.058319091796875, -0.05426025390625, -0.050201416015625, -0.046142578125, -0.042083740234375, -0.03802490234375, -0.033966064453125, -0.0299072265625, -0.025848388671875, -0.02178955078125, -0.017730712890625, -0.013671875, -0.009613037109375, -0.00555419921875, -0.001495361328125, 0.0025634765625, 0.006622314453125, 0.01068115234375, 0.014739990234375, 0.018798828125, 0.022857666015625, 0.02691650390625, 0.030975341796875, 0.0350341796875, 0.039093017578125, 0.04315185546875, 0.047210693359375, 0.05126953125, 0.055328369140625, 0.05938720703125, 0.063446044921875, 0.0675048828125, 0.071563720703125, 0.07562255859375, 0.079681396484375, 0.083740234375, 0.087799072265625, 0.09185791015625, 0.095916748046875, 0.0999755859375, 0.104034423828125, 0.10809326171875, 0.112152099609375, 0.1162109375, 0.120269775390625, 0.12432861328125, 0.128387451171875, 0.1324462890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 15.0, 15.0, 31.0, 65.0, 98.0, 127.0, 259.0, 562.0, 1232.0, 3442.0, 12675.0, 82478.0, 732303.0, 185716.0, 21056.0, 5267.0, 1663.0, 717.0, 350.0, 187.0, 97.0, 62.0, 41.0, 22.0, 19.0, 7.0, 12.0, 5.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09105682373046875, -0.0881805419921875, -0.08530426025390625, -0.082427978515625, -0.07955169677734375, -0.0766754150390625, -0.07379913330078125, -0.0709228515625, -0.06804656982421875, -0.0651702880859375, -0.06229400634765625, -0.059417724609375, -0.05654144287109375, -0.0536651611328125, -0.05078887939453125, -0.04791259765625, -0.04503631591796875, -0.0421600341796875, -0.03928375244140625, -0.036407470703125, -0.03353118896484375, -0.0306549072265625, -0.02777862548828125, -0.02490234375, -0.02202606201171875, -0.0191497802734375, -0.01627349853515625, -0.013397216796875, -0.01052093505859375, -0.0076446533203125, -0.00476837158203125, -0.00189208984375, 0.00098419189453125, 0.0038604736328125, 0.00673675537109375, 0.009613037109375, 0.01248931884765625, 0.0153656005859375, 0.01824188232421875, 0.0211181640625, 0.02399444580078125, 0.0268707275390625, 0.02974700927734375, 0.032623291015625, 0.03549957275390625, 0.0383758544921875, 0.04125213623046875, 0.04412841796875, 0.04700469970703125, 0.0498809814453125, 0.05275726318359375, 0.055633544921875, 0.05850982666015625, 0.0613861083984375, 0.06426239013671875, 0.067138671875, 0.07001495361328125, 0.0728912353515625, 0.07576751708984375, 0.078643798828125, 0.08152008056640625, 0.0843963623046875, 0.08727264404296875, 0.09014892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 5.0, 5.0, 5.0, 7.0, 10.0, 12.0, 16.0, 20.0, 34.0, 30.0, 28.0, 42.0, 59.0, 57.0, 83.0, 74.0, 58.0, 57.0, 49.0, 66.0, 38.0, 36.0, 41.0, 23.0, 38.0, 30.0, 15.0, 12.0, 9.0, 21.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2278556823730469e-05, -1.176539808511734e-05, -1.1252239346504211e-05, -1.0739080607891083e-05, -1.0225921869277954e-05, -9.712763130664825e-06, -9.199604392051697e-06, -8.686445653438568e-06, -8.17328691482544e-06, -7.66012817621231e-06, -7.146969437599182e-06, -6.6338106989860535e-06, -6.120651960372925e-06, -5.607493221759796e-06, -5.0943344831466675e-06, -4.581175744533539e-06, -4.06801700592041e-06, -3.5548582673072815e-06, -3.041699528694153e-06, -2.528540790081024e-06, -2.0153820514678955e-06, -1.5022233128547668e-06, -9.890645742416382e-07, -4.759058356285095e-07, 3.725290298461914e-08, 5.504116415977478e-07, 1.0635703802108765e-06, 1.5767291188240051e-06, 2.089887857437134e-06, 2.6030465960502625e-06, 3.116205334663391e-06, 3.6293640732765198e-06, 4.1425228118896484e-06, 4.655681550502777e-06, 5.168840289115906e-06, 5.6819990277290344e-06, 6.195157766342163e-06, 6.708316504955292e-06, 7.22147524356842e-06, 7.734633982181549e-06, 8.247792720794678e-06, 8.760951459407806e-06, 9.274110198020935e-06, 9.787268936634064e-06, 1.0300427675247192e-05, 1.0813586413860321e-05, 1.132674515247345e-05, 1.1839903891086578e-05, 1.2353062629699707e-05, 1.2866221368312836e-05, 1.3379380106925964e-05, 1.3892538845539093e-05, 1.4405697584152222e-05, 1.491885632276535e-05, 1.543201506137848e-05, 1.5945173799991608e-05, 1.6458332538604736e-05, 1.6971491277217865e-05, 1.7484650015830994e-05, 1.7997808754444122e-05, 1.851096749305725e-05, 1.902412623167038e-05, 1.9537284970283508e-05, 2.0050443708896637e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 9.0, 25.0, 30.0, 54.0, 107.0, 199.0, 473.0, 1163.0, 3959.0, 18313.0, 170356.0, 750991.0, 86571.0, 11769.0, 2834.0, 902.0, 377.0, 177.0, 90.0, 51.0, 23.0, 24.0, 10.0, 17.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0916748046875, -0.08832550048828125, -0.0849761962890625, -0.08162689208984375, -0.078277587890625, -0.07492828369140625, -0.0715789794921875, -0.06822967529296875, -0.06488037109375, -0.06153106689453125, -0.0581817626953125, -0.05483245849609375, -0.051483154296875, -0.04813385009765625, -0.0447845458984375, -0.04143524169921875, -0.0380859375, -0.03473663330078125, -0.0313873291015625, -0.02803802490234375, -0.024688720703125, -0.02133941650390625, -0.0179901123046875, -0.01464080810546875, -0.01129150390625, -0.00794219970703125, -0.0045928955078125, -0.00124359130859375, 0.002105712890625, 0.00545501708984375, 0.0088043212890625, 0.01215362548828125, 0.0155029296875, 0.01885223388671875, 0.0222015380859375, 0.02555084228515625, 0.028900146484375, 0.03224945068359375, 0.0355987548828125, 0.03894805908203125, 0.04229736328125, 0.04564666748046875, 0.0489959716796875, 0.05234527587890625, 0.055694580078125, 0.05904388427734375, 0.0623931884765625, 0.06574249267578125, 0.069091796875, 0.07244110107421875, 0.0757904052734375, 0.07913970947265625, 0.082489013671875, 0.08583831787109375, 0.0891876220703125, 0.09253692626953125, 0.09588623046875, 0.09923553466796875, 0.1025848388671875, 0.10593414306640625, 0.109283447265625, 0.11263275146484375, 0.1159820556640625, 0.11933135986328125, 0.1226806640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 8.0, 12.0, 19.0, 23.0, 35.0, 42.0, 75.0, 85.0, 130.0, 101.0, 127.0, 97.0, 75.0, 51.0, 34.0, 30.0, 20.0, 12.0, 7.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.0688161849975586, -0.06591606140136719, -0.06301593780517578, -0.060115814208984375, -0.05721569061279297, -0.05431556701660156, -0.051415443420410156, -0.04851531982421875, -0.045615196228027344, -0.04271507263183594, -0.03981494903564453, -0.036914825439453125, -0.03401470184326172, -0.031114578247070312, -0.028214454650878906, -0.0253143310546875, -0.022414207458496094, -0.019514083862304688, -0.01661396026611328, -0.013713836669921875, -0.010813713073730469, -0.007913589477539062, -0.005013465881347656, -0.00211334228515625, 0.0007867813110351562, 0.0036869049072265625, 0.006587028503417969, 0.009487152099609375, 0.012387275695800781, 0.015287399291992188, 0.018187522888183594, 0.021087646484375, 0.023987770080566406, 0.026887893676757812, 0.02978801727294922, 0.032688140869140625, 0.03558826446533203, 0.03848838806152344, 0.041388511657714844, 0.04428863525390625, 0.047188758850097656, 0.05008888244628906, 0.05298900604248047, 0.055889129638671875, 0.05878925323486328, 0.06168937683105469, 0.0645895004272461, 0.0674896240234375, 0.0703897476196289, 0.07328987121582031, 0.07618999481201172, 0.07909011840820312, 0.08199024200439453, 0.08489036560058594, 0.08779048919677734, 0.09069061279296875, 0.09359073638916016, 0.09649085998535156, 0.09939098358154297, 0.10229110717773438, 0.10519123077392578, 0.10809135437011719, 0.1109914779663086, 0.1138916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 25.0, 47.0, 133.0, 276.0, 282.0, 119.0, 50.0, 29.0, 12.0, 6.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1231088638305664, -1.076072335243225, -1.0290359258651733, -0.981999397277832, -0.9349629878997803, -0.887926459312439, -0.8408899903297424, -0.7938535213470459, -0.7468170523643494, -0.6997805833816528, -0.6527441143989563, -0.6057076454162598, -0.5586711168289185, -0.5116347074508667, -0.4645981788635254, -0.41756170988082886, -0.3705252408981323, -0.3234887719154358, -0.27645230293273926, -0.22941580414772034, -0.1823793351650238, -0.13534286618232727, -0.08830636739730835, -0.041269898414611816, 0.005766570568084717, 0.05280304700136185, 0.09983952343463898, 0.1468760073184967, 0.19391247630119324, 0.24094894528388977, 0.2879854440689087, 0.3350219130516052, 0.3820585012435913, 0.42909497022628784, 0.4761314392089844, 0.5231679677963257, 0.5702043771743774, 0.6172409057617188, 0.6642773747444153, 0.7113138437271118, 0.7583503127098083, 0.8053867816925049, 0.8524232506752014, 0.899459719657898, 0.9464962482452393, 0.993532657623291, 1.0405691862106323, 1.0876057147979736, 1.1346421241760254, 1.1816786527633667, 1.2287150621414185, 1.2757515907287598, 1.3227880001068115, 1.3698245286941528, 1.4168610572814941, 1.463897466659546, 1.5109338760375977, 1.557970404624939, 1.6050068140029907, 1.652043342590332, 1.6990797519683838, 1.746116280555725, 1.7931528091430664, 1.8401892185211182, 1.8872257471084595]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 8.0, 15.0, 19.0, 40.0, 53.0, 90.0, 138.0, 170.0, 134.0, 92.0, 71.0, 39.0, 30.0, 10.0, 13.0, 8.0, 5.0, 10.0, 6.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0380027294158936, -2.9527106285095215, -2.8674187660217285, -2.7821266651153564, -2.6968345642089844, -2.6115427017211914, -2.5262506008148193, -2.4409584999084473, -2.3556666374206543, -2.2703745365142822, -2.1850826740264893, -2.099790573120117, -2.014498472213745, -1.9292064905166626, -1.84391450881958, -1.758622407913208, -1.673330307006836, -1.5880383253097534, -1.5027462244033813, -1.4174542427062988, -1.3321621417999268, -1.2468701601028442, -1.1615781784057617, -1.0762860774993896, -0.9909940958023071, -0.9057020545005798, -0.8204100131988525, -0.73511803150177, -0.6498259902000427, -0.5645339488983154, -0.4792419672012329, -0.3939499258995056, -0.3086576461791992, -0.22336561977863312, -0.13807359337806702, -0.05278158187866211, 0.032510459423065186, 0.11780250072479248, 0.203094482421875, 0.2883865237236023, 0.3736785650253296, 0.4589706063270569, 0.5442626476287842, 0.6295546293258667, 0.714846670627594, 0.8001387119293213, 0.8854306936264038, 0.9707227349281311, 1.0560147762298584, 1.141306757926941, 1.226598858833313, 1.3118908405303955, 1.3971829414367676, 1.48247492313385, 1.5677669048309326, 1.6530590057373047, 1.7383509874343872, 1.8236429691314697, 1.9089350700378418, 1.9942270517349243, 2.079519033432007, 2.164811134338379, 2.250102996826172, 2.335395097732544, 2.420687198638916]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 11.0, 13.0, 15.0, 31.0, 47.0, 72.0, 99.0, 149.0, 236.0, 320.0, 562.0, 861.0, 1440.0, 2470.0, 4775.0, 10208.0, 26285.0, 122434.0, 3879397.0, 101224.0, 23233.0, 9252.0, 4484.0, 2476.0, 1462.0, 889.0, 587.0, 380.0, 248.0, 178.0, 118.0, 99.0, 63.0, 43.0, 26.0, 27.0, 23.0, 11.0, 8.0, 12.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.322265625, -0.31317901611328125, -0.3040924072265625, -0.29500579833984375, -0.285919189453125, -0.27683258056640625, -0.2677459716796875, -0.25865936279296875, -0.24957275390625, -0.24048614501953125, -0.2313995361328125, -0.22231292724609375, -0.213226318359375, -0.20413970947265625, -0.1950531005859375, -0.18596649169921875, -0.1768798828125, -0.16779327392578125, -0.1587066650390625, -0.14962005615234375, -0.140533447265625, -0.13144683837890625, -0.1223602294921875, -0.11327362060546875, -0.10418701171875, -0.09510040283203125, -0.0860137939453125, -0.07692718505859375, -0.067840576171875, -0.05875396728515625, -0.0496673583984375, -0.04058074951171875, -0.031494140625, -0.02240753173828125, -0.0133209228515625, -0.00423431396484375, 0.004852294921875, 0.01393890380859375, 0.0230255126953125, 0.03211212158203125, 0.04119873046875, 0.05028533935546875, 0.0593719482421875, 0.06845855712890625, 0.077545166015625, 0.08663177490234375, 0.0957183837890625, 0.10480499267578125, 0.1138916015625, 0.12297821044921875, 0.1320648193359375, 0.14115142822265625, 0.150238037109375, 0.15932464599609375, 0.1684112548828125, 0.17749786376953125, 0.18658447265625, 0.19567108154296875, 0.2047576904296875, 0.21384429931640625, 0.222930908203125, 0.23201751708984375, 0.2411041259765625, 0.25019073486328125, 0.25927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 2.0, 11.0, 8.0, 11.0, 13.0, 16.0, 27.0, 54.0, 101.0, 209.0, 242.0, 112.0, 55.0, 20.0, 15.0, 8.0, 13.0, 8.0, 5.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.036008358001708984, -0.03484630584716797, -0.03368425369262695, -0.03252220153808594, -0.03136014938354492, -0.030198097229003906, -0.02903604507446289, -0.027873992919921875, -0.02671194076538086, -0.025549888610839844, -0.024387836456298828, -0.023225784301757812, -0.022063732147216797, -0.02090167999267578, -0.019739627838134766, -0.01857757568359375, -0.017415523529052734, -0.01625347137451172, -0.015091419219970703, -0.013929367065429688, -0.012767314910888672, -0.011605262756347656, -0.01044321060180664, -0.009281158447265625, -0.00811910629272461, -0.006957054138183594, -0.005795001983642578, -0.0046329498291015625, -0.003470897674560547, -0.0023088455200195312, -0.0011467933654785156, 1.52587890625e-05, 0.0011773109436035156, 0.0023393630981445312, 0.003501415252685547, 0.0046634674072265625, 0.005825519561767578, 0.006987571716308594, 0.00814962387084961, 0.009311676025390625, 0.01047372817993164, 0.011635780334472656, 0.012797832489013672, 0.013959884643554688, 0.015121936798095703, 0.01628398895263672, 0.017446041107177734, 0.01860809326171875, 0.019770145416259766, 0.02093219757080078, 0.022094249725341797, 0.023256301879882812, 0.024418354034423828, 0.025580406188964844, 0.02674245834350586, 0.027904510498046875, 0.02906656265258789, 0.030228614807128906, 0.03139066696166992, 0.03255271911621094, 0.03371477127075195, 0.03487682342529297, 0.036038875579833984, 0.037200927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 14.0, 23.0, 41.0, 50.0, 72.0, 148.0, 271.0, 591.0, 1369.0, 3744.0, 12517.0, 55023.0, 572250.0, 3386271.0, 128856.0, 22979.0, 6105.0, 2153.0, 908.0, 402.0, 190.0, 105.0, 68.0, 39.0, 28.0, 15.0, 8.0, 10.0, 5.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2549896240234375, -0.246551513671875, -0.2381134033203125, -0.22967529296875, -0.2212371826171875, -0.212799072265625, -0.2043609619140625, -0.1959228515625, -0.1874847412109375, -0.179046630859375, -0.1706085205078125, -0.16217041015625, -0.1537322998046875, -0.145294189453125, -0.1368560791015625, -0.12841796875, -0.1199798583984375, -0.111541748046875, -0.1031036376953125, -0.09466552734375, -0.0862274169921875, -0.077789306640625, -0.0693511962890625, -0.0609130859375, -0.0524749755859375, -0.044036865234375, -0.0355987548828125, -0.02716064453125, -0.0187225341796875, -0.010284423828125, -0.0018463134765625, 0.006591796875, 0.0150299072265625, 0.023468017578125, 0.0319061279296875, 0.04034423828125, 0.0487823486328125, 0.057220458984375, 0.0656585693359375, 0.0740966796875, 0.0825347900390625, 0.090972900390625, 0.0994110107421875, 0.10784912109375, 0.1162872314453125, 0.124725341796875, 0.1331634521484375, 0.1416015625, 0.1500396728515625, 0.158477783203125, 0.1669158935546875, 0.17535400390625, 0.1837921142578125, 0.192230224609375, 0.2006683349609375, 0.2091064453125, 0.2175445556640625, 0.225982666015625, 0.2344207763671875, 0.24285888671875, 0.2512969970703125, 0.259735107421875, 0.2681732177734375, 0.276611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 9.0, 7.0, 13.0, 11.0, 15.0, 16.0, 24.0, 39.0, 67.0, 106.0, 138.0, 251.0, 541.0, 1639.0, 468.0, 231.0, 146.0, 97.0, 64.0, 46.0, 34.0, 17.0, 12.0, 11.0, 14.0, 7.0, 9.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.038083553314208984, -0.03682994842529297, -0.03557634353637695, -0.03432273864746094, -0.03306913375854492, -0.031815528869628906, -0.03056192398071289, -0.029308319091796875, -0.02805471420288086, -0.026801109313964844, -0.025547504425048828, -0.024293899536132812, -0.023040294647216797, -0.02178668975830078, -0.020533084869384766, -0.01927947998046875, -0.018025875091552734, -0.01677227020263672, -0.015518665313720703, -0.014265060424804688, -0.013011455535888672, -0.011757850646972656, -0.01050424575805664, -0.009250640869140625, -0.00799703598022461, -0.006743431091308594, -0.005489826202392578, -0.0042362213134765625, -0.002982616424560547, -0.0017290115356445312, -0.0004754066467285156, 0.0007781982421875, 0.0020318031311035156, 0.0032854080200195312, 0.004539012908935547, 0.0057926177978515625, 0.007046222686767578, 0.008299827575683594, 0.00955343246459961, 0.010807037353515625, 0.01206064224243164, 0.013314247131347656, 0.014567852020263672, 0.015821456909179688, 0.017075061798095703, 0.01832866668701172, 0.019582271575927734, 0.02083587646484375, 0.022089481353759766, 0.02334308624267578, 0.024596691131591797, 0.025850296020507812, 0.027103900909423828, 0.028357505798339844, 0.02961111068725586, 0.030864715576171875, 0.03211832046508789, 0.033371925354003906, 0.03462553024291992, 0.03587913513183594, 0.03713274002075195, 0.03838634490966797, 0.039639949798583984, 0.0408935546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 92.0, 442.0, 353.0, 74.0, 15.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2886160910129547, -0.2639516294002533, -0.23928715288639069, -0.21462269127368927, -0.18995821475982666, -0.16529375314712524, -0.14062929153442383, -0.11596481502056122, -0.0913003534078598, -0.06663588434457779, -0.041971419006586075, -0.01730695366859436, 0.007357515394687653, 0.032021984457969666, 0.05668644607067108, 0.08135092258453369, 0.10601538419723511, 0.13067984580993652, 0.15534432232379913, 0.18000878393650055, 0.20467326045036316, 0.22933772206306458, 0.254002183675766, 0.2786666750907898, 0.3033311367034912, 0.3279955983161926, 0.35266005992889404, 0.37732452154159546, 0.40198901295661926, 0.4266534745693207, 0.4513179361820221, 0.4759824275970459, 0.5006468892097473, 0.5253113508224487, 0.5499758124351501, 0.5746402740478516, 0.599304735660553, 0.6239691972732544, 0.6486337184906006, 0.673298180103302, 0.6979626417160034, 0.7226271033287048, 0.7472915649414062, 0.7719560265541077, 0.7966204881668091, 0.8212850093841553, 0.8459494113922119, 0.8706139326095581, 0.8952783346176147, 0.9199427962303162, 0.9446072578430176, 0.969271719455719, 0.9939361810684204, 1.0186007022857666, 1.0432651042938232, 1.0679296255111694, 1.0925941467285156, 1.1172586679458618, 1.1419230699539185, 1.1665875911712646, 1.1912519931793213, 1.2159165143966675, 1.2405809164047241, 1.2652454376220703, 1.289909839630127]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 19.0, 21.0, 35.0, 38.0, 49.0, 47.0, 46.0, 57.0, 60.0, 68.0, 56.0, 57.0, 59.0, 63.0, 45.0, 37.0, 30.0, 36.0, 18.0, 17.0, 10.0, 13.0, 13.0, 8.0, 5.0, 5.0, 10.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.23094552755355835, -0.22420775890350342, -0.21747000515460968, -0.21073223650455475, -0.203994482755661, -0.19725671410560608, -0.19051894545555115, -0.1837811917066574, -0.17704343795776367, -0.17030566930770874, -0.163567915558815, -0.15683014690876007, -0.15009239315986633, -0.1433546245098114, -0.13661685585975647, -0.12987910211086273, -0.1231413334608078, -0.11640357226133347, -0.10966581106185913, -0.1029280424118042, -0.09619028866291046, -0.08945252001285553, -0.0827147588133812, -0.07597699761390686, -0.06923923641443253, -0.06250147521495819, -0.055763714015483856, -0.04902594909071922, -0.04228818789124489, -0.035550426691770554, -0.02881266176700592, -0.022074900567531586, -0.015337139368057251, -0.008599377237260342, -0.0018616151064634323, 0.004876147955656052, 0.011613909155130386, 0.01835167035460472, 0.025089435279369354, 0.03182719647884369, 0.038564957678318024, 0.04530271887779236, 0.05204048007726669, 0.058778245002031326, 0.06551600992679596, 0.0722537636756897, 0.07899153232574463, 0.08572929352521896, 0.0924670547246933, 0.09920481592416763, 0.10594257712364197, 0.1126803457736969, 0.11941809952259064, 0.12615586817264557, 0.1328936219215393, 0.13963139057159424, 0.14636915922164917, 0.1531069278717041, 0.15984468162059784, 0.16658245027065277, 0.1733202040195465, 0.18005797266960144, 0.18679574131965637, 0.1935334950685501, 0.20027124881744385]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 12.0, 26.0, 20.0, 40.0, 53.0, 83.0, 101.0, 149.0, 222.0, 357.0, 505.0, 864.0, 1349.0, 2219.0, 3747.0, 7230.0, 15584.0, 39957.0, 244889.0, 621690.0, 66505.0, 21328.0, 9589.0, 4915.0, 2768.0, 1570.0, 933.0, 588.0, 396.0, 258.0, 170.0, 136.0, 85.0, 55.0, 45.0, 28.0, 15.0, 16.0, 17.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.222412109375, -0.21626663208007812, -0.21012115478515625, -0.20397567749023438, -0.1978302001953125, -0.19168472290039062, -0.18553924560546875, -0.17939376831054688, -0.173248291015625, -0.16710281372070312, -0.16095733642578125, -0.15481185913085938, -0.1486663818359375, -0.14252090454101562, -0.13637542724609375, -0.13022994995117188, -0.12408447265625, -0.11793899536132812, -0.11179351806640625, -0.10564804077148438, -0.0995025634765625, -0.09335708618164062, -0.08721160888671875, -0.08106613159179688, -0.074920654296875, -0.06877517700195312, -0.06262969970703125, -0.056484222412109375, -0.0503387451171875, -0.044193267822265625, -0.03804779052734375, -0.031902313232421875, -0.0257568359375, -0.019611358642578125, -0.01346588134765625, -0.007320404052734375, -0.0011749267578125, 0.004970550537109375, 0.01111602783203125, 0.017261505126953125, 0.023406982421875, 0.029552459716796875, 0.03569793701171875, 0.041843414306640625, 0.0479888916015625, 0.054134368896484375, 0.06027984619140625, 0.06642532348632812, 0.07257080078125, 0.07871627807617188, 0.08486175537109375, 0.09100723266601562, 0.0971527099609375, 0.10329818725585938, 0.10944366455078125, 0.11558914184570312, 0.121734619140625, 0.12788009643554688, 0.13402557373046875, 0.14017105102539062, 0.1463165283203125, 0.15246200561523438, 0.15860748291015625, 0.16475296020507812, 0.1708984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 3.0, 14.0, 12.0, 10.0, 19.0, 25.0, 44.0, 85.0, 152.0, 216.0, 152.0, 92.0, 51.0, 26.0, 18.0, 13.0, 11.0, 9.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03662109375, -0.03542137145996094, -0.034221649169921875, -0.03302192687988281, -0.03182220458984375, -0.030622482299804688, -0.029422760009765625, -0.028223037719726562, -0.0270233154296875, -0.025823593139648438, -0.024623870849609375, -0.023424148559570312, -0.02222442626953125, -0.021024703979492188, -0.019824981689453125, -0.018625259399414062, -0.017425537109375, -0.016225814819335938, -0.015026092529296875, -0.013826370239257812, -0.01262664794921875, -0.011426925659179688, -0.010227203369140625, -0.009027481079101562, -0.0078277587890625, -0.0066280364990234375, -0.005428314208984375, -0.0042285919189453125, -0.00302886962890625, -0.0018291473388671875, -0.000629425048828125, 0.0005702972412109375, 0.00177001953125, 0.0029697418212890625, 0.004169464111328125, 0.0053691864013671875, 0.00656890869140625, 0.0077686309814453125, 0.008968353271484375, 0.010168075561523438, 0.0113677978515625, 0.012567520141601562, 0.013767242431640625, 0.014966964721679688, 0.01616668701171875, 0.017366409301757812, 0.018566131591796875, 0.019765853881835938, 0.020965576171875, 0.022165298461914062, 0.023365020751953125, 0.024564743041992188, 0.02576446533203125, 0.026964187622070312, 0.028163909912109375, 0.029363632202148438, 0.0305633544921875, 0.03176307678222656, 0.032962799072265625, 0.03416252136230469, 0.03536224365234375, 0.03656196594238281, 0.037761688232421875, 0.03896141052246094, 0.0401611328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 13.0, 8.0, 8.0, 19.0, 25.0, 48.0, 52.0, 87.0, 138.0, 244.0, 357.0, 637.0, 1200.0, 2476.0, 5943.0, 15279.0, 46885.0, 185956.0, 521220.0, 194403.0, 47503.0, 15079.0, 5696.0, 2447.0, 1198.0, 655.0, 317.0, 215.0, 152.0, 78.0, 55.0, 42.0, 36.0, 22.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12062358856201172, -0.11679649353027344, -0.11296939849853516, -0.10914230346679688, -0.1053152084350586, -0.10148811340332031, -0.09766101837158203, -0.09383392333984375, -0.09000682830810547, -0.08617973327636719, -0.0823526382446289, -0.07852554321289062, -0.07469844818115234, -0.07087135314941406, -0.06704425811767578, -0.0632171630859375, -0.05939006805419922, -0.05556297302246094, -0.051735877990722656, -0.047908782958984375, -0.044081687927246094, -0.04025459289550781, -0.03642749786376953, -0.03260040283203125, -0.02877330780029297, -0.024946212768554688, -0.021119117736816406, -0.017292022705078125, -0.013464927673339844, -0.009637832641601562, -0.005810737609863281, -0.001983642578125, 0.0018434524536132812, 0.0056705474853515625, 0.009497642517089844, 0.013324737548828125, 0.017151832580566406, 0.020978927612304688, 0.02480602264404297, 0.02863311767578125, 0.03246021270751953, 0.03628730773925781, 0.040114402770996094, 0.043941497802734375, 0.047768592834472656, 0.05159568786621094, 0.05542278289794922, 0.0592498779296875, 0.06307697296142578, 0.06690406799316406, 0.07073116302490234, 0.07455825805664062, 0.0783853530883789, 0.08221244812011719, 0.08603954315185547, 0.08986663818359375, 0.09369373321533203, 0.09752082824707031, 0.1013479232788086, 0.10517501831054688, 0.10900211334228516, 0.11282920837402344, 0.11665630340576172, 0.1204833984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 26.0, 20.0, 29.0, 27.0, 21.0, 31.0, 43.0, 25.0, 52.0, 48.0, 49.0, 38.0, 43.0, 44.0, 56.0, 49.0, 41.0, 27.0, 42.0, 31.0, 29.0, 26.0, 25.0, 24.0, 18.0, 10.0, 8.0, 11.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0965576171875, -0.09331607818603516, -0.09007453918457031, -0.08683300018310547, -0.08359146118164062, -0.08034992218017578, -0.07710838317871094, -0.0738668441772461, -0.07062530517578125, -0.0673837661743164, -0.06414222717285156, -0.06090068817138672, -0.057659149169921875, -0.05441761016845703, -0.05117607116699219, -0.047934532165527344, -0.0446929931640625, -0.041451454162597656, -0.03820991516113281, -0.03496837615966797, -0.031726837158203125, -0.02848529815673828, -0.025243759155273438, -0.022002220153808594, -0.01876068115234375, -0.015519142150878906, -0.012277603149414062, -0.009036064147949219, -0.005794525146484375, -0.0025529861450195312, 0.0006885528564453125, 0.003930091857910156, 0.007171630859375, 0.010413169860839844, 0.013654708862304688, 0.01689624786376953, 0.020137786865234375, 0.02337932586669922, 0.026620864868164062, 0.029862403869628906, 0.03310394287109375, 0.036345481872558594, 0.03958702087402344, 0.04282855987548828, 0.046070098876953125, 0.04931163787841797, 0.05255317687988281, 0.055794715881347656, 0.0590362548828125, 0.062277793884277344, 0.06551933288574219, 0.06876087188720703, 0.07200241088867188, 0.07524394989013672, 0.07848548889160156, 0.0817270278930664, 0.08496856689453125, 0.0882101058959961, 0.09145164489746094, 0.09469318389892578, 0.09793472290039062, 0.10117626190185547, 0.10441780090332031, 0.10765933990478516, 0.11090087890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 16.0, 15.0, 26.0, 41.0, 59.0, 95.0, 117.0, 184.0, 333.0, 660.0, 1173.0, 2511.0, 6280.0, 20072.0, 97445.0, 564946.0, 290576.0, 44609.0, 11459.0, 3992.0, 1817.0, 861.0, 477.0, 277.0, 176.0, 101.0, 70.0, 47.0, 31.0, 21.0, 15.0, 10.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1287059783935547, -0.12423324584960938, -0.11976051330566406, -0.11528778076171875, -0.11081504821777344, -0.10634231567382812, -0.10186958312988281, -0.0973968505859375, -0.09292411804199219, -0.08845138549804688, -0.08397865295410156, -0.07950592041015625, -0.07503318786621094, -0.07056045532226562, -0.06608772277832031, -0.061614990234375, -0.05714225769042969, -0.052669525146484375, -0.04819679260253906, -0.04372406005859375, -0.03925132751464844, -0.034778594970703125, -0.030305862426757812, -0.0258331298828125, -0.021360397338867188, -0.016887664794921875, -0.012414932250976562, -0.00794219970703125, -0.0034694671630859375, 0.001003265380859375, 0.0054759979248046875, 0.00994873046875, 0.014421463012695312, 0.018894195556640625, 0.023366928100585938, 0.02783966064453125, 0.03231239318847656, 0.036785125732421875, 0.04125785827636719, 0.0457305908203125, 0.05020332336425781, 0.054676055908203125, 0.05914878845214844, 0.06362152099609375, 0.06809425354003906, 0.07256698608398438, 0.07703971862792969, 0.081512451171875, 0.08598518371582031, 0.09045791625976562, 0.09493064880371094, 0.09940338134765625, 0.10387611389160156, 0.10834884643554688, 0.11282157897949219, 0.1172943115234375, 0.12176704406738281, 0.12623977661132812, 0.13071250915527344, 0.13518524169921875, 0.13965797424316406, 0.14413070678710938, 0.1486034393310547, 0.153076171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 3.0, 11.0, 25.0, 23.0, 32.0, 40.0, 47.0, 67.0, 84.0, 88.0, 107.0, 107.0, 92.0, 59.0, 60.0, 54.0, 23.0, 28.0, 22.0, 10.0, 9.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.7663463950157166e-05, -1.6611069440841675e-05, -1.5558674931526184e-05, -1.4506280422210693e-05, -1.3453885912895203e-05, -1.2401491403579712e-05, -1.1349096894264221e-05, -1.029670238494873e-05, -9.24430787563324e-06, -8.191913366317749e-06, -7.139518857002258e-06, -6.087124347686768e-06, -5.034729838371277e-06, -3.982335329055786e-06, -2.9299408197402954e-06, -1.8775463104248047e-06, -8.25151801109314e-07, 2.2724270820617676e-07, 1.2796372175216675e-06, 2.332031726837158e-06, 3.384426236152649e-06, 4.43682074546814e-06, 5.48921525478363e-06, 6.541609764099121e-06, 7.594004273414612e-06, 8.646398782730103e-06, 9.698793292045593e-06, 1.0751187801361084e-05, 1.1803582310676575e-05, 1.2855976819992065e-05, 1.3908371329307556e-05, 1.4960765838623047e-05, 1.6013160347938538e-05, 1.706555485725403e-05, 1.811794936656952e-05, 1.917034387588501e-05, 2.02227383852005e-05, 2.127513289451599e-05, 2.2327527403831482e-05, 2.3379921913146973e-05, 2.4432316422462463e-05, 2.5484710931777954e-05, 2.6537105441093445e-05, 2.7589499950408936e-05, 2.8641894459724426e-05, 2.9694288969039917e-05, 3.074668347835541e-05, 3.17990779876709e-05, 3.285147249698639e-05, 3.390386700630188e-05, 3.495626151561737e-05, 3.600865602493286e-05, 3.706105053424835e-05, 3.811344504356384e-05, 3.9165839552879333e-05, 4.0218234062194824e-05, 4.1270628571510315e-05, 4.2323023080825806e-05, 4.3375417590141296e-05, 4.442781209945679e-05, 4.548020660877228e-05, 4.653260111808777e-05, 4.758499562740326e-05, 4.863739013671875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 32.0, 46.0, 61.0, 78.0, 142.0, 230.0, 353.0, 630.0, 1141.0, 2224.0, 4822.0, 11893.0, 36418.0, 153478.0, 509231.0, 245839.0, 54062.0, 16008.0, 5989.0, 2661.0, 1324.0, 704.0, 399.0, 256.0, 135.0, 93.0, 69.0, 48.0, 31.0, 25.0, 10.0, 21.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.1171875, -0.11380577087402344, -0.11042404174804688, -0.10704231262207031, -0.10366058349609375, -0.10027885437011719, -0.09689712524414062, -0.09351539611816406, -0.0901336669921875, -0.08675193786621094, -0.08337020874023438, -0.07998847961425781, -0.07660675048828125, -0.07322502136230469, -0.06984329223632812, -0.06646156311035156, -0.063079833984375, -0.05969810485839844, -0.056316375732421875, -0.05293464660644531, -0.04955291748046875, -0.04617118835449219, -0.042789459228515625, -0.03940773010253906, -0.0360260009765625, -0.03264427185058594, -0.029262542724609375, -0.025880813598632812, -0.02249908447265625, -0.019117355346679688, -0.015735626220703125, -0.012353897094726562, -0.00897216796875, -0.0055904388427734375, -0.002208709716796875, 0.0011730194091796875, 0.00455474853515625, 0.007936477661132812, 0.011318206787109375, 0.014699935913085938, 0.0180816650390625, 0.021463394165039062, 0.024845123291015625, 0.028226852416992188, 0.03160858154296875, 0.03499031066894531, 0.038372039794921875, 0.04175376892089844, 0.045135498046875, 0.04851722717285156, 0.051898956298828125, 0.05528068542480469, 0.05866241455078125, 0.06204414367675781, 0.06542587280273438, 0.06880760192871094, 0.0721893310546875, 0.07557106018066406, 0.07895278930664062, 0.08233451843261719, 0.08571624755859375, 0.08909797668457031, 0.09247970581054688, 0.09586143493652344, 0.0992431640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 15.0, 22.0, 16.0, 23.0, 28.0, 30.0, 48.0, 58.0, 73.0, 74.0, 80.0, 67.0, 79.0, 55.0, 65.0, 68.0, 43.0, 27.0, 21.0, 14.0, 13.0, 10.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08795166015625, -0.08558177947998047, -0.08321189880371094, -0.0808420181274414, -0.07847213745117188, -0.07610225677490234, -0.07373237609863281, -0.07136249542236328, -0.06899261474609375, -0.06662273406982422, -0.06425285339355469, -0.061882972717285156, -0.059513092041015625, -0.057143211364746094, -0.05477333068847656, -0.05240345001220703, -0.0500335693359375, -0.04766368865966797, -0.04529380798339844, -0.042923927307128906, -0.040554046630859375, -0.038184165954589844, -0.03581428527832031, -0.03344440460205078, -0.03107452392578125, -0.02870464324951172, -0.026334762573242188, -0.023964881896972656, -0.021595001220703125, -0.019225120544433594, -0.016855239868164062, -0.014485359191894531, -0.012115478515625, -0.009745597839355469, -0.0073757171630859375, -0.005005836486816406, -0.002635955810546875, -0.00026607513427734375, 0.0021038055419921875, 0.004473686218261719, 0.00684356689453125, 0.009213447570800781, 0.011583328247070312, 0.013953208923339844, 0.016323089599609375, 0.018692970275878906, 0.021062850952148438, 0.02343273162841797, 0.0258026123046875, 0.02817249298095703, 0.030542373657226562, 0.032912254333496094, 0.035282135009765625, 0.037652015686035156, 0.04002189636230469, 0.04239177703857422, 0.04476165771484375, 0.04713153839111328, 0.04950141906738281, 0.051871299743652344, 0.054241180419921875, 0.056611061096191406, 0.05898094177246094, 0.06135082244873047, 0.063720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 11.0, 92.0, 785.0, 112.0, 13.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.077866554260254, -0.9116312861442566, -0.7453960180282593, -0.579160749912262, -0.41292548179626465, -0.24669021368026733, -0.08045494556427002, 0.08578038215637207, 0.2520155906677246, 0.4182508587837219, 0.5844861268997192, 0.7507213950157166, 0.9169566631317139, 1.0831918716430664, 1.2494271993637085, 1.4156625270843506, 1.5818977355957031, 1.7481329441070557, 1.9143682718276978, 2.08060359954834, 2.2468388080596924, 2.413074016571045, 2.5793094635009766, 2.745544672012329, 2.9117798805236816, 3.078015089035034, 3.2442502975463867, 3.4104857444763184, 3.576720952987671, 3.7429561614990234, 3.909191608428955, 4.075427055358887, 4.24166202545166, 4.407897472381592, 4.574132442474365, 4.740367889404297, 4.90660285949707, 5.072838306427002, 5.239073753356934, 5.405308723449707, 5.571544170379639, 5.73777961730957, 5.904014587402344, 6.070250034332275, 6.236485481262207, 6.4027204513549805, 6.568955898284912, 6.735191345214844, 6.901426315307617, 7.067661762237549, 7.233896732330322, 7.400132179260254, 7.566367149353027, 7.732602596282959, 7.898838043212891, 8.065073013305664, 8.231307983398438, 8.397542953491211, 8.5637788772583, 8.730013847351074, 8.896248817443848, 9.062484741210938, 9.228719711303711, 9.394954681396484, 9.561190605163574]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 10.0, 4.0, 6.0, 8.0, 16.0, 12.0, 19.0, 23.0, 37.0, 69.0, 52.0, 65.0, 75.0, 71.0, 83.0, 83.0, 71.0, 63.0, 48.0, 49.0, 20.0, 15.0, 17.0, 10.0, 17.0, 9.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1898272037506104, -1.1554876565933228, -1.1211482286453247, -1.086808681488037, -1.052469253540039, -1.0181297063827515, -0.9837902188301086, -0.9494507312774658, -0.915111243724823, -0.8807717561721802, -0.8464322686195374, -0.8120927810668945, -0.7777532339096069, -0.7434138059616089, -0.7090742588043213, -0.6747347712516785, -0.6403952836990356, -0.6060557961463928, -0.57171630859375, -0.5373768210411072, -0.5030373334884644, -0.46869781613349915, -0.43435829877853394, -0.4000188112258911, -0.3656793236732483, -0.33133983612060547, -0.29700034856796265, -0.26266083121299744, -0.22832134366035461, -0.1939818561077118, -0.15964235365390778, -0.12530285120010376, -0.09096336364746094, -0.05662386864423752, -0.0222843736410141, 0.01205512136220932, 0.04639461636543274, 0.08073410391807556, 0.11507360637187958, 0.1494131088256836, 0.18375259637832642, 0.21809208393096924, 0.25243157148361206, 0.28677108883857727, 0.3211105763912201, 0.3554500639438629, 0.3897895812988281, 0.42412906885147095, 0.45846855640411377, 0.4928080439567566, 0.5271475315093994, 0.5614870190620422, 0.5958265066146851, 0.6301660537719727, 0.6645055413246155, 0.6988450288772583, 0.7331845164299011, 0.767524003982544, 0.8018634915351868, 0.8362029790878296, 0.8705425262451172, 0.9048819541931152, 0.9392215013504028, 0.9735609889030457, 1.0079004764556885]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 16.0, 11.0, 18.0, 28.0, 30.0, 27.0, 65.0, 79.0, 106.0, 139.0, 200.0, 333.0, 436.0, 660.0, 1059.0, 1706.0, 3092.0, 6029.0, 13899.0, 46188.0, 878554.0, 3159404.0, 52098.0, 14899.0, 6340.0, 3187.0, 1788.0, 1147.0, 737.0, 512.0, 357.0, 246.0, 205.0, 150.0, 112.0, 78.0, 69.0, 47.0, 52.0, 40.0, 28.0, 28.0, 23.0, 15.0, 14.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3408050537109375, -0.329071044921875, -0.3173370361328125, -0.30560302734375, -0.2938690185546875, -0.282135009765625, -0.2704010009765625, -0.2586669921875, -0.2469329833984375, -0.235198974609375, -0.2234649658203125, -0.21173095703125, -0.1999969482421875, -0.188262939453125, -0.1765289306640625, -0.164794921875, -0.1530609130859375, -0.141326904296875, -0.1295928955078125, -0.11785888671875, -0.1061248779296875, -0.094390869140625, -0.0826568603515625, -0.0709228515625, -0.0591888427734375, -0.047454833984375, -0.0357208251953125, -0.02398681640625, -0.0122528076171875, -0.000518798828125, 0.0112152099609375, 0.02294921875, 0.0346832275390625, 0.046417236328125, 0.0581512451171875, 0.06988525390625, 0.0816192626953125, 0.093353271484375, 0.1050872802734375, 0.1168212890625, 0.1285552978515625, 0.140289306640625, 0.1520233154296875, 0.16375732421875, 0.1754913330078125, 0.187225341796875, 0.1989593505859375, 0.210693359375, 0.2224273681640625, 0.234161376953125, 0.2458953857421875, 0.25762939453125, 0.2693634033203125, 0.281097412109375, 0.2928314208984375, 0.3045654296875, 0.3162994384765625, 0.328033447265625, 0.3397674560546875, 0.35150146484375, 0.3632354736328125, 0.374969482421875, 0.3867034912109375, 0.3984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 8.0, 5.0, 3.0, 6.0, 2.0, 6.0, 14.0, 12.0, 22.0, 31.0, 44.0, 65.0, 110.0, 161.0, 133.0, 117.0, 94.0, 47.0, 38.0, 27.0, 13.0, 11.0, 7.0, 3.0, 2.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.034088134765625, -0.032959938049316406, -0.03183174133300781, -0.03070354461669922, -0.029575347900390625, -0.02844715118408203, -0.027318954467773438, -0.026190757751464844, -0.02506256103515625, -0.023934364318847656, -0.022806167602539062, -0.02167797088623047, -0.020549774169921875, -0.01942157745361328, -0.018293380737304688, -0.017165184020996094, -0.0160369873046875, -0.014908790588378906, -0.013780593872070312, -0.012652397155761719, -0.011524200439453125, -0.010396003723144531, -0.009267807006835938, -0.008139610290527344, -0.00701141357421875, -0.005883216857910156, -0.0047550201416015625, -0.0036268234252929688, -0.002498626708984375, -0.0013704299926757812, -0.0002422332763671875, 0.0008859634399414062, 0.00201416015625, 0.0031423568725585938, 0.0042705535888671875, 0.005398750305175781, 0.006526947021484375, 0.007655143737792969, 0.008783340454101562, 0.009911537170410156, 0.01103973388671875, 0.012167930603027344, 0.013296127319335938, 0.014424324035644531, 0.015552520751953125, 0.01668071746826172, 0.017808914184570312, 0.018937110900878906, 0.0200653076171875, 0.021193504333496094, 0.022321701049804688, 0.02344989776611328, 0.024578094482421875, 0.02570629119873047, 0.026834487915039062, 0.027962684631347656, 0.02909088134765625, 0.030219078063964844, 0.03134727478027344, 0.03247547149658203, 0.033603668212890625, 0.03473186492919922, 0.03586006164550781, 0.036988258361816406, 0.038116455078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 8.0, 16.0, 12.0, 27.0, 66.0, 133.0, 344.0, 1361.0, 10417.0, 321676.0, 3829569.0, 26984.0, 2699.0, 571.0, 181.0, 87.0, 39.0, 25.0, 20.0, 12.0, 8.0, 1.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8121795654296875, -0.788421630859375, -0.7646636962890625, -0.74090576171875, -0.7171478271484375, -0.693389892578125, -0.6696319580078125, -0.6458740234375, -0.6221160888671875, -0.598358154296875, -0.5746002197265625, -0.55084228515625, -0.5270843505859375, -0.503326416015625, -0.4795684814453125, -0.455810546875, -0.4320526123046875, -0.408294677734375, -0.3845367431640625, -0.36077880859375, -0.3370208740234375, -0.313262939453125, -0.2895050048828125, -0.2657470703125, -0.2419891357421875, -0.218231201171875, -0.1944732666015625, -0.17071533203125, -0.1469573974609375, -0.123199462890625, -0.0994415283203125, -0.07568359375, -0.0519256591796875, -0.028167724609375, -0.0044097900390625, 0.01934814453125, 0.0431060791015625, 0.066864013671875, 0.0906219482421875, 0.1143798828125, 0.1381378173828125, 0.161895751953125, 0.1856536865234375, 0.20941162109375, 0.2331695556640625, 0.256927490234375, 0.2806854248046875, 0.304443359375, 0.3282012939453125, 0.351959228515625, 0.3757171630859375, 0.39947509765625, 0.4232330322265625, 0.446990966796875, 0.4707489013671875, 0.4945068359375, 0.5182647705078125, 0.542022705078125, 0.5657806396484375, 0.58953857421875, 0.6132965087890625, 0.637054443359375, 0.6608123779296875, 0.6845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 10.0, 22.0, 28.0, 49.0, 69.0, 113.0, 276.0, 683.0, 1950.0, 410.0, 193.0, 89.0, 50.0, 37.0, 20.0, 16.0, 12.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06629371643066406, -0.06410598754882812, -0.06191825866699219, -0.05973052978515625, -0.05754280090332031, -0.055355072021484375, -0.05316734313964844, -0.0509796142578125, -0.04879188537597656, -0.046604156494140625, -0.04441642761230469, -0.04222869873046875, -0.04004096984863281, -0.037853240966796875, -0.03566551208496094, -0.033477783203125, -0.03129005432128906, -0.029102325439453125, -0.026914596557617188, -0.02472686767578125, -0.022539138793945312, -0.020351409912109375, -0.018163681030273438, -0.0159759521484375, -0.013788223266601562, -0.011600494384765625, -0.009412765502929688, -0.00722503662109375, -0.0050373077392578125, -0.002849578857421875, -0.0006618499755859375, 0.00152587890625, 0.0037136077880859375, 0.005901336669921875, 0.008089065551757812, 0.01027679443359375, 0.012464523315429688, 0.014652252197265625, 0.016839981079101562, 0.0190277099609375, 0.021215438842773438, 0.023403167724609375, 0.025590896606445312, 0.02777862548828125, 0.029966354370117188, 0.032154083251953125, 0.03434181213378906, 0.036529541015625, 0.03871726989746094, 0.040904998779296875, 0.04309272766113281, 0.04528045654296875, 0.04746818542480469, 0.049655914306640625, 0.05184364318847656, 0.0540313720703125, 0.05621910095214844, 0.058406829833984375, 0.06059455871582031, 0.06278228759765625, 0.06497001647949219, 0.06715774536132812, 0.06934547424316406, 0.071533203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 16.0, 19.0, 26.0, 75.0, 120.0, 136.0, 190.0, 147.0, 107.0, 67.0, 32.0, 23.0, 11.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3303999900817871, -0.32059523463249207, -0.31079044938087463, -0.3009856939315796, -0.29118093848228455, -0.2813761830329895, -0.27157139778137207, -0.261766642332077, -0.251961886882782, -0.24215711653232574, -0.2323523610830307, -0.22254759073257446, -0.21274283528327942, -0.20293806493282318, -0.19313329458236694, -0.1833285391330719, -0.17352375388145447, -0.16371898353099823, -0.15391422808170319, -0.14410945773124695, -0.1343047022819519, -0.12449993193149567, -0.11469516158103943, -0.10489039868116379, -0.09508563578128815, -0.0852808728814125, -0.07547610998153687, -0.06567133963108063, -0.05586657673120499, -0.046061813831329346, -0.036257047206163406, -0.026452280580997467, -0.016647517681121826, -0.006842752918601036, 0.002962011843919754, 0.012766776606440544, 0.022571541368961334, 0.032376304268836975, 0.042181070894002914, 0.051985837519168854, 0.061790600419044495, 0.07159536331892014, 0.08140012621879578, 0.09120489656925201, 0.10100965946912766, 0.1108144223690033, 0.12061919271945953, 0.13042396306991577, 0.14022871851921082, 0.15003348886966705, 0.1598382443189621, 0.16964301466941833, 0.17944777011871338, 0.18925254046916962, 0.19905731081962585, 0.2088620662689209, 0.21866683661937714, 0.22847160696983337, 0.23827636241912842, 0.24808113276958466, 0.2578859031200409, 0.26769065856933594, 0.277495414018631, 0.2873001992702484, 0.29710495471954346]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 4.0, 8.0, 10.0, 7.0, 15.0, 22.0, 21.0, 32.0, 39.0, 36.0, 43.0, 58.0, 63.0, 62.0, 70.0, 69.0, 57.0, 59.0, 57.0, 41.0, 59.0, 34.0, 28.0, 25.0, 20.0, 16.0, 7.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23356515169143677, -0.22616197168827057, -0.21875879168510437, -0.21135561168193817, -0.20395243167877197, -0.19654925167560577, -0.18914607167243958, -0.18174290657043457, -0.17433971166610718, -0.16693653166294098, -0.15953335165977478, -0.15213017165660858, -0.14472699165344238, -0.13732381165027618, -0.12992063164710999, -0.12251745909452438, -0.11511428654193878, -0.10771110653877258, -0.10030792653560638, -0.09290474653244019, -0.08550156652927399, -0.07809838652610779, -0.07069521397352219, -0.06329203397035599, -0.05588885396718979, -0.04848567396402359, -0.04108249396085739, -0.03367931768298149, -0.026276137679815292, -0.018872957676649094, -0.011469781398773193, -0.004066601395606995, 0.003336578607559204, 0.010739757679402828, 0.018142936751246452, 0.025546114891767502, 0.0329492948949337, 0.0403524748980999, 0.0477556511759758, 0.055158831179142, 0.0625620111823082, 0.0699651911854744, 0.0773683711886406, 0.0847715437412262, 0.0921747237443924, 0.0995779037475586, 0.10698108375072479, 0.11438426375389099, 0.12178744375705719, 0.1291906237602234, 0.1365938037633896, 0.1439969837665558, 0.15140016376972198, 0.15880334377288818, 0.1662065088748932, 0.17360970377922058, 0.18101286888122559, 0.18841604888439178, 0.19581922888755798, 0.20322240889072418, 0.21062558889389038, 0.21802876889705658, 0.22543194890022278, 0.23283511400222778, 0.24023830890655518]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 15.0, 18.0, 25.0, 31.0, 42.0, 68.0, 79.0, 138.0, 211.0, 291.0, 461.0, 811.0, 1392.0, 2460.0, 4779.0, 10877.0, 32468.0, 167038.0, 647489.0, 132026.0, 28150.0, 9604.0, 4405.0, 2279.0, 1228.0, 726.0, 454.0, 305.0, 193.0, 150.0, 96.0, 65.0, 48.0, 38.0, 26.0, 23.0, 8.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22307205200195312, -0.21494293212890625, -0.20681381225585938, -0.1986846923828125, -0.19055557250976562, -0.18242645263671875, -0.17429733276367188, -0.166168212890625, -0.15803909301757812, -0.14990997314453125, -0.14178085327148438, -0.1336517333984375, -0.12552261352539062, -0.11739349365234375, -0.10926437377929688, -0.10113525390625, -0.09300613403320312, -0.08487701416015625, -0.07674789428710938, -0.0686187744140625, -0.060489654541015625, -0.05236053466796875, -0.044231414794921875, -0.036102294921875, -0.027973175048828125, -0.01984405517578125, -0.011714935302734375, -0.0035858154296875, 0.004543304443359375, 0.01267242431640625, 0.020801544189453125, 0.0289306640625, 0.037059783935546875, 0.04518890380859375, 0.053318023681640625, 0.0614471435546875, 0.06957626342773438, 0.07770538330078125, 0.08583450317382812, 0.093963623046875, 0.10209274291992188, 0.11022186279296875, 0.11835098266601562, 0.1264801025390625, 0.13460922241210938, 0.14273834228515625, 0.15086746215820312, 0.15899658203125, 0.16712570190429688, 0.17525482177734375, 0.18338394165039062, 0.1915130615234375, 0.19964218139648438, 0.20777130126953125, 0.21590042114257812, 0.224029541015625, 0.23215866088867188, 0.24028778076171875, 0.24841690063476562, 0.2565460205078125, 0.2646751403808594, 0.27280426025390625, 0.2809333801269531, 0.2890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 5.0, 11.0, 13.0, 23.0, 31.0, 55.0, 78.0, 122.0, 159.0, 166.0, 115.0, 79.0, 41.0, 32.0, 19.0, 10.0, 9.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038909912109375, -0.03768587112426758, -0.036461830139160156, -0.035237789154052734, -0.03401374816894531, -0.03278970718383789, -0.03156566619873047, -0.030341625213623047, -0.029117584228515625, -0.027893543243408203, -0.02666950225830078, -0.02544546127319336, -0.024221420288085938, -0.022997379302978516, -0.021773338317871094, -0.020549297332763672, -0.01932525634765625, -0.018101215362548828, -0.016877174377441406, -0.015653133392333984, -0.014429092407226562, -0.01320505142211914, -0.011981010437011719, -0.010756969451904297, -0.009532928466796875, -0.008308887481689453, -0.007084846496582031, -0.005860805511474609, -0.0046367645263671875, -0.0034127235412597656, -0.0021886825561523438, -0.0009646415710449219, 0.0002593994140625, 0.0014834403991699219, 0.0027074813842773438, 0.003931522369384766, 0.0051555633544921875, 0.006379604339599609, 0.007603645324707031, 0.008827686309814453, 0.010051727294921875, 0.011275768280029297, 0.012499809265136719, 0.01372385025024414, 0.014947891235351562, 0.016171932220458984, 0.017395973205566406, 0.018620014190673828, 0.01984405517578125, 0.021068096160888672, 0.022292137145996094, 0.023516178131103516, 0.024740219116210938, 0.02596426010131836, 0.02718830108642578, 0.028412342071533203, 0.029636383056640625, 0.030860424041748047, 0.03208446502685547, 0.03330850601196289, 0.03453254699707031, 0.035756587982177734, 0.036980628967285156, 0.03820466995239258, 0.0394287109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 13.0, 9.0, 16.0, 21.0, 46.0, 53.0, 79.0, 113.0, 160.0, 303.0, 529.0, 1075.0, 2992.0, 10795.0, 56439.0, 374243.0, 499517.0, 80594.0, 14917.0, 3821.0, 1325.0, 562.0, 333.0, 224.0, 107.0, 58.0, 49.0, 33.0, 29.0, 19.0, 15.0, 8.0, 11.0, 9.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23313331604003906, -0.22420120239257812, -0.2152690887451172, -0.20633697509765625, -0.1974048614501953, -0.18847274780273438, -0.17954063415527344, -0.1706085205078125, -0.16167640686035156, -0.15274429321289062, -0.1438121795654297, -0.13488006591796875, -0.1259479522705078, -0.11701583862304688, -0.10808372497558594, -0.099151611328125, -0.09021949768066406, -0.08128738403320312, -0.07235527038574219, -0.06342315673828125, -0.05449104309082031, -0.045558929443359375, -0.03662681579589844, -0.0276947021484375, -0.018762588500976562, -0.009830474853515625, -0.0008983612060546875, 0.00803375244140625, 0.016965866088867188, 0.025897979736328125, 0.03483009338378906, 0.04376220703125, 0.05269432067871094, 0.061626434326171875, 0.07055854797363281, 0.07949066162109375, 0.08842277526855469, 0.09735488891601562, 0.10628700256347656, 0.1152191162109375, 0.12415122985839844, 0.13308334350585938, 0.1420154571533203, 0.15094757080078125, 0.1598796844482422, 0.16881179809570312, 0.17774391174316406, 0.186676025390625, 0.19560813903808594, 0.20454025268554688, 0.2134723663330078, 0.22240447998046875, 0.2313365936279297, 0.24026870727539062, 0.24920082092285156, 0.2581329345703125, 0.26706504821777344, 0.2759971618652344, 0.2849292755126953, 0.29386138916015625, 0.3027935028076172, 0.3117256164550781, 0.32065773010253906, 0.32958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 2.0, 10.0, 7.0, 11.0, 6.0, 12.0, 14.0, 20.0, 16.0, 28.0, 24.0, 29.0, 29.0, 35.0, 36.0, 37.0, 54.0, 52.0, 54.0, 40.0, 44.0, 48.0, 54.0, 46.0, 42.0, 39.0, 32.0, 35.0, 29.0, 19.0, 13.0, 14.0, 12.0, 9.0, 17.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09634971618652344, -0.09260177612304688, -0.08885383605957031, -0.08510589599609375, -0.08135795593261719, -0.07761001586914062, -0.07386207580566406, -0.0701141357421875, -0.06636619567871094, -0.06261825561523438, -0.05887031555175781, -0.05512237548828125, -0.05137443542480469, -0.047626495361328125, -0.04387855529785156, -0.040130615234375, -0.03638267517089844, -0.032634735107421875, -0.028886795043945312, -0.02513885498046875, -0.021390914916992188, -0.017642974853515625, -0.013895034790039062, -0.0101470947265625, -0.0063991546630859375, -0.002651214599609375, 0.0010967254638671875, 0.00484466552734375, 0.008592605590820312, 0.012340545654296875, 0.016088485717773438, 0.01983642578125, 0.023584365844726562, 0.027332305908203125, 0.031080245971679688, 0.03482818603515625, 0.03857612609863281, 0.042324066162109375, 0.04607200622558594, 0.0498199462890625, 0.05356788635253906, 0.057315826416015625, 0.06106376647949219, 0.06481170654296875, 0.06855964660644531, 0.07230758666992188, 0.07605552673339844, 0.079803466796875, 0.08355140686035156, 0.08729934692382812, 0.09104728698730469, 0.09479522705078125, 0.09854316711425781, 0.10229110717773438, 0.10603904724121094, 0.1097869873046875, 0.11353492736816406, 0.11728286743164062, 0.12103080749511719, 0.12477874755859375, 0.1285266876220703, 0.13227462768554688, 0.13602256774902344, 0.1397705078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 20.0, 19.0, 53.0, 67.0, 66.0, 133.0, 166.0, 222.0, 319.0, 551.0, 922.0, 1682.0, 3171.0, 6682.0, 15176.0, 37878.0, 104135.0, 296515.0, 357164.0, 138945.0, 48746.0, 19120.0, 7989.0, 3872.0, 2043.0, 1096.0, 559.0, 397.0, 239.0, 151.0, 113.0, 80.0, 52.0, 51.0, 31.0, 25.0, 16.0, 14.0, 5.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08282470703125, -0.0802469253540039, -0.07766914367675781, -0.07509136199951172, -0.07251358032226562, -0.06993579864501953, -0.06735801696777344, -0.06478023529052734, -0.06220245361328125, -0.059624671936035156, -0.05704689025878906, -0.05446910858154297, -0.051891326904296875, -0.04931354522705078, -0.04673576354980469, -0.044157981872558594, -0.0415802001953125, -0.039002418518066406, -0.03642463684082031, -0.03384685516357422, -0.031269073486328125, -0.02869129180908203, -0.026113510131835938, -0.023535728454589844, -0.02095794677734375, -0.018380165100097656, -0.015802383422851562, -0.013224601745605469, -0.010646820068359375, -0.008069038391113281, -0.0054912567138671875, -0.0029134750366210938, -0.000335693359375, 0.0022420883178710938, 0.0048198699951171875, 0.007397651672363281, 0.009975433349609375, 0.012553215026855469, 0.015130996704101562, 0.017708778381347656, 0.02028656005859375, 0.022864341735839844, 0.025442123413085938, 0.02801990509033203, 0.030597686767578125, 0.03317546844482422, 0.03575325012207031, 0.038331031799316406, 0.0409088134765625, 0.043486595153808594, 0.04606437683105469, 0.04864215850830078, 0.051219940185546875, 0.05379772186279297, 0.05637550354003906, 0.058953285217285156, 0.06153106689453125, 0.06410884857177734, 0.06668663024902344, 0.06926441192626953, 0.07184219360351562, 0.07441997528076172, 0.07699775695800781, 0.0795755386352539, 0.0821533203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 14.0, 14.0, 14.0, 24.0, 23.0, 34.0, 39.0, 37.0, 45.0, 58.0, 79.0, 73.0, 84.0, 65.0, 68.0, 52.0, 48.0, 52.0, 33.0, 29.0, 23.0, 21.0, 15.0, 15.0, 8.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.647804260253906e-05, -3.535579890012741e-05, -3.423355519771576e-05, -3.311131149530411e-05, -3.1989067792892456e-05, -3.0866824090480804e-05, -2.9744580388069153e-05, -2.86223366856575e-05, -2.750009298324585e-05, -2.6377849280834198e-05, -2.5255605578422546e-05, -2.4133361876010895e-05, -2.3011118173599243e-05, -2.188887447118759e-05, -2.076663076877594e-05, -1.964438706636429e-05, -1.8522143363952637e-05, -1.7399899661540985e-05, -1.6277655959129333e-05, -1.5155412256717682e-05, -1.403316855430603e-05, -1.2910924851894379e-05, -1.1788681149482727e-05, -1.0666437447071075e-05, -9.544193744659424e-06, -8.421950042247772e-06, -7.299706339836121e-06, -6.177462637424469e-06, -5.055218935012817e-06, -3.932975232601166e-06, -2.810731530189514e-06, -1.6884878277778625e-06, -5.662441253662109e-07, 5.559995770454407e-07, 1.6782432794570923e-06, 2.800486981868744e-06, 3.9227306842803955e-06, 5.044974386692047e-06, 6.167218089103699e-06, 7.28946179151535e-06, 8.411705493927002e-06, 9.533949196338654e-06, 1.0656192898750305e-05, 1.1778436601161957e-05, 1.2900680303573608e-05, 1.402292400598526e-05, 1.5145167708396912e-05, 1.6267411410808563e-05, 1.7389655113220215e-05, 1.8511898815631866e-05, 1.9634142518043518e-05, 2.075638622045517e-05, 2.187862992286682e-05, 2.3000873625278473e-05, 2.4123117327690125e-05, 2.5245361030101776e-05, 2.6367604732513428e-05, 2.748984843492508e-05, 2.861209213733673e-05, 2.9734335839748383e-05, 3.0856579542160034e-05, 3.1978823244571686e-05, 3.310106694698334e-05, 3.422331064939499e-05, 3.534555435180664e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 9.0, 11.0, 15.0, 25.0, 40.0, 46.0, 87.0, 112.0, 228.0, 416.0, 786.0, 1908.0, 5688.0, 20903.0, 105175.0, 549593.0, 296652.0, 49323.0, 11330.0, 3462.0, 1330.0, 577.0, 327.0, 176.0, 93.0, 73.0, 37.0, 27.0, 18.0, 13.0, 19.0, 12.0, 9.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13454437255859375, -0.1301727294921875, -0.12580108642578125, -0.121429443359375, -0.11705780029296875, -0.1126861572265625, -0.10831451416015625, -0.10394287109375, -0.09957122802734375, -0.0951995849609375, -0.09082794189453125, -0.086456298828125, -0.08208465576171875, -0.0777130126953125, -0.07334136962890625, -0.0689697265625, -0.06459808349609375, -0.0602264404296875, -0.05585479736328125, -0.051483154296875, -0.04711151123046875, -0.0427398681640625, -0.03836822509765625, -0.03399658203125, -0.02962493896484375, -0.0252532958984375, -0.02088165283203125, -0.016510009765625, -0.01213836669921875, -0.0077667236328125, -0.00339508056640625, 0.0009765625, 0.00534820556640625, 0.0097198486328125, 0.01409149169921875, 0.018463134765625, 0.02283477783203125, 0.0272064208984375, 0.03157806396484375, 0.03594970703125, 0.04032135009765625, 0.0446929931640625, 0.04906463623046875, 0.053436279296875, 0.05780792236328125, 0.0621795654296875, 0.06655120849609375, 0.0709228515625, 0.07529449462890625, 0.0796661376953125, 0.08403778076171875, 0.088409423828125, 0.09278106689453125, 0.0971527099609375, 0.10152435302734375, 0.10589599609375, 0.11026763916015625, 0.1146392822265625, 0.11901092529296875, 0.123382568359375, 0.12775421142578125, 0.1321258544921875, 0.13649749755859375, 0.140869140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 4.0, 8.0, 7.0, 10.0, 14.0, 16.0, 27.0, 28.0, 29.0, 43.0, 49.0, 55.0, 62.0, 71.0, 69.0, 66.0, 76.0, 59.0, 57.0, 48.0, 35.0, 24.0, 22.0, 18.0, 14.0, 14.0, 7.0, 13.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.060272216796875, -0.058428287506103516, -0.05658435821533203, -0.05474042892456055, -0.05289649963378906, -0.05105257034301758, -0.049208641052246094, -0.04736471176147461, -0.045520782470703125, -0.04367685317993164, -0.041832923889160156, -0.03998899459838867, -0.03814506530761719, -0.0363011360168457, -0.03445720672607422, -0.032613277435302734, -0.03076934814453125, -0.028925418853759766, -0.02708148956298828, -0.025237560272216797, -0.023393630981445312, -0.021549701690673828, -0.019705772399902344, -0.01786184310913086, -0.016017913818359375, -0.01417398452758789, -0.012330055236816406, -0.010486125946044922, -0.008642196655273438, -0.006798267364501953, -0.004954338073730469, -0.0031104087829589844, -0.0012664794921875, 0.0005774497985839844, 0.0024213790893554688, 0.004265308380126953, 0.0061092376708984375, 0.007953166961669922, 0.009797096252441406, 0.01164102554321289, 0.013484954833984375, 0.01532888412475586, 0.017172813415527344, 0.019016742706298828, 0.020860671997070312, 0.022704601287841797, 0.02454853057861328, 0.026392459869384766, 0.02823638916015625, 0.030080318450927734, 0.03192424774169922, 0.0337681770324707, 0.03561210632324219, 0.03745603561401367, 0.039299964904785156, 0.04114389419555664, 0.042987823486328125, 0.04483175277709961, 0.046675682067871094, 0.04851961135864258, 0.05036354064941406, 0.05220746994018555, 0.05405139923095703, 0.055895328521728516, 0.0577392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 13.0, 27.0, 53.0, 118.0, 233.0, 238.0, 146.0, 94.0, 35.0, 14.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8776824474334717, -1.8176438808441162, -1.7576054334640503, -1.6975668668746948, -1.6375283002853394, -1.5774898529052734, -1.517451286315918, -1.4574127197265625, -1.397374153137207, -1.3373355865478516, -1.2772971391677856, -1.2172585725784302, -1.1572200059890747, -1.0971815586090088, -1.0371429920196533, -0.9771044254302979, -0.9170659780502319, -0.8570274710655212, -0.7969889044761658, -0.7369503974914551, -0.6769118309020996, -0.6168733239173889, -0.5568348169326782, -0.49679628014564514, -0.43675774335861206, -0.376719206571579, -0.3166806697845459, -0.2566421627998352, -0.19660362601280212, -0.13656508922576904, -0.07652658224105835, -0.01648804545402527, 0.04355049133300781, 0.1035890206694603, 0.16362755000591278, 0.22366607189178467, 0.28370460867881775, 0.34374314546585083, 0.4037816524505615, 0.4638201892375946, 0.5238587260246277, 0.5838972330093384, 0.6439357995986938, 0.7039743065834045, 0.7640128135681152, 0.8240513801574707, 0.8840898871421814, 0.9441283941268921, 1.0041669607162476, 1.064205527305603, 1.124243974685669, 1.1842825412750244, 1.2443211078643799, 1.3043596744537354, 1.3643981218338013, 1.4244366884231567, 1.4844751358032227, 1.5445137023925781, 1.604552149772644, 1.6645907163619995, 1.724629282951355, 1.784667730331421, 1.8447062969207764, 1.9047448635101318, 1.9647834300994873]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 17.0, 17.0, 21.0, 29.0, 25.0, 45.0, 39.0, 50.0, 64.0, 75.0, 72.0, 60.0, 67.0, 58.0, 45.0, 46.0, 45.0, 39.0, 32.0, 19.0, 20.0, 19.0, 18.0, 14.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9781767725944519, -0.9423176050186157, -0.9064583778381348, -0.8705992102622986, -0.8347400426864624, -0.7988808751106262, -0.76302170753479, -0.7271624803543091, -0.6913033127784729, -0.6554441452026367, -0.6195849180221558, -0.5837257504463196, -0.5478665828704834, -0.5120074152946472, -0.47614821791648865, -0.4402890205383301, -0.4044298529624939, -0.3685706853866577, -0.33271148800849915, -0.2968522906303406, -0.2609931230545044, -0.22513394057750702, -0.18927475810050964, -0.15341556072235107, -0.11755639314651489, -0.08169721066951752, -0.04583802819252014, -0.009978845715522766, 0.02588033676147461, 0.061739519238471985, 0.09759870171546936, 0.13345789909362793, 0.1693171262741089, 0.20517630875110626, 0.24103549122810364, 0.2768946886062622, 0.3127538561820984, 0.34861302375793457, 0.38447222113609314, 0.4203314185142517, 0.4561905860900879, 0.4920497536659241, 0.5279089212417603, 0.5637681484222412, 0.5996273159980774, 0.6354864835739136, 0.6713457107543945, 0.7072048783302307, 0.7430640459060669, 0.7789232134819031, 0.8147823810577393, 0.8506416082382202, 0.8865007758140564, 0.9223599433898926, 0.9582191705703735, 0.9940783381462097, 1.029937505722046, 1.0657967329025269, 1.1016558408737183, 1.1375150680541992, 1.1733741760253906, 1.2092334032058716, 1.2450926303863525, 1.280951738357544, 1.316810965538025]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 1.0, 1.0, 10.0, 17.0, 11.0, 40.0, 100.0, 197.0, 571.0, 2373.0, 19596.0, 4051129.0, 112363.0, 5714.0, 1266.0, 462.0, 194.0, 111.0, 42.0, 29.0, 17.0, 14.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9731292724609375, -0.940399169921875, -0.9076690673828125, -0.87493896484375, -0.8422088623046875, -0.809478759765625, -0.7767486572265625, -0.7440185546875, -0.7112884521484375, -0.678558349609375, -0.6458282470703125, -0.61309814453125, -0.5803680419921875, -0.547637939453125, -0.5149078369140625, -0.482177734375, -0.4494476318359375, -0.416717529296875, -0.3839874267578125, -0.35125732421875, -0.3185272216796875, -0.285797119140625, -0.2530670166015625, -0.2203369140625, -0.1876068115234375, -0.154876708984375, -0.1221466064453125, -0.08941650390625, -0.0566864013671875, -0.023956298828125, 0.0087738037109375, 0.04150390625, 0.0742340087890625, 0.106964111328125, 0.1396942138671875, 0.17242431640625, 0.2051544189453125, 0.237884521484375, 0.2706146240234375, 0.3033447265625, 0.3360748291015625, 0.368804931640625, 0.4015350341796875, 0.43426513671875, 0.4669952392578125, 0.499725341796875, 0.5324554443359375, 0.565185546875, 0.5979156494140625, 0.630645751953125, 0.6633758544921875, 0.69610595703125, 0.7288360595703125, 0.761566162109375, 0.7942962646484375, 0.8270263671875, 0.8597564697265625, 0.892486572265625, 0.9252166748046875, 0.95794677734375, 0.9906768798828125, 1.023406982421875, 1.0561370849609375, 1.0888671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 7.0, 18.0, 21.0, 29.0, 43.0, 67.0, 107.0, 146.0, 131.0, 130.0, 100.0, 61.0, 46.0, 31.0, 25.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043304443359375, -0.04178476333618164, -0.04026508331298828, -0.03874540328979492, -0.03722572326660156, -0.0357060432434082, -0.034186363220214844, -0.032666683197021484, -0.031147003173828125, -0.029627323150634766, -0.028107643127441406, -0.026587963104248047, -0.025068283081054688, -0.023548603057861328, -0.02202892303466797, -0.02050924301147461, -0.01898956298828125, -0.01746988296508789, -0.01595020294189453, -0.014430522918701172, -0.012910842895507812, -0.011391162872314453, -0.009871482849121094, -0.008351802825927734, -0.006832122802734375, -0.005312442779541016, -0.0037927627563476562, -0.002273082733154297, -0.0007534027099609375, 0.0007662773132324219, 0.0022859573364257812, 0.0038056373596191406, 0.0053253173828125, 0.006844997406005859, 0.008364677429199219, 0.009884357452392578, 0.011404037475585938, 0.012923717498779297, 0.014443397521972656, 0.015963077545166016, 0.017482757568359375, 0.019002437591552734, 0.020522117614746094, 0.022041797637939453, 0.023561477661132812, 0.025081157684326172, 0.02660083770751953, 0.02812051773071289, 0.02964019775390625, 0.03115987777709961, 0.03267955780029297, 0.03419923782348633, 0.03571891784667969, 0.03723859786987305, 0.038758277893066406, 0.040277957916259766, 0.041797637939453125, 0.043317317962646484, 0.044836997985839844, 0.0463566780090332, 0.04787635803222656, 0.04939603805541992, 0.05091571807861328, 0.05243539810180664, 0.053955078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 11.0, 6.0, 11.0, 25.0, 28.0, 30.0, 50.0, 79.0, 91.0, 149.0, 222.0, 449.0, 792.0, 1542.0, 3383.0, 8209.0, 22235.0, 75676.0, 472385.0, 3292128.0, 240010.0, 49947.0, 15710.0, 5909.0, 2569.0, 1174.0, 575.0, 328.0, 175.0, 112.0, 79.0, 56.0, 32.0, 31.0, 23.0, 13.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2191162109375, -0.21164894104003906, -0.20418167114257812, -0.1967144012451172, -0.18924713134765625, -0.1817798614501953, -0.17431259155273438, -0.16684532165527344, -0.1593780517578125, -0.15191078186035156, -0.14444351196289062, -0.1369762420654297, -0.12950897216796875, -0.12204170227050781, -0.11457443237304688, -0.10710716247558594, -0.099639892578125, -0.09217262268066406, -0.08470535278320312, -0.07723808288574219, -0.06977081298828125, -0.06230354309082031, -0.054836273193359375, -0.04736900329589844, -0.0399017333984375, -0.03243446350097656, -0.024967193603515625, -0.017499923706054688, -0.01003265380859375, -0.0025653839111328125, 0.004901885986328125, 0.012369155883789062, 0.01983642578125, 0.027303695678710938, 0.034770965576171875, 0.04223823547363281, 0.04970550537109375, 0.05717277526855469, 0.06464004516601562, 0.07210731506347656, 0.0795745849609375, 0.08704185485839844, 0.09450912475585938, 0.10197639465332031, 0.10944366455078125, 0.11691093444824219, 0.12437820434570312, 0.13184547424316406, 0.139312744140625, 0.14678001403808594, 0.15424728393554688, 0.1617145538330078, 0.16918182373046875, 0.1766490936279297, 0.18411636352539062, 0.19158363342285156, 0.1990509033203125, 0.20651817321777344, 0.21398544311523438, 0.2214527130126953, 0.22891998291015625, 0.2363872528076172, 0.24385452270507812, 0.25132179260253906, 0.2587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 6.0, 9.0, 14.0, 24.0, 20.0, 20.0, 36.0, 44.0, 65.0, 106.0, 183.0, 405.0, 1612.0, 686.0, 292.0, 168.0, 124.0, 68.0, 52.0, 41.0, 23.0, 13.0, 10.0, 6.0, 11.0, 10.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05889892578125, -0.056987762451171875, -0.05507659912109375, -0.053165435791015625, -0.0512542724609375, -0.049343109130859375, -0.04743194580078125, -0.045520782470703125, -0.043609619140625, -0.041698455810546875, -0.03978729248046875, -0.037876129150390625, -0.0359649658203125, -0.034053802490234375, -0.03214263916015625, -0.030231475830078125, -0.0283203125, -0.026409149169921875, -0.02449798583984375, -0.022586822509765625, -0.0206756591796875, -0.018764495849609375, -0.01685333251953125, -0.014942169189453125, -0.013031005859375, -0.011119842529296875, -0.00920867919921875, -0.007297515869140625, -0.0053863525390625, -0.003475189208984375, -0.00156402587890625, 0.000347137451171875, 0.00225830078125, 0.004169464111328125, 0.00608062744140625, 0.007991790771484375, 0.0099029541015625, 0.011814117431640625, 0.01372528076171875, 0.015636444091796875, 0.017547607421875, 0.019458770751953125, 0.02136993408203125, 0.023281097412109375, 0.0251922607421875, 0.027103424072265625, 0.02901458740234375, 0.030925750732421875, 0.0328369140625, 0.034748077392578125, 0.03665924072265625, 0.038570404052734375, 0.0404815673828125, 0.042392730712890625, 0.04430389404296875, 0.046215057373046875, 0.048126220703125, 0.050037384033203125, 0.05194854736328125, 0.053859710693359375, 0.0557708740234375, 0.057682037353515625, 0.05959320068359375, 0.061504364013671875, 0.06341552734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 28.0, 110.0, 240.0, 350.0, 191.0, 52.0, 12.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3059757947921753, -1.2800270318984985, -1.2540782690048218, -1.228129506111145, -1.2021806240081787, -1.176231861114502, -1.1502830982208252, -1.1243343353271484, -1.0983855724334717, -1.072436809539795, -1.0464880466461182, -1.0205392837524414, -0.9945904612541199, -0.9686416387557983, -0.9426928758621216, -0.9167441129684448, -0.8907953500747681, -0.8648465871810913, -0.8388977646827698, -0.812949001789093, -0.7870002388954163, -0.7610514163970947, -0.735102653503418, -0.7091538906097412, -0.6832050681114197, -0.6572563052177429, -0.6313074827194214, -0.6053587198257446, -0.5794099569320679, -0.5534611940383911, -0.5275123715400696, -0.5015636086463928, -0.47561487555503845, -0.4496660828590393, -0.42371731996536255, -0.3977685272693634, -0.37181976437568665, -0.3458709716796875, -0.31992220878601074, -0.2939734160900116, -0.26802462339401245, -0.2420758455991745, -0.21612706780433655, -0.1901782751083374, -0.16422951221466064, -0.1382807195186615, -0.11233194172382355, -0.0863831639289856, -0.06043440103530884, -0.034485623240470886, -0.008536841720342636, 0.017411939799785614, 0.043360717594623566, 0.06930950284004211, 0.09525828063488007, 0.12120705842971802, 0.14715583622455597, 0.17310461401939392, 0.19905339181423187, 0.22500216960906982, 0.25095096230506897, 0.2768997550010681, 0.3028485178947449, 0.32879728078842163, 0.3547460734844208]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 6.0, 14.0, 13.0, 12.0, 8.0, 10.0, 14.0, 14.0, 23.0, 22.0, 27.0, 34.0, 43.0, 40.0, 37.0, 40.0, 34.0, 49.0, 41.0, 41.0, 38.0, 47.0, 43.0, 39.0, 41.0, 32.0, 27.0, 24.0, 27.0, 26.0, 22.0, 13.0, 12.0, 16.0, 9.0, 10.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.21332383155822754, -0.2074023187160492, -0.20148082077503204, -0.1955593079328537, -0.18963779509067535, -0.1837162971496582, -0.17779478430747986, -0.1718732714653015, -0.16595175862312317, -0.16003024578094482, -0.15410874783992767, -0.14818723499774933, -0.14226572215557098, -0.13634422421455383, -0.1304227113723755, -0.12450119853019714, -0.11857970058917999, -0.11265819519758224, -0.1067366823554039, -0.10081517696380615, -0.09489366412162781, -0.08897215873003006, -0.08305065333843231, -0.07712914049625397, -0.07120763510465622, -0.06528612971305847, -0.05936461687088013, -0.05344311147928238, -0.04752160236239433, -0.04160009324550629, -0.03567858785390854, -0.029757078737020493, -0.023835569620132446, -0.0179140605032444, -0.011992553249001503, -0.006071045994758606, -0.0001495368778705597, 0.005771972239017487, 0.011693477630615234, 0.01761498674750328, 0.023536495864391327, 0.029458004981279373, 0.03537951409816742, 0.04130101948976517, 0.047222528606653214, 0.05314403772354126, 0.05906554311513901, 0.06498704850673676, 0.0709085613489151, 0.07683006674051285, 0.08275157958269119, 0.08867308497428894, 0.09459459781646729, 0.10051610320806503, 0.10643760859966278, 0.11235912144184113, 0.11828062683343887, 0.12420213222503662, 0.13012364506721497, 0.1360451579093933, 0.14196665585041046, 0.1478881686925888, 0.15380966663360596, 0.1597311794757843, 0.16565269231796265]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 6.0, 7.0, 14.0, 9.0, 18.0, 33.0, 56.0, 72.0, 90.0, 194.0, 331.0, 538.0, 1023.0, 2051.0, 5323.0, 20280.0, 130314.0, 668951.0, 182309.0, 25615.0, 6500.0, 2320.0, 1033.0, 595.0, 336.0, 202.0, 120.0, 78.0, 47.0, 30.0, 21.0, 10.0, 10.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29834747314453125, -0.2885894775390625, -0.27883148193359375, -0.269073486328125, -0.25931549072265625, -0.2495574951171875, -0.23979949951171875, -0.23004150390625, -0.22028350830078125, -0.2105255126953125, -0.20076751708984375, -0.191009521484375, -0.18125152587890625, -0.1714935302734375, -0.16173553466796875, -0.1519775390625, -0.14221954345703125, -0.1324615478515625, -0.12270355224609375, -0.112945556640625, -0.10318756103515625, -0.0934295654296875, -0.08367156982421875, -0.07391357421875, -0.06415557861328125, -0.0543975830078125, -0.04463958740234375, -0.034881591796875, -0.02512359619140625, -0.0153656005859375, -0.00560760498046875, 0.004150390625, 0.01390838623046875, 0.0236663818359375, 0.03342437744140625, 0.043182373046875, 0.05294036865234375, 0.0626983642578125, 0.07245635986328125, 0.08221435546875, 0.09197235107421875, 0.1017303466796875, 0.11148834228515625, 0.121246337890625, 0.13100433349609375, 0.1407623291015625, 0.15052032470703125, 0.1602783203125, 0.17003631591796875, 0.1797943115234375, 0.18955230712890625, 0.199310302734375, 0.20906829833984375, 0.2188262939453125, 0.22858428955078125, 0.23834228515625, 0.24810028076171875, 0.2578582763671875, 0.26761627197265625, 0.277374267578125, 0.28713226318359375, 0.2968902587890625, 0.30664825439453125, 0.31640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 12.0, 16.0, 29.0, 41.0, 76.0, 77.0, 124.0, 142.0, 131.0, 111.0, 77.0, 55.0, 33.0, 21.0, 16.0, 15.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046661376953125, -0.04509735107421875, -0.0435333251953125, -0.04196929931640625, -0.0404052734375, -0.03884124755859375, -0.0372772216796875, -0.03571319580078125, -0.034149169921875, -0.03258514404296875, -0.0310211181640625, -0.02945709228515625, -0.02789306640625, -0.02632904052734375, -0.0247650146484375, -0.02320098876953125, -0.021636962890625, -0.02007293701171875, -0.0185089111328125, -0.01694488525390625, -0.015380859375, -0.01381683349609375, -0.0122528076171875, -0.01068878173828125, -0.009124755859375, -0.00756072998046875, -0.0059967041015625, -0.00443267822265625, -0.00286865234375, -0.00130462646484375, 0.0002593994140625, 0.00182342529296875, 0.003387451171875, 0.00495147705078125, 0.0065155029296875, 0.00807952880859375, 0.0096435546875, 0.01120758056640625, 0.0127716064453125, 0.01433563232421875, 0.015899658203125, 0.01746368408203125, 0.0190277099609375, 0.02059173583984375, 0.02215576171875, 0.02371978759765625, 0.0252838134765625, 0.02684783935546875, 0.028411865234375, 0.02997589111328125, 0.0315399169921875, 0.03310394287109375, 0.03466796875, 0.03623199462890625, 0.0377960205078125, 0.03936004638671875, 0.040924072265625, 0.04248809814453125, 0.0440521240234375, 0.04561614990234375, 0.04718017578125, 0.04874420166015625, 0.0503082275390625, 0.05187225341796875, 0.053436279296875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 15.0, 28.0, 31.0, 51.0, 65.0, 106.0, 160.0, 243.0, 395.0, 762.0, 1477.0, 3788.0, 11812.0, 48578.0, 243873.0, 544025.0, 148607.0, 30664.0, 8222.0, 2896.0, 1174.0, 589.0, 332.0, 205.0, 138.0, 99.0, 55.0, 42.0, 31.0, 21.0, 8.0, 9.0, 7.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26239585876464844, -0.2542839050292969, -0.2461719512939453, -0.23805999755859375, -0.2299480438232422, -0.22183609008789062, -0.21372413635253906, -0.2056121826171875, -0.19750022888183594, -0.18938827514648438, -0.1812763214111328, -0.17316436767578125, -0.1650524139404297, -0.15694046020507812, -0.14882850646972656, -0.140716552734375, -0.13260459899902344, -0.12449264526367188, -0.11638069152832031, -0.10826873779296875, -0.10015678405761719, -0.09204483032226562, -0.08393287658691406, -0.0758209228515625, -0.06770896911621094, -0.059597015380859375, -0.05148506164550781, -0.04337310791015625, -0.03526115417480469, -0.027149200439453125, -0.019037246704101562, -0.01092529296875, -0.0028133392333984375, 0.005298614501953125, 0.013410568237304688, 0.02152252197265625, 0.029634475708007812, 0.037746429443359375, 0.04585838317871094, 0.0539703369140625, 0.06208229064941406, 0.07019424438476562, 0.07830619812011719, 0.08641815185546875, 0.09453010559082031, 0.10264205932617188, 0.11075401306152344, 0.118865966796875, 0.12697792053222656, 0.13508987426757812, 0.1432018280029297, 0.15131378173828125, 0.1594257354736328, 0.16753768920898438, 0.17564964294433594, 0.1837615966796875, 0.19187355041503906, 0.19998550415039062, 0.2080974578857422, 0.21620941162109375, 0.2243213653564453, 0.23243331909179688, 0.24054527282714844, 0.2486572265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 6.0, 9.0, 10.0, 14.0, 11.0, 15.0, 25.0, 32.0, 44.0, 37.0, 41.0, 44.0, 43.0, 40.0, 53.0, 49.0, 47.0, 52.0, 57.0, 65.0, 62.0, 34.0, 34.0, 30.0, 34.0, 23.0, 21.0, 15.0, 7.0, 6.0, 6.0, 5.0, 6.0, 4.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18689727783203125, -0.1815338134765625, -0.17617034912109375, -0.170806884765625, -0.16544342041015625, -0.1600799560546875, -0.15471649169921875, -0.14935302734375, -0.14398956298828125, -0.1386260986328125, -0.13326263427734375, -0.127899169921875, -0.12253570556640625, -0.1171722412109375, -0.11180877685546875, -0.1064453125, -0.10108184814453125, -0.0957183837890625, -0.09035491943359375, -0.084991455078125, -0.07962799072265625, -0.0742645263671875, -0.06890106201171875, -0.06353759765625, -0.05817413330078125, -0.0528106689453125, -0.04744720458984375, -0.042083740234375, -0.03672027587890625, -0.0313568115234375, -0.02599334716796875, -0.0206298828125, -0.01526641845703125, -0.0099029541015625, -0.00453948974609375, 0.000823974609375, 0.00618743896484375, 0.0115509033203125, 0.01691436767578125, 0.02227783203125, 0.02764129638671875, 0.0330047607421875, 0.03836822509765625, 0.043731689453125, 0.04909515380859375, 0.0544586181640625, 0.05982208251953125, 0.065185546875, 0.07054901123046875, 0.0759124755859375, 0.08127593994140625, 0.086639404296875, 0.09200286865234375, 0.0973663330078125, 0.10272979736328125, 0.10809326171875, 0.11345672607421875, 0.1188201904296875, 0.12418365478515625, 0.129547119140625, 0.13491058349609375, 0.1402740478515625, 0.14563751220703125, 0.1510009765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 5.0, 7.0, 10.0, 17.0, 26.0, 19.0, 37.0, 64.0, 62.0, 105.0, 191.0, 284.0, 449.0, 764.0, 1272.0, 2338.0, 4503.0, 9137.0, 20748.0, 53760.0, 166049.0, 426245.0, 238070.0, 73182.0, 27402.0, 11625.0, 5471.0, 2789.0, 1558.0, 877.0, 534.0, 314.0, 211.0, 124.0, 81.0, 66.0, 44.0, 24.0, 20.0, 18.0, 18.0, 8.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09185218811035156, -0.08903884887695312, -0.08622550964355469, -0.08341217041015625, -0.08059883117675781, -0.07778549194335938, -0.07497215270996094, -0.0721588134765625, -0.06934547424316406, -0.06653213500976562, -0.06371879577636719, -0.06090545654296875, -0.05809211730957031, -0.055278778076171875, -0.05246543884277344, -0.049652099609375, -0.04683876037597656, -0.044025421142578125, -0.04121208190917969, -0.03839874267578125, -0.03558540344238281, -0.032772064208984375, -0.029958724975585938, -0.0271453857421875, -0.024332046508789062, -0.021518707275390625, -0.018705368041992188, -0.01589202880859375, -0.013078689575195312, -0.010265350341796875, -0.0074520111083984375, -0.004638671875, -0.0018253326416015625, 0.000988006591796875, 0.0038013458251953125, 0.00661468505859375, 0.009428024291992188, 0.012241363525390625, 0.015054702758789062, 0.0178680419921875, 0.020681381225585938, 0.023494720458984375, 0.026308059692382812, 0.02912139892578125, 0.03193473815917969, 0.034748077392578125, 0.03756141662597656, 0.040374755859375, 0.04318809509277344, 0.046001434326171875, 0.04881477355957031, 0.05162811279296875, 0.05444145202636719, 0.057254791259765625, 0.06006813049316406, 0.0628814697265625, 0.06569480895996094, 0.06850814819335938, 0.07132148742675781, 0.07413482666015625, 0.07694816589355469, 0.07976150512695312, 0.08257484436035156, 0.08538818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 14.0, 11.0, 18.0, 25.0, 36.0, 48.0, 46.0, 60.0, 61.0, 62.0, 84.0, 76.0, 65.0, 84.0, 53.0, 60.0, 38.0, 29.0, 17.0, 17.0, 22.0, 18.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.55839729309082e-05, -3.456976264715195e-05, -3.355555236339569e-05, -3.2541342079639435e-05, -3.152713179588318e-05, -3.0512921512126923e-05, -2.9498711228370667e-05, -2.848450094461441e-05, -2.7470290660858154e-05, -2.6456080377101898e-05, -2.5441870093345642e-05, -2.4427659809589386e-05, -2.341344952583313e-05, -2.2399239242076874e-05, -2.1385028958320618e-05, -2.037081867456436e-05, -1.9356608390808105e-05, -1.834239810705185e-05, -1.7328187823295593e-05, -1.6313977539539337e-05, -1.529976725578308e-05, -1.4285556972026825e-05, -1.3271346688270569e-05, -1.2257136404514313e-05, -1.1242926120758057e-05, -1.02287158370018e-05, -9.214505553245544e-06, -8.200295269489288e-06, -7.186084985733032e-06, -6.171874701976776e-06, -5.15766441822052e-06, -4.143454134464264e-06, -3.129243850708008e-06, -2.1150335669517517e-06, -1.1008232831954956e-06, -8.66129994392395e-08, 9.275972843170166e-07, 1.9418075680732727e-06, 2.956017851829529e-06, 3.970228135585785e-06, 4.984438419342041e-06, 5.998648703098297e-06, 7.012858986854553e-06, 8.02706927061081e-06, 9.041279554367065e-06, 1.0055489838123322e-05, 1.1069700121879578e-05, 1.2083910405635834e-05, 1.309812068939209e-05, 1.4112330973148346e-05, 1.5126541256904602e-05, 1.6140751540660858e-05, 1.7154961824417114e-05, 1.816917210817337e-05, 1.9183382391929626e-05, 2.0197592675685883e-05, 2.121180295944214e-05, 2.2226013243198395e-05, 2.324022352695465e-05, 2.4254433810710907e-05, 2.5268644094467163e-05, 2.628285437822342e-05, 2.7297064661979675e-05, 2.831127494573593e-05, 2.9325485229492188e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 6.0, 16.0, 16.0, 31.0, 37.0, 54.0, 78.0, 140.0, 207.0, 390.0, 778.0, 1969.0, 6028.0, 25693.0, 166710.0, 703500.0, 114610.0, 19888.0, 5031.0, 1802.0, 726.0, 354.0, 167.0, 105.0, 74.0, 41.0, 21.0, 23.0, 13.0, 8.0, 7.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744384765625, -0.1687030792236328, -0.16296768188476562, -0.15723228454589844, -0.15149688720703125, -0.14576148986816406, -0.14002609252929688, -0.1342906951904297, -0.1285552978515625, -0.12281990051269531, -0.11708450317382812, -0.11134910583496094, -0.10561370849609375, -0.09987831115722656, -0.09414291381835938, -0.08840751647949219, -0.082672119140625, -0.07693672180175781, -0.07120132446289062, -0.06546592712402344, -0.05973052978515625, -0.05399513244628906, -0.048259735107421875, -0.04252433776855469, -0.0367889404296875, -0.031053543090820312, -0.025318145751953125, -0.019582748413085938, -0.01384735107421875, -0.008111953735351562, -0.002376556396484375, 0.0033588409423828125, 0.00909423828125, 0.014829635620117188, 0.020565032958984375, 0.026300430297851562, 0.03203582763671875, 0.03777122497558594, 0.043506622314453125, 0.04924201965332031, 0.0549774169921875, 0.06071281433105469, 0.06644821166992188, 0.07218360900878906, 0.07791900634765625, 0.08365440368652344, 0.08938980102539062, 0.09512519836425781, 0.100860595703125, 0.10659599304199219, 0.11233139038085938, 0.11806678771972656, 0.12380218505859375, 0.12953758239746094, 0.13527297973632812, 0.1410083770751953, 0.1467437744140625, 0.1524791717529297, 0.15821456909179688, 0.16394996643066406, 0.16968536376953125, 0.17542076110839844, 0.18115615844726562, 0.1868915557861328, 0.192626953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 7.0, 9.0, 9.0, 7.0, 20.0, 12.0, 28.0, 29.0, 53.0, 63.0, 82.0, 92.0, 94.0, 97.0, 77.0, 49.0, 39.0, 58.0, 30.0, 34.0, 25.0, 14.0, 9.0, 8.0, 15.0, 3.0, 5.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09930419921875, -0.0966024398803711, -0.09390068054199219, -0.09119892120361328, -0.08849716186523438, -0.08579540252685547, -0.08309364318847656, -0.08039188385009766, -0.07769012451171875, -0.07498836517333984, -0.07228660583496094, -0.06958484649658203, -0.06688308715820312, -0.06418132781982422, -0.06147956848144531, -0.058777809143066406, -0.0560760498046875, -0.053374290466308594, -0.05067253112792969, -0.04797077178955078, -0.045269012451171875, -0.04256725311279297, -0.03986549377441406, -0.037163734436035156, -0.03446197509765625, -0.031760215759277344, -0.029058456420898438, -0.02635669708251953, -0.023654937744140625, -0.02095317840576172, -0.018251419067382812, -0.015549659729003906, -0.012847900390625, -0.010146141052246094, -0.0074443817138671875, -0.004742622375488281, -0.002040863037109375, 0.0006608963012695312, 0.0033626556396484375, 0.006064414978027344, 0.00876617431640625, 0.011467933654785156, 0.014169692993164062, 0.01687145233154297, 0.019573211669921875, 0.02227497100830078, 0.024976730346679688, 0.027678489685058594, 0.0303802490234375, 0.033082008361816406, 0.03578376770019531, 0.03848552703857422, 0.041187286376953125, 0.04388904571533203, 0.04659080505371094, 0.049292564392089844, 0.05199432373046875, 0.054696083068847656, 0.05739784240722656, 0.06009960174560547, 0.06280136108398438, 0.06550312042236328, 0.06820487976074219, 0.0709066390991211, 0.0736083984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 10.0, 10.0, 14.0, 39.0, 60.0, 121.0, 176.0, 209.0, 156.0, 95.0, 52.0, 30.0, 13.0, 11.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4192583560943604, -1.360929012298584, -1.3025997877120972, -1.2442704439163208, -1.1859411001205444, -1.1276118755340576, -1.0692825317382812, -1.0109531879425049, -0.9526238441467285, -0.8942945599555969, -0.8359652161598206, -0.777635931968689, -0.7193065881729126, -0.660977303981781, -0.6026480197906494, -0.544318675994873, -0.48598939180374146, -0.4276600778102875, -0.3693307638168335, -0.3110014796257019, -0.25267213582992554, -0.19434285163879395, -0.13601353764533997, -0.07768422365188599, -0.019354909658432007, 0.038974400609731674, 0.09730371087789536, 0.15563301742076874, 0.21396233141422272, 0.2722916305065155, 0.3306209444999695, 0.38895025849342346, 0.44727957248687744, 0.505608856678009, 0.5639382004737854, 0.622267484664917, 0.6805968284606934, 0.738926112651825, 0.7972553968429565, 0.8555847406387329, 0.9139140844345093, 0.9722433686256409, 1.0305726528167725, 1.0889019966125488, 1.1472313404083252, 1.2055606842041016, 1.2638899087905884, 1.3222192525863647, 1.3805484771728516, 1.438877820968628, 1.4972070455551147, 1.5555363893508911, 1.6138657331466675, 1.6721949577331543, 1.7305243015289307, 1.788853645324707, 1.8471829891204834, 1.9055123329162598, 1.9638415575027466, 2.0221710205078125, 2.0805001258850098, 2.138829469680786, 2.1971588134765625, 2.255488157272339, 2.3138175010681152]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 3.0, 8.0, 13.0, 10.0, 14.0, 10.0, 17.0, 21.0, 17.0, 26.0, 31.0, 39.0, 41.0, 43.0, 40.0, 45.0, 37.0, 44.0, 48.0, 42.0, 44.0, 45.0, 48.0, 37.0, 40.0, 36.0, 28.0, 35.0, 20.0, 21.0, 20.0, 19.0, 10.0, 13.0, 5.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0357482433319092, -1.0045775175094604, -0.9734067916870117, -0.9422361254692078, -0.911065399646759, -0.8798946738243103, -0.8487240076065063, -0.8175532817840576, -0.7863825559616089, -0.7552118301391602, -0.7240411043167114, -0.6928704380989075, -0.6616997122764587, -0.63052898645401, -0.599358320236206, -0.5681875944137573, -0.5370168685913086, -0.5058461427688599, -0.4746754467487335, -0.4435047507286072, -0.41233402490615845, -0.3811632990837097, -0.3499926030635834, -0.31882190704345703, -0.2876511812210083, -0.25648045539855957, -0.22530975937843323, -0.1941390484571457, -0.16296833753585815, -0.13179762661457062, -0.10062691569328308, -0.06945620477199554, -0.03828549385070801, -0.007114782929420471, 0.024055927991867065, 0.0552266389131546, 0.08639734983444214, 0.11756806075572968, 0.1487387716770172, 0.17990948259830475, 0.21108019351959229, 0.24225090444087982, 0.27342161536216736, 0.3045923113822937, 0.33576303720474243, 0.36693376302719116, 0.3981044590473175, 0.42927515506744385, 0.4604458808898926, 0.4916166067123413, 0.52278733253479, 0.553957998752594, 0.5851287245750427, 0.6162994503974915, 0.6474701166152954, 0.6786408424377441, 0.7098115682601929, 0.7409822940826416, 0.7721530199050903, 0.8033236861228943, 0.834494411945343, 0.8656651377677917, 0.8968358039855957, 0.9280065298080444, 0.9591772556304932]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 11.0, 15.0, 26.0, 38.0, 86.0, 147.0, 252.0, 597.0, 1308.0, 3464.0, 12346.0, 76736.0, 3840703.0, 226596.0, 22331.0, 5549.0, 2008.0, 893.0, 479.0, 245.0, 150.0, 84.0, 48.0, 42.0, 31.0, 13.0, 20.0, 12.0, 5.0, 7.0, 10.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3680267333984375, -0.356414794921875, -0.3448028564453125, -0.33319091796875, -0.3215789794921875, -0.309967041015625, -0.2983551025390625, -0.2867431640625, -0.2751312255859375, -0.263519287109375, -0.2519073486328125, -0.24029541015625, -0.2286834716796875, -0.217071533203125, -0.2054595947265625, -0.19384765625, -0.1822357177734375, -0.170623779296875, -0.1590118408203125, -0.14739990234375, -0.1357879638671875, -0.124176025390625, -0.1125640869140625, -0.1009521484375, -0.0893402099609375, -0.077728271484375, -0.0661163330078125, -0.05450439453125, -0.0428924560546875, -0.031280517578125, -0.0196685791015625, -0.008056640625, 0.0035552978515625, 0.015167236328125, 0.0267791748046875, 0.03839111328125, 0.0500030517578125, 0.061614990234375, 0.0732269287109375, 0.0848388671875, 0.0964508056640625, 0.108062744140625, 0.1196746826171875, 0.13128662109375, 0.1428985595703125, 0.154510498046875, 0.1661224365234375, 0.177734375, 0.1893463134765625, 0.200958251953125, 0.2125701904296875, 0.22418212890625, 0.2357940673828125, 0.247406005859375, 0.2590179443359375, 0.2706298828125, 0.2822418212890625, 0.293853759765625, 0.3054656982421875, 0.31707763671875, 0.3286895751953125, 0.340301513671875, 0.3519134521484375, 0.363525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 13.0, 29.0, 29.0, 57.0, 50.0, 82.0, 104.0, 98.0, 93.0, 95.0, 81.0, 68.0, 43.0, 38.0, 30.0, 24.0, 17.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04620361328125, -0.044681549072265625, -0.04315948486328125, -0.041637420654296875, -0.0401153564453125, -0.038593292236328125, -0.03707122802734375, -0.035549163818359375, -0.034027099609375, -0.032505035400390625, -0.03098297119140625, -0.029460906982421875, -0.0279388427734375, -0.026416778564453125, -0.02489471435546875, -0.023372650146484375, -0.0218505859375, -0.020328521728515625, -0.01880645751953125, -0.017284393310546875, -0.0157623291015625, -0.014240264892578125, -0.01271820068359375, -0.011196136474609375, -0.009674072265625, -0.008152008056640625, -0.00662994384765625, -0.005107879638671875, -0.0035858154296875, -0.002063751220703125, -0.00054168701171875, 0.000980377197265625, 0.00250244140625, 0.004024505615234375, 0.00554656982421875, 0.007068634033203125, 0.0085906982421875, 0.010112762451171875, 0.01163482666015625, 0.013156890869140625, 0.014678955078125, 0.016201019287109375, 0.01772308349609375, 0.019245147705078125, 0.0207672119140625, 0.022289276123046875, 0.02381134033203125, 0.025333404541015625, 0.02685546875, 0.028377532958984375, 0.02989959716796875, 0.031421661376953125, 0.0329437255859375, 0.034465789794921875, 0.03598785400390625, 0.037509918212890625, 0.039031982421875, 0.040554046630859375, 0.04207611083984375, 0.043598175048828125, 0.0451202392578125, 0.046642303466796875, 0.04816436767578125, 0.049686431884765625, 0.05120849609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 19.0, 17.0, 41.0, 49.0, 78.0, 150.0, 265.0, 535.0, 1420.0, 4663.0, 21308.0, 195002.0, 3803706.0, 143041.0, 17632.0, 4052.0, 1246.0, 499.0, 234.0, 134.0, 73.0, 40.0, 22.0, 11.0, 17.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3013496398925781, -0.28995513916015625, -0.2785606384277344, -0.2671661376953125, -0.2557716369628906, -0.24437713623046875, -0.23298263549804688, -0.221588134765625, -0.21019363403320312, -0.19879913330078125, -0.18740463256835938, -0.1760101318359375, -0.16461563110351562, -0.15322113037109375, -0.14182662963867188, -0.13043212890625, -0.11903762817382812, -0.10764312744140625, -0.09624862670898438, -0.0848541259765625, -0.07345962524414062, -0.06206512451171875, -0.050670623779296875, -0.039276123046875, -0.027881622314453125, -0.01648712158203125, -0.005092620849609375, 0.0063018798828125, 0.017696380615234375, 0.02909088134765625, 0.040485382080078125, 0.0518798828125, 0.06327438354492188, 0.07466888427734375, 0.08606338500976562, 0.0974578857421875, 0.10885238647460938, 0.12024688720703125, 0.13164138793945312, 0.143035888671875, 0.15443038940429688, 0.16582489013671875, 0.17721939086914062, 0.1886138916015625, 0.20000839233398438, 0.21140289306640625, 0.22279739379882812, 0.23419189453125, 0.24558639526367188, 0.25698089599609375, 0.2683753967285156, 0.2797698974609375, 0.2911643981933594, 0.30255889892578125, 0.3139533996582031, 0.325347900390625, 0.3367424011230469, 0.34813690185546875, 0.3595314025878906, 0.3709259033203125, 0.3823204040527344, 0.39371490478515625, 0.4051094055175781, 0.41650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 10.0, 7.0, 8.0, 24.0, 21.0, 33.0, 83.0, 168.0, 386.0, 2200.0, 672.0, 200.0, 104.0, 59.0, 44.0, 26.0, 9.0, 13.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11410140991210938, -0.11107635498046875, -0.10805130004882812, -0.1050262451171875, -0.10200119018554688, -0.09897613525390625, -0.09595108032226562, -0.092926025390625, -0.08990097045898438, -0.08687591552734375, -0.08385086059570312, -0.0808258056640625, -0.07780075073242188, -0.07477569580078125, -0.07175064086914062, -0.0687255859375, -0.06570053100585938, -0.06267547607421875, -0.059650421142578125, -0.0566253662109375, -0.053600311279296875, -0.05057525634765625, -0.047550201416015625, -0.044525146484375, -0.041500091552734375, -0.03847503662109375, -0.035449981689453125, -0.0324249267578125, -0.029399871826171875, -0.02637481689453125, -0.023349761962890625, -0.02032470703125, -0.017299652099609375, -0.01427459716796875, -0.011249542236328125, -0.0082244873046875, -0.005199432373046875, -0.00217437744140625, 0.000850677490234375, 0.003875732421875, 0.006900787353515625, 0.00992584228515625, 0.012950897216796875, 0.0159759521484375, 0.019001007080078125, 0.02202606201171875, 0.025051116943359375, 0.028076171875, 0.031101226806640625, 0.03412628173828125, 0.037151336669921875, 0.0401763916015625, 0.043201446533203125, 0.04622650146484375, 0.049251556396484375, 0.052276611328125, 0.055301666259765625, 0.05832672119140625, 0.061351776123046875, 0.0643768310546875, 0.06740188598632812, 0.07042694091796875, 0.07345199584960938, 0.07647705078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 16.0, 27.0, 72.0, 125.0, 200.0, 224.0, 166.0, 88.0, 41.0, 22.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7236816883087158, -0.705675482749939, -0.6876692175865173, -0.6696630120277405, -0.6516567468643188, -0.633650541305542, -0.6156443357467651, -0.5976380705833435, -0.5796318650245667, -0.5616256594657898, -0.5436193943023682, -0.5256131887435913, -0.5076069235801697, -0.4896007180213928, -0.4715944826602936, -0.45358824729919434, -0.4355820119380951, -0.41757577657699585, -0.3995695412158966, -0.38156330585479736, -0.3635571002960205, -0.34555086493492126, -0.327544629573822, -0.30953842401504517, -0.29153215885162354, -0.2735259234905243, -0.25551968812942505, -0.237513467669487, -0.21950724720954895, -0.2015010118484497, -0.18349477648735046, -0.16548855602741241, -0.14748233556747437, -0.12947610020637512, -0.11146987974643707, -0.09346364438533783, -0.07545741647481918, -0.05745118856430054, -0.039444953203201294, -0.021438732743263245, -0.0034324973821640015, 0.014573732390999794, 0.03257996216416359, 0.050586193799972534, 0.06859242171049118, 0.08659864962100983, 0.10460488498210907, 0.12261110544204712, 0.14061734080314636, 0.1586235761642456, 0.17662979662418365, 0.1946360319852829, 0.21264225244522095, 0.2306484878063202, 0.24865472316741943, 0.2666609287261963, 0.2846671938896179, 0.30267342925071716, 0.3206796646118164, 0.33868587017059326, 0.3566921055316925, 0.37469834089279175, 0.392704576253891, 0.41071081161499023, 0.4287170171737671]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 11.0, 14.0, 25.0, 29.0, 26.0, 28.0, 24.0, 30.0, 32.0, 35.0, 40.0, 46.0, 38.0, 45.0, 46.0, 45.0, 46.0, 53.0, 34.0, 44.0, 59.0, 35.0, 34.0, 18.0, 25.0, 18.0, 14.0, 19.0, 11.0, 7.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19146603345870972, -0.18510855734348297, -0.17875108122825623, -0.17239362001419067, -0.16603614389896393, -0.15967866778373718, -0.15332119166851044, -0.1469637155532837, -0.14060625433921814, -0.1342487782239914, -0.12789130210876465, -0.1215338334441185, -0.11517636477947235, -0.1088188886642456, -0.10246141254901886, -0.09610393643379211, -0.08974646031856537, -0.08338898420333862, -0.07703151553869247, -0.07067403942346573, -0.06431657075881958, -0.057959094643592834, -0.05160161852836609, -0.04524414613842964, -0.038886673748493195, -0.03252920135855675, -0.02617172710597515, -0.019814252853393555, -0.013456780463457108, -0.00709930807352066, -0.0007418319582939148, 0.005615640431642532, 0.01197311282157898, 0.018330585211515427, 0.024688059464097023, 0.03104553371667862, 0.037403006106615067, 0.043760478496551514, 0.05011795461177826, 0.056475427001714706, 0.06283289939165115, 0.0691903755068779, 0.07554784417152405, 0.0819053202867508, 0.08826279640197754, 0.09462026506662369, 0.10097774118185043, 0.10733520984649658, 0.11369268596172333, 0.12005016207695007, 0.12640763819217682, 0.13276511430740356, 0.13912257552146912, 0.14548005163669586, 0.1518375277519226, 0.15819500386714935, 0.1645524799823761, 0.17090995609760284, 0.1772674322128296, 0.18362489342689514, 0.1899823695421219, 0.19633984565734863, 0.20269732177257538, 0.20905479788780212, 0.21541225910186768]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 9.0, 9.0, 5.0, 14.0, 19.0, 16.0, 34.0, 34.0, 38.0, 56.0, 82.0, 114.0, 125.0, 244.0, 294.0, 454.0, 783.0, 1346.0, 2417.0, 5163.0, 11257.0, 27857.0, 76779.0, 217311.0, 398357.0, 192265.0, 67634.0, 25146.0, 10259.0, 4724.0, 2306.0, 1236.0, 711.0, 463.0, 272.0, 189.0, 135.0, 120.0, 75.0, 50.0, 32.0, 24.0, 20.0, 18.0, 20.0, 15.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1541748046875, -0.14969825744628906, -0.14522171020507812, -0.1407451629638672, -0.13626861572265625, -0.1317920684814453, -0.12731552124023438, -0.12283897399902344, -0.1183624267578125, -0.11388587951660156, -0.10940933227539062, -0.10493278503417969, -0.10045623779296875, -0.09597969055175781, -0.09150314331054688, -0.08702659606933594, -0.082550048828125, -0.07807350158691406, -0.07359695434570312, -0.06912040710449219, -0.06464385986328125, -0.06016731262207031, -0.055690765380859375, -0.05121421813964844, -0.0467376708984375, -0.04226112365722656, -0.037784576416015625, -0.03330802917480469, -0.02883148193359375, -0.024354934692382812, -0.019878387451171875, -0.015401840209960938, -0.01092529296875, -0.0064487457275390625, -0.001972198486328125, 0.0025043487548828125, 0.00698089599609375, 0.011457443237304688, 0.015933990478515625, 0.020410537719726562, 0.0248870849609375, 0.029363632202148438, 0.033840179443359375, 0.03831672668457031, 0.04279327392578125, 0.04726982116699219, 0.051746368408203125, 0.05622291564941406, 0.060699462890625, 0.06517601013183594, 0.06965255737304688, 0.07412910461425781, 0.07860565185546875, 0.08308219909667969, 0.08755874633789062, 0.09203529357910156, 0.0965118408203125, 0.10098838806152344, 0.10546493530273438, 0.10994148254394531, 0.11441802978515625, 0.11889457702636719, 0.12337112426757812, 0.12784767150878906, 0.13232421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 17.0, 25.0, 32.0, 49.0, 62.0, 81.0, 71.0, 98.0, 94.0, 106.0, 79.0, 63.0, 46.0, 35.0, 40.0, 21.0, 16.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040679931640625, -0.03924703598022461, -0.03781414031982422, -0.03638124465942383, -0.03494834899902344, -0.03351545333862305, -0.032082557678222656, -0.030649662017822266, -0.029216766357421875, -0.027783870697021484, -0.026350975036621094, -0.024918079376220703, -0.023485183715820312, -0.022052288055419922, -0.02061939239501953, -0.01918649673461914, -0.01775360107421875, -0.01632070541381836, -0.014887809753417969, -0.013454914093017578, -0.012022018432617188, -0.010589122772216797, -0.009156227111816406, -0.007723331451416016, -0.006290435791015625, -0.004857540130615234, -0.0034246444702148438, -0.001991748809814453, -0.0005588531494140625, 0.0008740425109863281, 0.0023069381713867188, 0.0037398338317871094, 0.0051727294921875, 0.006605625152587891, 0.008038520812988281, 0.009471416473388672, 0.010904312133789062, 0.012337207794189453, 0.013770103454589844, 0.015202999114990234, 0.016635894775390625, 0.018068790435791016, 0.019501686096191406, 0.020934581756591797, 0.022367477416992188, 0.023800373077392578, 0.02523326873779297, 0.02666616439819336, 0.02809906005859375, 0.02953195571899414, 0.03096485137939453, 0.03239774703979492, 0.03383064270019531, 0.0352635383605957, 0.036696434020996094, 0.038129329681396484, 0.039562225341796875, 0.040995121002197266, 0.042428016662597656, 0.04386091232299805, 0.04529380798339844, 0.04672670364379883, 0.04815959930419922, 0.04959249496459961, 0.051025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 5.0, 7.0, 15.0, 18.0, 26.0, 28.0, 38.0, 83.0, 122.0, 176.0, 252.0, 451.0, 769.0, 1533.0, 3762.0, 10068.0, 31500.0, 118679.0, 414501.0, 337663.0, 89792.0, 24733.0, 7981.0, 3069.0, 1422.0, 726.0, 402.0, 254.0, 157.0, 95.0, 81.0, 45.0, 30.0, 31.0, 7.0, 8.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16034507751464844, -0.15479660034179688, -0.1492481231689453, -0.14369964599609375, -0.1381511688232422, -0.13260269165039062, -0.12705421447753906, -0.1215057373046875, -0.11595726013183594, -0.11040878295898438, -0.10486030578613281, -0.09931182861328125, -0.09376335144042969, -0.08821487426757812, -0.08266639709472656, -0.077117919921875, -0.07156944274902344, -0.06602096557617188, -0.06047248840332031, -0.05492401123046875, -0.04937553405761719, -0.043827056884765625, -0.03827857971191406, -0.0327301025390625, -0.027181625366210938, -0.021633148193359375, -0.016084671020507812, -0.01053619384765625, -0.0049877166748046875, 0.000560760498046875, 0.0061092376708984375, 0.01165771484375, 0.017206192016601562, 0.022754669189453125, 0.028303146362304688, 0.03385162353515625, 0.03940010070800781, 0.044948577880859375, 0.05049705505371094, 0.0560455322265625, 0.06159400939941406, 0.06714248657226562, 0.07269096374511719, 0.07823944091796875, 0.08378791809082031, 0.08933639526367188, 0.09488487243652344, 0.100433349609375, 0.10598182678222656, 0.11153030395507812, 0.11707878112792969, 0.12262725830078125, 0.1281757354736328, 0.13372421264648438, 0.13927268981933594, 0.1448211669921875, 0.15036964416503906, 0.15591812133789062, 0.1614665985107422, 0.16701507568359375, 0.1725635528564453, 0.17811203002929688, 0.18366050720214844, 0.189208984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 15.0, 22.0, 27.0, 21.0, 32.0, 26.0, 37.0, 34.0, 38.0, 55.0, 48.0, 54.0, 61.0, 44.0, 55.0, 51.0, 41.0, 49.0, 31.0, 41.0, 44.0, 29.0, 19.0, 25.0, 13.0, 10.0, 7.0, 6.0, 12.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15947532653808594, -0.15427780151367188, -0.1490802764892578, -0.14388275146484375, -0.1386852264404297, -0.13348770141601562, -0.12829017639160156, -0.1230926513671875, -0.11789512634277344, -0.11269760131835938, -0.10750007629394531, -0.10230255126953125, -0.09710502624511719, -0.09190750122070312, -0.08670997619628906, -0.081512451171875, -0.07631492614746094, -0.07111740112304688, -0.06591987609863281, -0.06072235107421875, -0.05552482604980469, -0.050327301025390625, -0.04512977600097656, -0.0399322509765625, -0.03473472595214844, -0.029537200927734375, -0.024339675903320312, -0.01914215087890625, -0.013944625854492188, -0.008747100830078125, -0.0035495758056640625, 0.00164794921875, 0.0068454742431640625, 0.012042999267578125, 0.017240524291992188, 0.02243804931640625, 0.027635574340820312, 0.032833099365234375, 0.03803062438964844, 0.0432281494140625, 0.04842567443847656, 0.053623199462890625, 0.05882072448730469, 0.06401824951171875, 0.06921577453613281, 0.07441329956054688, 0.07961082458496094, 0.084808349609375, 0.09000587463378906, 0.09520339965820312, 0.10040092468261719, 0.10559844970703125, 0.11079597473144531, 0.11599349975585938, 0.12119102478027344, 0.1263885498046875, 0.13158607482910156, 0.13678359985351562, 0.1419811248779297, 0.14717864990234375, 0.1523761749267578, 0.15757369995117188, 0.16277122497558594, 0.16796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 10.0, 8.0, 17.0, 25.0, 35.0, 51.0, 64.0, 115.0, 162.0, 266.0, 489.0, 864.0, 1586.0, 3258.0, 6968.0, 16751.0, 47565.0, 183508.0, 502037.0, 201019.0, 51647.0, 17702.0, 7168.0, 3392.0, 1661.0, 894.0, 502.0, 290.0, 182.0, 103.0, 67.0, 47.0, 32.0, 19.0, 14.0, 11.0, 4.0, 4.0, 5.0, 7.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07781982421875, -0.07535171508789062, -0.07288360595703125, -0.07041549682617188, -0.0679473876953125, -0.06547927856445312, -0.06301116943359375, -0.060543060302734375, -0.058074951171875, -0.055606842041015625, -0.05313873291015625, -0.050670623779296875, -0.0482025146484375, -0.045734405517578125, -0.04326629638671875, -0.040798187255859375, -0.038330078125, -0.035861968994140625, -0.03339385986328125, -0.030925750732421875, -0.0284576416015625, -0.025989532470703125, -0.02352142333984375, -0.021053314208984375, -0.018585205078125, -0.016117095947265625, -0.01364898681640625, -0.011180877685546875, -0.0087127685546875, -0.006244659423828125, -0.00377655029296875, -0.001308441162109375, 0.00115966796875, 0.003627777099609375, 0.00609588623046875, 0.008563995361328125, 0.0110321044921875, 0.013500213623046875, 0.01596832275390625, 0.018436431884765625, 0.020904541015625, 0.023372650146484375, 0.02584075927734375, 0.028308868408203125, 0.0307769775390625, 0.033245086669921875, 0.03571319580078125, 0.038181304931640625, 0.0406494140625, 0.043117523193359375, 0.04558563232421875, 0.048053741455078125, 0.0505218505859375, 0.052989959716796875, 0.05545806884765625, 0.057926177978515625, 0.060394287109375, 0.06286239624023438, 0.06533050537109375, 0.06779861450195312, 0.0702667236328125, 0.07273483276367188, 0.07520294189453125, 0.07767105102539062, 0.08013916015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 18.0, 13.0, 22.0, 16.0, 22.0, 24.0, 29.0, 34.0, 27.0, 45.0, 52.0, 61.0, 65.0, 65.0, 67.0, 55.0, 70.0, 53.0, 40.0, 37.0, 37.0, 32.0, 13.0, 17.0, 16.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.0889565348625183e-05, -2.014264464378357e-05, -1.9395723938941956e-05, -1.8648803234100342e-05, -1.7901882529258728e-05, -1.7154961824417114e-05, -1.64080411195755e-05, -1.5661120414733887e-05, -1.4914199709892273e-05, -1.416727900505066e-05, -1.3420358300209045e-05, -1.2673437595367432e-05, -1.1926516890525818e-05, -1.1179596185684204e-05, -1.043267548084259e-05, -9.685754776000977e-06, -8.938834071159363e-06, -8.191913366317749e-06, -7.444992661476135e-06, -6.6980719566345215e-06, -5.951151251792908e-06, -5.204230546951294e-06, -4.45730984210968e-06, -3.7103891372680664e-06, -2.9634684324264526e-06, -2.216547727584839e-06, -1.469627022743225e-06, -7.227063179016113e-07, 2.421438694000244e-08, 7.711350917816162e-07, 1.51805579662323e-06, 2.2649765014648438e-06, 3.0118972063064575e-06, 3.7588179111480713e-06, 4.505738615989685e-06, 5.252659320831299e-06, 5.999580025672913e-06, 6.746500730514526e-06, 7.49342143535614e-06, 8.240342140197754e-06, 8.987262845039368e-06, 9.734183549880981e-06, 1.0481104254722595e-05, 1.1228024959564209e-05, 1.1974945664405823e-05, 1.2721866369247437e-05, 1.346878707408905e-05, 1.4215707778930664e-05, 1.4962628483772278e-05, 1.570954918861389e-05, 1.6456469893455505e-05, 1.720339059829712e-05, 1.7950311303138733e-05, 1.8697232007980347e-05, 1.944415271282196e-05, 2.0191073417663574e-05, 2.0937994122505188e-05, 2.1684914827346802e-05, 2.2431835532188416e-05, 2.317875623703003e-05, 2.3925676941871643e-05, 2.4672597646713257e-05, 2.541951835155487e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 4.0, 5.0, 6.0, 1.0, 9.0, 12.0, 16.0, 21.0, 33.0, 64.0, 86.0, 138.0, 250.0, 474.0, 924.0, 1936.0, 4957.0, 14525.0, 60555.0, 472016.0, 416408.0, 54288.0, 13481.0, 4526.0, 1889.0, 850.0, 444.0, 232.0, 141.0, 94.0, 55.0, 38.0, 23.0, 19.0, 8.0, 10.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1162109375, -0.11257553100585938, -0.10894012451171875, -0.10530471801757812, -0.1016693115234375, -0.09803390502929688, -0.09439849853515625, -0.09076309204101562, -0.087127685546875, -0.08349227905273438, -0.07985687255859375, -0.07622146606445312, -0.0725860595703125, -0.06895065307617188, -0.06531524658203125, -0.061679840087890625, -0.05804443359375, -0.054409027099609375, -0.05077362060546875, -0.047138214111328125, -0.0435028076171875, -0.039867401123046875, -0.03623199462890625, -0.032596588134765625, -0.028961181640625, -0.025325775146484375, -0.02169036865234375, -0.018054962158203125, -0.0144195556640625, -0.010784149169921875, -0.00714874267578125, -0.003513336181640625, 0.0001220703125, 0.003757476806640625, 0.00739288330078125, 0.011028289794921875, 0.0146636962890625, 0.018299102783203125, 0.02193450927734375, 0.025569915771484375, 0.029205322265625, 0.032840728759765625, 0.03647613525390625, 0.040111541748046875, 0.0437469482421875, 0.047382354736328125, 0.05101776123046875, 0.054653167724609375, 0.05828857421875, 0.061923980712890625, 0.06555938720703125, 0.06919479370117188, 0.0728302001953125, 0.07646560668945312, 0.08010101318359375, 0.08373641967773438, 0.087371826171875, 0.09100723266601562, 0.09464263916015625, 0.09827804565429688, 0.1019134521484375, 0.10554885864257812, 0.10918426513671875, 0.11281967163085938, 0.116455078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 8.0, 5.0, 9.0, 14.0, 22.0, 23.0, 31.0, 48.0, 81.0, 88.0, 97.0, 120.0, 113.0, 80.0, 80.0, 40.0, 34.0, 19.0, 9.0, 15.0, 14.0, 11.0, 11.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08917236328125, -0.08665657043457031, -0.08414077758789062, -0.08162498474121094, -0.07910919189453125, -0.07659339904785156, -0.07407760620117188, -0.07156181335449219, -0.0690460205078125, -0.06653022766113281, -0.06401443481445312, -0.06149864196777344, -0.05898284912109375, -0.05646705627441406, -0.053951263427734375, -0.05143547058105469, -0.048919677734375, -0.04640388488769531, -0.043888092041015625, -0.04137229919433594, -0.03885650634765625, -0.03634071350097656, -0.033824920654296875, -0.03130912780761719, -0.0287933349609375, -0.026277542114257812, -0.023761749267578125, -0.021245956420898438, -0.01873016357421875, -0.016214370727539062, -0.013698577880859375, -0.011182785034179688, -0.0086669921875, -0.0061511993408203125, -0.003635406494140625, -0.0011196136474609375, 0.00139617919921875, 0.0039119720458984375, 0.006427764892578125, 0.008943557739257812, 0.0114593505859375, 0.013975143432617188, 0.016490936279296875, 0.019006729125976562, 0.02152252197265625, 0.024038314819335938, 0.026554107666015625, 0.029069900512695312, 0.031585693359375, 0.03410148620605469, 0.036617279052734375, 0.03913307189941406, 0.04164886474609375, 0.04416465759277344, 0.046680450439453125, 0.04919624328613281, 0.0517120361328125, 0.05422782897949219, 0.056743621826171875, 0.05925941467285156, 0.06177520751953125, 0.06429100036621094, 0.06680679321289062, 0.06932258605957031, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 19.0, 32.0, 57.0, 108.0, 170.0, 187.0, 178.0, 122.0, 54.0, 32.0, 19.0, 13.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748592853546143, -1.1267269849777222, -1.07859468460083, -1.030462384223938, -0.9823301434516907, -0.9341978430747986, -0.8860656023025513, -0.8379333019256592, -0.7898010015487671, -0.741668701171875, -0.6935364007949829, -0.6454041600227356, -0.5972718596458435, -0.5491395592689514, -0.5010073184967041, -0.452875018119812, -0.4047427177429199, -0.35661041736602783, -0.30847814679145813, -0.2603458762168884, -0.21221357583999634, -0.16408129036426544, -0.11594900488853455, -0.06781673431396484, -0.019684433937072754, 0.028447851538658142, 0.07658013701438904, 0.12471242249011993, 0.17284470796585083, 0.22097699344158173, 0.2691092789173126, 0.3172415494918823, 0.3653738498687744, 0.4135061502456665, 0.4616384208202362, 0.5097706913948059, 0.557902991771698, 0.6060352921485901, 0.6541675329208374, 0.7022998332977295, 0.7504321336746216, 0.7985644340515137, 0.8466967344284058, 0.8948289752006531, 0.9429612755775452, 0.9910935759544373, 1.0392258167266846, 1.0873581171035767, 1.1354904174804688, 1.1836227178573608, 1.231755018234253, 1.279887318611145, 1.328019618988037, 1.3761518001556396, 1.4242841005325317, 1.4724164009094238, 1.520548701286316, 1.568681001663208, 1.6168133020401, 1.6649456024169922, 1.7130777835845947, 1.7612100839614868, 1.809342384338379, 1.857474684715271, 1.905606985092163]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 9.0, 7.0, 3.0, 15.0, 9.0, 8.0, 18.0, 20.0, 26.0, 35.0, 39.0, 39.0, 48.0, 36.0, 49.0, 43.0, 65.0, 58.0, 46.0, 54.0, 54.0, 38.0, 44.0, 27.0, 38.0, 32.0, 29.0, 23.0, 11.0, 17.0, 12.0, 12.0, 9.0, 6.0, 7.0, 9.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8695246577262878, -0.8401280641555786, -0.8107314109802246, -0.7813347578048706, -0.7519381642341614, -0.7225415706634521, -0.6931449174880981, -0.6637482643127441, -0.6343516707420349, -0.6049550771713257, -0.5755584239959717, -0.5461617708206177, -0.5167651772499084, -0.48736855387687683, -0.4579719305038452, -0.4285753071308136, -0.399178683757782, -0.36978206038475037, -0.34038543701171875, -0.31098881363868713, -0.2815921902656555, -0.2521955668926239, -0.22279894351959229, -0.19340232014656067, -0.16400569677352905, -0.13460907340049744, -0.10521245002746582, -0.0758158266544342, -0.04641920328140259, -0.01702257990837097, 0.012374043464660645, 0.04177066683769226, 0.0711672306060791, 0.10056385397911072, 0.12996047735214233, 0.15935710072517395, 0.18875372409820557, 0.21815034747123718, 0.2475469708442688, 0.2769435942173004, 0.30634021759033203, 0.33573684096336365, 0.36513346433639526, 0.3945300877094269, 0.4239267110824585, 0.4533233344554901, 0.48271995782852173, 0.512116551399231, 0.541513204574585, 0.570909857749939, 0.6003064513206482, 0.6297030448913574, 0.6590996980667114, 0.6884963512420654, 0.7178929448127747, 0.7472895383834839, 0.7766861915588379, 0.8060828447341919, 0.8354794383049011, 0.8648760318756104, 0.8942726850509644, 0.9236693382263184, 0.9530659317970276, 0.9824625253677368, 1.0118591785430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 6.0, 7.0, 11.0, 18.0, 25.0, 59.0, 116.0, 251.0, 652.0, 1838.0, 6783.0, 35274.0, 3599826.0, 515807.0, 25189.0, 5415.0, 1684.0, 627.0, 309.0, 145.0, 99.0, 55.0, 32.0, 16.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41162109375, -0.4004707336425781, -0.38932037353515625, -0.3781700134277344, -0.3670196533203125, -0.3558692932128906, -0.34471893310546875, -0.3335685729980469, -0.322418212890625, -0.3112678527832031, -0.30011749267578125, -0.2889671325683594, -0.2778167724609375, -0.2666664123535156, -0.25551605224609375, -0.24436569213867188, -0.23321533203125, -0.22206497192382812, -0.21091461181640625, -0.19976425170898438, -0.1886138916015625, -0.17746353149414062, -0.16631317138671875, -0.15516281127929688, -0.144012451171875, -0.13286209106445312, -0.12171173095703125, -0.11056137084960938, -0.0994110107421875, -0.08826065063476562, -0.07711029052734375, -0.06595993041992188, -0.0548095703125, -0.043659210205078125, -0.03250885009765625, -0.021358489990234375, -0.0102081298828125, 0.000942230224609375, 0.01209259033203125, 0.023242950439453125, 0.034393310546875, 0.045543670654296875, 0.05669403076171875, 0.06784439086914062, 0.0789947509765625, 0.09014511108398438, 0.10129547119140625, 0.11244583129882812, 0.12359619140625, 0.13474655151367188, 0.14589691162109375, 0.15704727172851562, 0.1681976318359375, 0.17934799194335938, 0.19049835205078125, 0.20164871215820312, 0.212799072265625, 0.22394943237304688, 0.23509979248046875, 0.24625015258789062, 0.2574005126953125, 0.2685508728027344, 0.27970123291015625, 0.2908515930175781, 0.302001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 5.0, 7.0, 14.0, 15.0, 24.0, 21.0, 42.0, 62.0, 81.0, 79.0, 72.0, 90.0, 94.0, 100.0, 74.0, 52.0, 48.0, 34.0, 29.0, 17.0, 10.0, 11.0, 13.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047088623046875, -0.04561185836791992, -0.044135093688964844, -0.042658329010009766, -0.04118156433105469, -0.03970479965209961, -0.03822803497314453, -0.03675127029418945, -0.035274505615234375, -0.0337977409362793, -0.03232097625732422, -0.03084421157836914, -0.029367446899414062, -0.027890682220458984, -0.026413917541503906, -0.024937152862548828, -0.02346038818359375, -0.021983623504638672, -0.020506858825683594, -0.019030094146728516, -0.017553329467773438, -0.01607656478881836, -0.014599800109863281, -0.013123035430908203, -0.011646270751953125, -0.010169506072998047, -0.008692741394042969, -0.007215976715087891, -0.0057392120361328125, -0.004262447357177734, -0.0027856826782226562, -0.0013089179992675781, 0.0001678466796875, 0.0016446113586425781, 0.0031213760375976562, 0.004598140716552734, 0.0060749053955078125, 0.007551670074462891, 0.009028434753417969, 0.010505199432373047, 0.011981964111328125, 0.013458728790283203, 0.014935493469238281, 0.01641225814819336, 0.017889022827148438, 0.019365787506103516, 0.020842552185058594, 0.022319316864013672, 0.02379608154296875, 0.025272846221923828, 0.026749610900878906, 0.028226375579833984, 0.029703140258789062, 0.03117990493774414, 0.03265666961669922, 0.0341334342956543, 0.035610198974609375, 0.03708696365356445, 0.03856372833251953, 0.04004049301147461, 0.04151725769042969, 0.042994022369384766, 0.044470787048339844, 0.04594755172729492, 0.04742431640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 9.0, 23.0, 24.0, 57.0, 77.0, 125.0, 248.0, 553.0, 1233.0, 3239.0, 10296.0, 47230.0, 634711.0, 3395821.0, 78785.0, 14724.0, 4217.0, 1513.0, 682.0, 290.0, 167.0, 109.0, 53.0, 39.0, 13.0, 19.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29577064514160156, -0.2875862121582031, -0.2794017791748047, -0.27121734619140625, -0.2630329132080078, -0.2548484802246094, -0.24666404724121094, -0.2384796142578125, -0.23029518127441406, -0.22211074829101562, -0.2139263153076172, -0.20574188232421875, -0.1975574493408203, -0.18937301635742188, -0.18118858337402344, -0.173004150390625, -0.16481971740722656, -0.15663528442382812, -0.1484508514404297, -0.14026641845703125, -0.1320819854736328, -0.12389755249023438, -0.11571311950683594, -0.1075286865234375, -0.09934425354003906, -0.09115982055664062, -0.08297538757324219, -0.07479095458984375, -0.06660652160644531, -0.058422088623046875, -0.05023765563964844, -0.04205322265625, -0.03386878967285156, -0.025684356689453125, -0.017499923706054688, -0.00931549072265625, -0.0011310577392578125, 0.007053375244140625, 0.015237808227539062, 0.0234222412109375, 0.03160667419433594, 0.039791107177734375, 0.04797554016113281, 0.05615997314453125, 0.06434440612792969, 0.07252883911132812, 0.08071327209472656, 0.088897705078125, 0.09708213806152344, 0.10526657104492188, 0.11345100402832031, 0.12163543701171875, 0.1298198699951172, 0.13800430297851562, 0.14618873596191406, 0.1543731689453125, 0.16255760192871094, 0.17074203491210938, 0.1789264678955078, 0.18711090087890625, 0.1952953338623047, 0.20347976684570312, 0.21166419982910156, 0.2198486328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 11.0, 8.0, 8.0, 13.0, 19.0, 17.0, 25.0, 43.0, 41.0, 73.0, 100.0, 177.0, 337.0, 1547.0, 881.0, 295.0, 138.0, 98.0, 52.0, 46.0, 22.0, 25.0, 19.0, 13.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04449462890625, -0.04309892654418945, -0.041703224182128906, -0.04030752182006836, -0.03891181945800781, -0.037516117095947266, -0.03612041473388672, -0.03472471237182617, -0.033329010009765625, -0.03193330764770508, -0.03053760528564453, -0.029141902923583984, -0.027746200561523438, -0.02635049819946289, -0.024954795837402344, -0.023559093475341797, -0.02216339111328125, -0.020767688751220703, -0.019371986389160156, -0.01797628402709961, -0.016580581665039062, -0.015184879302978516, -0.013789176940917969, -0.012393474578857422, -0.010997772216796875, -0.009602069854736328, -0.008206367492675781, -0.006810665130615234, -0.0054149627685546875, -0.004019260406494141, -0.0026235580444335938, -0.0012278556823730469, 0.0001678466796875, 0.0015635490417480469, 0.0029592514038085938, 0.004354953765869141, 0.0057506561279296875, 0.007146358489990234, 0.008542060852050781, 0.009937763214111328, 0.011333465576171875, 0.012729167938232422, 0.014124870300292969, 0.015520572662353516, 0.016916275024414062, 0.01831197738647461, 0.019707679748535156, 0.021103382110595703, 0.02249908447265625, 0.023894786834716797, 0.025290489196777344, 0.02668619155883789, 0.028081893920898438, 0.029477596282958984, 0.03087329864501953, 0.03226900100708008, 0.033664703369140625, 0.03506040573120117, 0.03645610809326172, 0.037851810455322266, 0.03924751281738281, 0.04064321517944336, 0.042038917541503906, 0.04343461990356445, 0.044830322265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 11.0, 25.0, 21.0, 42.0, 76.0, 101.0, 118.0, 109.0, 128.0, 110.0, 75.0, 65.0, 36.0, 24.0, 19.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2542146146297455, -0.24508729577064514, -0.2359599769115448, -0.22683264315128326, -0.21770532429218292, -0.20857800543308258, -0.19945067167282104, -0.1903233528137207, -0.18119603395462036, -0.17206871509552002, -0.16294139623641968, -0.15381406247615814, -0.1446867436170578, -0.13555942475795746, -0.12643209099769592, -0.11730477213859558, -0.10817745327949524, -0.0990501344203949, -0.08992280811071396, -0.08079548180103302, -0.07166816294193268, -0.06254084408283234, -0.0534135177731514, -0.04428619146347046, -0.03515887260437012, -0.026031550019979477, -0.016904227435588837, -0.007776904851198196, 0.0013504177331924438, 0.010477740317583084, 0.019605062901973724, 0.028732389211654663, 0.03785967826843262, 0.04698700085282326, 0.0561143234372139, 0.06524164974689484, 0.07436896860599518, 0.08349628746509552, 0.09262361377477646, 0.1017509400844574, 0.11087825894355774, 0.12000557780265808, 0.12913289666175842, 0.13826023042201996, 0.1473875492811203, 0.15651486814022064, 0.16564220190048218, 0.17476952075958252, 0.18389683961868286, 0.1930241584777832, 0.20215147733688354, 0.21127881109714508, 0.22040612995624542, 0.22953344881534576, 0.2386607825756073, 0.24778810143470764, 0.256915420293808, 0.2660427391529083, 0.27517005801200867, 0.284297376871109, 0.29342472553253174, 0.3025520443916321, 0.3116793632507324, 0.32080668210983276, 0.3299340009689331]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 1.0, 6.0, 7.0, 8.0, 11.0, 17.0, 18.0, 28.0, 19.0, 18.0, 30.0, 31.0, 31.0, 32.0, 32.0, 42.0, 41.0, 43.0, 34.0, 36.0, 51.0, 38.0, 53.0, 40.0, 25.0, 32.0, 29.0, 27.0, 32.0, 23.0, 24.0, 24.0, 15.0, 16.0, 12.0, 19.0, 14.0, 5.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.14361059665679932, -0.13893955945968628, -0.13426853716373444, -0.1295975148677826, -0.12492647767066956, -0.12025544792413712, -0.11558441817760468, -0.11091338843107224, -0.1062423586845398, -0.10157132893800735, -0.09690029919147491, -0.09222926944494247, -0.08755823969841003, -0.0828872099518776, -0.07821618020534515, -0.07354515045881271, -0.06887412071228027, -0.06420309096574783, -0.05953206121921539, -0.05486103147268295, -0.05019000172615051, -0.04551897197961807, -0.04084794223308563, -0.03617691248655319, -0.03150588274002075, -0.026834852993488312, -0.02216382324695587, -0.01749279350042343, -0.012821763753890991, -0.008150734007358551, -0.003479704260826111, 0.0011913254857063293, 0.0058623552322387695, 0.01053338497877121, 0.01520441472530365, 0.01987544447183609, 0.02454647421836853, 0.02921750396490097, 0.03388853371143341, 0.03855956345796585, 0.04323059320449829, 0.04790162295103073, 0.05257265269756317, 0.05724368244409561, 0.06191471219062805, 0.06658574193716049, 0.07125677168369293, 0.07592780143022537, 0.08059883117675781, 0.08526986092329025, 0.08994089066982269, 0.09461192041635513, 0.09928295016288757, 0.10395397990942001, 0.10862500965595245, 0.1132960394024849, 0.11796706914901733, 0.12263809889554977, 0.12730912864208221, 0.13198015093803406, 0.1366511881351471, 0.14132222533226013, 0.14599324762821198, 0.15066426992416382, 0.15533530712127686]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 9.0, 15.0, 11.0, 35.0, 49.0, 52.0, 108.0, 174.0, 300.0, 498.0, 865.0, 1681.0, 3649.0, 8800.0, 24380.0, 77122.0, 256678.0, 432966.0, 163272.0, 49835.0, 16294.0, 6100.0, 2656.0, 1284.0, 677.0, 386.0, 242.0, 125.0, 74.0, 72.0, 39.0, 26.0, 18.0, 13.0, 15.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1630859375, -0.15833282470703125, -0.1535797119140625, -0.14882659912109375, -0.144073486328125, -0.13932037353515625, -0.1345672607421875, -0.12981414794921875, -0.12506103515625, -0.12030792236328125, -0.1155548095703125, -0.11080169677734375, -0.106048583984375, -0.10129547119140625, -0.0965423583984375, -0.09178924560546875, -0.0870361328125, -0.08228302001953125, -0.0775299072265625, -0.07277679443359375, -0.068023681640625, -0.06327056884765625, -0.0585174560546875, -0.05376434326171875, -0.04901123046875, -0.04425811767578125, -0.0395050048828125, -0.03475189208984375, -0.029998779296875, -0.02524566650390625, -0.0204925537109375, -0.01573944091796875, -0.010986328125, -0.00623321533203125, -0.0014801025390625, 0.00327301025390625, 0.008026123046875, 0.01277923583984375, 0.0175323486328125, 0.02228546142578125, 0.02703857421875, 0.03179168701171875, 0.0365447998046875, 0.04129791259765625, 0.046051025390625, 0.05080413818359375, 0.0555572509765625, 0.06031036376953125, 0.0650634765625, 0.06981658935546875, 0.0745697021484375, 0.07932281494140625, 0.084075927734375, 0.08882904052734375, 0.0935821533203125, 0.09833526611328125, 0.10308837890625, 0.10784149169921875, 0.1125946044921875, 0.11734771728515625, 0.122100830078125, 0.12685394287109375, 0.1316070556640625, 0.13636016845703125, 0.14111328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 6.0, 13.0, 23.0, 29.0, 38.0, 45.0, 56.0, 71.0, 73.0, 75.0, 89.0, 89.0, 76.0, 62.0, 59.0, 46.0, 37.0, 32.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04115629196166992, -0.039771080017089844, -0.038385868072509766, -0.03700065612792969, -0.03561544418334961, -0.03423023223876953, -0.03284502029418945, -0.031459808349609375, -0.030074596405029297, -0.02868938446044922, -0.02730417251586914, -0.025918960571289062, -0.024533748626708984, -0.023148536682128906, -0.021763324737548828, -0.02037811279296875, -0.018992900848388672, -0.017607688903808594, -0.016222476959228516, -0.014837265014648438, -0.01345205307006836, -0.012066841125488281, -0.010681629180908203, -0.009296417236328125, -0.007911205291748047, -0.006525993347167969, -0.005140781402587891, -0.0037555694580078125, -0.0023703575134277344, -0.0009851455688476562, 0.0004000663757324219, 0.0017852783203125, 0.003170490264892578, 0.004555702209472656, 0.005940914154052734, 0.0073261260986328125, 0.00871133804321289, 0.010096549987792969, 0.011481761932373047, 0.012866973876953125, 0.014252185821533203, 0.01563739776611328, 0.01702260971069336, 0.018407821655273438, 0.019793033599853516, 0.021178245544433594, 0.022563457489013672, 0.02394866943359375, 0.025333881378173828, 0.026719093322753906, 0.028104305267333984, 0.029489517211914062, 0.03087472915649414, 0.03225994110107422, 0.0336451530456543, 0.035030364990234375, 0.03641557693481445, 0.03780078887939453, 0.03918600082397461, 0.04057121276855469, 0.041956424713134766, 0.043341636657714844, 0.04472684860229492, 0.046112060546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 19.0, 28.0, 41.0, 49.0, 85.0, 152.0, 243.0, 447.0, 879.0, 1870.0, 5242.0, 19394.0, 90482.0, 428159.0, 393802.0, 81557.0, 17528.0, 4867.0, 1843.0, 784.0, 451.0, 263.0, 136.0, 70.0, 52.0, 38.0, 19.0, 10.0, 6.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.11526012420654297, -0.10948753356933594, -0.1037149429321289, -0.09794235229492188, -0.09216976165771484, -0.08639717102050781, -0.08062458038330078, -0.07485198974609375, -0.06907939910888672, -0.06330680847167969, -0.057534217834472656, -0.051761627197265625, -0.045989036560058594, -0.04021644592285156, -0.03444385528564453, -0.0286712646484375, -0.02289867401123047, -0.017126083374023438, -0.011353492736816406, -0.005580902099609375, 0.00019168853759765625, 0.0059642791748046875, 0.011736869812011719, 0.01750946044921875, 0.02328205108642578, 0.029054641723632812, 0.034827232360839844, 0.040599822998046875, 0.046372413635253906, 0.05214500427246094, 0.05791759490966797, 0.063690185546875, 0.06946277618408203, 0.07523536682128906, 0.0810079574584961, 0.08678054809570312, 0.09255313873291016, 0.09832572937011719, 0.10409832000732422, 0.10987091064453125, 0.11564350128173828, 0.12141609191894531, 0.12718868255615234, 0.13296127319335938, 0.1387338638305664, 0.14450645446777344, 0.15027904510498047, 0.1560516357421875, 0.16182422637939453, 0.16759681701660156, 0.1733694076538086, 0.17914199829101562, 0.18491458892822266, 0.1906871795654297, 0.19645977020263672, 0.20223236083984375, 0.20800495147705078, 0.2137775421142578, 0.21955013275146484, 0.22532272338867188, 0.2310953140258789, 0.23686790466308594, 0.24264049530029297, 0.2484130859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 10.0, 22.0, 15.0, 15.0, 25.0, 24.0, 38.0, 35.0, 36.0, 46.0, 50.0, 52.0, 52.0, 43.0, 57.0, 41.0, 63.0, 52.0, 43.0, 35.0, 36.0, 33.0, 29.0, 29.0, 24.0, 22.0, 12.0, 9.0, 5.0, 12.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11395263671875, -0.1092233657836914, -0.10449409484863281, -0.09976482391357422, -0.09503555297851562, -0.09030628204345703, -0.08557701110839844, -0.08084774017333984, -0.07611846923828125, -0.07138919830322266, -0.06665992736816406, -0.06193065643310547, -0.057201385498046875, -0.05247211456298828, -0.04774284362792969, -0.043013572692871094, -0.0382843017578125, -0.033555030822753906, -0.028825759887695312, -0.02409648895263672, -0.019367218017578125, -0.014637947082519531, -0.009908676147460938, -0.005179405212402344, -0.00045013427734375, 0.004279136657714844, 0.009008407592773438, 0.013737678527832031, 0.018466949462890625, 0.02319622039794922, 0.027925491333007812, 0.032654762268066406, 0.037384033203125, 0.042113304138183594, 0.04684257507324219, 0.05157184600830078, 0.056301116943359375, 0.06103038787841797, 0.06575965881347656, 0.07048892974853516, 0.07521820068359375, 0.07994747161865234, 0.08467674255371094, 0.08940601348876953, 0.09413528442382812, 0.09886455535888672, 0.10359382629394531, 0.1083230972290039, 0.1130523681640625, 0.1177816390991211, 0.12251091003417969, 0.12724018096923828, 0.13196945190429688, 0.13669872283935547, 0.14142799377441406, 0.14615726470947266, 0.15088653564453125, 0.15561580657958984, 0.16034507751464844, 0.16507434844970703, 0.16980361938476562, 0.17453289031982422, 0.1792621612548828, 0.1839914321899414, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 21.0, 28.0, 37.0, 54.0, 92.0, 142.0, 221.0, 324.0, 590.0, 1064.0, 1897.0, 3868.0, 8177.0, 20205.0, 62332.0, 258846.0, 478556.0, 146678.0, 38714.0, 14047.0, 6157.0, 2944.0, 1480.0, 820.0, 472.0, 274.0, 174.0, 117.0, 64.0, 44.0, 31.0, 23.0, 12.0, 14.0, 9.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059539794921875, -0.057436466217041016, -0.05533313751220703, -0.05322980880737305, -0.05112648010253906, -0.04902315139770508, -0.046919822692871094, -0.04481649398803711, -0.042713165283203125, -0.04060983657836914, -0.038506507873535156, -0.03640317916870117, -0.03429985046386719, -0.0321965217590332, -0.03009319305419922, -0.027989864349365234, -0.02588653564453125, -0.023783206939697266, -0.02167987823486328, -0.019576549530029297, -0.017473220825195312, -0.015369892120361328, -0.013266563415527344, -0.01116323471069336, -0.009059906005859375, -0.006956577301025391, -0.004853248596191406, -0.002749919891357422, -0.0006465911865234375, 0.0014567375183105469, 0.0035600662231445312, 0.005663394927978516, 0.0077667236328125, 0.009870052337646484, 0.011973381042480469, 0.014076709747314453, 0.016180038452148438, 0.018283367156982422, 0.020386695861816406, 0.02249002456665039, 0.024593353271484375, 0.02669668197631836, 0.028800010681152344, 0.030903339385986328, 0.03300666809082031, 0.0351099967956543, 0.03721332550048828, 0.039316654205322266, 0.04141998291015625, 0.043523311614990234, 0.04562664031982422, 0.0477299690246582, 0.04983329772949219, 0.05193662643432617, 0.054039955139160156, 0.05614328384399414, 0.058246612548828125, 0.06034994125366211, 0.062453269958496094, 0.06455659866333008, 0.06665992736816406, 0.06876325607299805, 0.07086658477783203, 0.07296991348266602, 0.0750732421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 6.0, 11.0, 13.0, 29.0, 39.0, 38.0, 66.0, 70.0, 81.0, 86.0, 99.0, 102.0, 87.0, 76.0, 58.0, 27.0, 32.0, 19.0, 16.0, 11.0, 8.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.080815076828003e-05, -2.942979335784912e-05, -2.8051435947418213e-05, -2.6673078536987305e-05, -2.5294721126556396e-05, -2.3916363716125488e-05, -2.253800630569458e-05, -2.1159648895263672e-05, -1.9781291484832764e-05, -1.8402934074401855e-05, -1.7024576663970947e-05, -1.564621925354004e-05, -1.4267861843109131e-05, -1.2889504432678223e-05, -1.1511147022247314e-05, -1.0132789611816406e-05, -8.754432201385498e-06, -7.37607479095459e-06, -5.997717380523682e-06, -4.6193599700927734e-06, -3.2410025596618652e-06, -1.862645149230957e-06, -4.842877388000488e-07, 8.940696716308594e-07, 2.2724270820617676e-06, 3.6507844924926758e-06, 5.029141902923584e-06, 6.407499313354492e-06, 7.7858567237854e-06, 9.164214134216309e-06, 1.0542571544647217e-05, 1.1920928955078125e-05, 1.3299286365509033e-05, 1.4677643775939941e-05, 1.605600118637085e-05, 1.7434358596801758e-05, 1.8812716007232666e-05, 2.0191073417663574e-05, 2.1569430828094482e-05, 2.294778823852539e-05, 2.43261456489563e-05, 2.5704503059387207e-05, 2.7082860469818115e-05, 2.8461217880249023e-05, 2.983957529067993e-05, 3.121793270111084e-05, 3.259629011154175e-05, 3.3974647521972656e-05, 3.5353004932403564e-05, 3.673136234283447e-05, 3.810971975326538e-05, 3.948807716369629e-05, 4.08664345741272e-05, 4.2244791984558105e-05, 4.3623149394989014e-05, 4.500150680541992e-05, 4.637986421585083e-05, 4.775822162628174e-05, 4.9136579036712646e-05, 5.0514936447143555e-05, 5.189329385757446e-05, 5.327165126800537e-05, 5.465000867843628e-05, 5.602836608886719e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 30.0, 55.0, 73.0, 127.0, 239.0, 346.0, 739.0, 1440.0, 3248.0, 8354.0, 25193.0, 112008.0, 573650.0, 256185.0, 44735.0, 12963.0, 4837.0, 2065.0, 998.0, 494.0, 281.0, 158.0, 90.0, 63.0, 35.0, 30.0, 16.0, 16.0, 10.0, 9.0, 0.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07752513885498047, -0.07472801208496094, -0.0719308853149414, -0.06913375854492188, -0.06633663177490234, -0.06353950500488281, -0.06074237823486328, -0.05794525146484375, -0.05514812469482422, -0.05235099792480469, -0.049553871154785156, -0.046756744384765625, -0.043959617614746094, -0.04116249084472656, -0.03836536407470703, -0.0355682373046875, -0.03277111053466797, -0.029973983764648438, -0.027176856994628906, -0.024379730224609375, -0.021582603454589844, -0.018785476684570312, -0.01598834991455078, -0.01319122314453125, -0.010394096374511719, -0.0075969696044921875, -0.004799842834472656, -0.002002716064453125, 0.0007944107055664062, 0.0035915374755859375, 0.006388664245605469, 0.009185791015625, 0.011982917785644531, 0.014780044555664062, 0.017577171325683594, 0.020374298095703125, 0.023171424865722656, 0.025968551635742188, 0.02876567840576172, 0.03156280517578125, 0.03435993194580078, 0.03715705871582031, 0.039954185485839844, 0.042751312255859375, 0.045548439025878906, 0.04834556579589844, 0.05114269256591797, 0.0539398193359375, 0.05673694610595703, 0.05953407287597656, 0.062331199645996094, 0.06512832641601562, 0.06792545318603516, 0.07072257995605469, 0.07351970672607422, 0.07631683349609375, 0.07911396026611328, 0.08191108703613281, 0.08470821380615234, 0.08750534057617188, 0.0903024673461914, 0.09309959411621094, 0.09589672088623047, 0.09869384765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 7.0, 13.0, 12.0, 24.0, 29.0, 51.0, 59.0, 77.0, 93.0, 88.0, 109.0, 87.0, 66.0, 77.0, 61.0, 29.0, 24.0, 26.0, 13.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056732177734375, -0.05472898483276367, -0.052725791931152344, -0.050722599029541016, -0.04871940612792969, -0.04671621322631836, -0.04471302032470703, -0.0427098274230957, -0.040706634521484375, -0.03870344161987305, -0.03670024871826172, -0.03469705581665039, -0.03269386291503906, -0.030690670013427734, -0.028687477111816406, -0.026684284210205078, -0.02468109130859375, -0.022677898406982422, -0.020674705505371094, -0.018671512603759766, -0.016668319702148438, -0.01466512680053711, -0.012661933898925781, -0.010658740997314453, -0.008655548095703125, -0.006652355194091797, -0.004649162292480469, -0.0026459693908691406, -0.0006427764892578125, 0.0013604164123535156, 0.0033636093139648438, 0.005366802215576172, 0.0073699951171875, 0.009373188018798828, 0.011376380920410156, 0.013379573822021484, 0.015382766723632812, 0.01738595962524414, 0.01938915252685547, 0.021392345428466797, 0.023395538330078125, 0.025398731231689453, 0.02740192413330078, 0.02940511703491211, 0.03140830993652344, 0.033411502838134766, 0.035414695739746094, 0.03741788864135742, 0.03942108154296875, 0.04142427444458008, 0.043427467346191406, 0.045430660247802734, 0.04743385314941406, 0.04943704605102539, 0.05144023895263672, 0.05344343185424805, 0.055446624755859375, 0.0574498176574707, 0.05945301055908203, 0.06145620346069336, 0.06345939636230469, 0.06546258926391602, 0.06746578216552734, 0.06946897506713867, 0.07147216796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 16.0, 26.0, 51.0, 48.0, 68.0, 118.0, 113.0, 126.0, 104.0, 96.0, 73.0, 42.0, 34.0, 27.0, 16.0, 6.0, 4.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873810887336731, -0.844957172870636, -0.816103458404541, -0.787249743938446, -0.7583960294723511, -0.7295423746109009, -0.7006886601448059, -0.6718349456787109, -0.642981231212616, -0.614127516746521, -0.585273802280426, -0.556420087814331, -0.5275664329528809, -0.4987126886844635, -0.4698590040206909, -0.44100528955459595, -0.412151575088501, -0.383297860622406, -0.35444414615631104, -0.32559046149253845, -0.2967367470264435, -0.2678830325603485, -0.23902933299541473, -0.21017563343048096, -0.181321918964386, -0.15246820449829102, -0.12361450493335724, -0.09476079791784286, -0.06590709090232849, -0.03705337643623352, -0.008199676871299744, 0.020654022693634033, 0.049507737159729004, 0.07836144417524338, 0.10721515119075775, 0.13606885075569153, 0.1649225652217865, 0.19377627968788147, 0.22262997925281525, 0.251483678817749, 0.280337393283844, 0.30919110774993896, 0.33804482221603394, 0.3668985068798065, 0.3957522213459015, 0.42460593581199646, 0.45345962047576904, 0.482313334941864, 0.511167049407959, 0.540020763874054, 0.5688744783401489, 0.5977281928062439, 0.6265819072723389, 0.6554355621337891, 0.684289276599884, 0.713142991065979, 0.741996705532074, 0.770850419998169, 0.7997041344642639, 0.8285578489303589, 0.8574115037918091, 0.8862652778625488, 0.915118932723999, 0.943972647190094, 0.972826361656189]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 12.0, 19.0, 7.0, 17.0, 20.0, 14.0, 37.0, 33.0, 41.0, 45.0, 52.0, 68.0, 60.0, 62.0, 58.0, 64.0, 65.0, 46.0, 44.0, 48.0, 42.0, 36.0, 30.0, 21.0, 10.0, 13.0, 8.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9815332889556885, -0.9500988721847534, -0.9186645150184631, -0.8872301578521729, -0.8557957410812378, -0.8243613243103027, -0.7929269671440125, -0.7614926099777222, -0.7300581932067871, -0.698623776435852, -0.6671894192695618, -0.6357550621032715, -0.6043206453323364, -0.5728862285614014, -0.5414518713951111, -0.5100175142288208, -0.47858309745788574, -0.44714871048927307, -0.4157143235206604, -0.38427993655204773, -0.35284554958343506, -0.3214111626148224, -0.2899767756462097, -0.25854238867759705, -0.22710800170898438, -0.1956736147403717, -0.16423922777175903, -0.13280484080314636, -0.10137045383453369, -0.06993606686592102, -0.03850167989730835, -0.007067292928695679, 0.024367094039916992, 0.05580148100852966, 0.08723586797714233, 0.118670254945755, 0.15010464191436768, 0.18153902888298035, 0.21297341585159302, 0.2444078028202057, 0.27584218978881836, 0.30727657675743103, 0.3387109637260437, 0.37014535069465637, 0.40157973766326904, 0.4330141246318817, 0.4644485116004944, 0.49588289856910706, 0.5273172855377197, 0.5587517023086548, 0.5901860594749451, 0.6216204166412354, 0.6530548334121704, 0.6844892501831055, 0.7159236073493958, 0.747357964515686, 0.7787923812866211, 0.8102267980575562, 0.8416611552238464, 0.8730955123901367, 0.9045299291610718, 0.9359643459320068, 0.9673987030982971, 0.9988330602645874, 1.0302674770355225]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 11.0, 17.0, 28.0, 61.0, 70.0, 129.0, 233.0, 396.0, 770.0, 1397.0, 3074.0, 7296.0, 20248.0, 80001.0, 2480232.0, 1493597.0, 73408.0, 19405.0, 6990.0, 3150.0, 1539.0, 815.0, 482.0, 284.0, 203.0, 129.0, 76.0, 50.0, 32.0, 36.0, 24.0, 22.0, 15.0, 14.0, 7.0, 7.0, 4.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2025146484375, -0.1961822509765625, -0.189849853515625, -0.1835174560546875, -0.17718505859375, -0.1708526611328125, -0.164520263671875, -0.1581878662109375, -0.15185546875, -0.1455230712890625, -0.139190673828125, -0.1328582763671875, -0.12652587890625, -0.1201934814453125, -0.113861083984375, -0.1075286865234375, -0.1011962890625, -0.0948638916015625, -0.088531494140625, -0.0821990966796875, -0.07586669921875, -0.0695343017578125, -0.063201904296875, -0.0568695068359375, -0.050537109375, -0.0442047119140625, -0.037872314453125, -0.0315399169921875, -0.02520751953125, -0.0188751220703125, -0.012542724609375, -0.0062103271484375, 0.0001220703125, 0.0064544677734375, 0.012786865234375, 0.0191192626953125, 0.02545166015625, 0.0317840576171875, 0.038116455078125, 0.0444488525390625, 0.05078125, 0.0571136474609375, 0.063446044921875, 0.0697784423828125, 0.07611083984375, 0.0824432373046875, 0.088775634765625, 0.0951080322265625, 0.1014404296875, 0.1077728271484375, 0.114105224609375, 0.1204376220703125, 0.12677001953125, 0.1331024169921875, 0.139434814453125, 0.1457672119140625, 0.152099609375, 0.1584320068359375, 0.164764404296875, 0.1710968017578125, 0.17742919921875, 0.1837615966796875, 0.190093994140625, 0.1964263916015625, 0.2027587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 8.0, 11.0, 13.0, 28.0, 34.0, 51.0, 70.0, 70.0, 77.0, 86.0, 75.0, 95.0, 78.0, 81.0, 65.0, 34.0, 42.0, 15.0, 12.0, 11.0, 11.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04193115234375, -0.04046344757080078, -0.03899574279785156, -0.037528038024902344, -0.036060333251953125, -0.034592628479003906, -0.03312492370605469, -0.03165721893310547, -0.03018951416015625, -0.02872180938720703, -0.027254104614257812, -0.025786399841308594, -0.024318695068359375, -0.022850990295410156, -0.021383285522460938, -0.01991558074951172, -0.0184478759765625, -0.01698017120361328, -0.015512466430664062, -0.014044761657714844, -0.012577056884765625, -0.011109352111816406, -0.009641647338867188, -0.008173942565917969, -0.00670623779296875, -0.005238533020019531, -0.0037708282470703125, -0.0023031234741210938, -0.000835418701171875, 0.0006322860717773438, 0.0020999908447265625, 0.0035676956176757812, 0.005035400390625, 0.006503105163574219, 0.007970809936523438, 0.009438514709472656, 0.010906219482421875, 0.012373924255371094, 0.013841629028320312, 0.015309333801269531, 0.01677703857421875, 0.01824474334716797, 0.019712448120117188, 0.021180152893066406, 0.022647857666015625, 0.024115562438964844, 0.025583267211914062, 0.02705097198486328, 0.0285186767578125, 0.02998638153076172, 0.03145408630371094, 0.032921791076660156, 0.034389495849609375, 0.035857200622558594, 0.03732490539550781, 0.03879261016845703, 0.04026031494140625, 0.04172801971435547, 0.04319572448730469, 0.044663429260253906, 0.046131134033203125, 0.047598838806152344, 0.04906654357910156, 0.05053424835205078, 0.052001953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 9.0, 17.0, 27.0, 33.0, 61.0, 89.0, 132.0, 218.0, 414.0, 701.0, 1310.0, 2748.0, 6122.0, 15746.0, 48169.0, 217607.0, 3215349.0, 562354.0, 83119.0, 23553.0, 8711.0, 3842.0, 1754.0, 904.0, 475.0, 282.0, 176.0, 99.0, 73.0, 45.0, 29.0, 31.0, 12.0, 6.0, 11.0, 5.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15880966186523438, -0.15380096435546875, -0.14879226684570312, -0.1437835693359375, -0.13877487182617188, -0.13376617431640625, -0.12875747680664062, -0.123748779296875, -0.11874008178710938, -0.11373138427734375, -0.10872268676757812, -0.1037139892578125, -0.09870529174804688, -0.09369659423828125, -0.08868789672851562, -0.08367919921875, -0.07867050170898438, -0.07366180419921875, -0.06865310668945312, -0.0636444091796875, -0.058635711669921875, -0.05362701416015625, -0.048618316650390625, -0.043609619140625, -0.038600921630859375, -0.03359222412109375, -0.028583526611328125, -0.0235748291015625, -0.018566131591796875, -0.01355743408203125, -0.008548736572265625, -0.0035400390625, 0.001468658447265625, 0.00647735595703125, 0.011486053466796875, 0.0164947509765625, 0.021503448486328125, 0.02651214599609375, 0.031520843505859375, 0.036529541015625, 0.041538238525390625, 0.04654693603515625, 0.051555633544921875, 0.0565643310546875, 0.061573028564453125, 0.06658172607421875, 0.07159042358398438, 0.07659912109375, 0.08160781860351562, 0.08661651611328125, 0.09162521362304688, 0.0966339111328125, 0.10164260864257812, 0.10665130615234375, 0.11166000366210938, 0.116668701171875, 0.12167739868164062, 0.12668609619140625, 0.13169479370117188, 0.1367034912109375, 0.14171218872070312, 0.14672088623046875, 0.15172958374023438, 0.15673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 13.0, 17.0, 32.0, 34.0, 30.0, 38.0, 63.0, 103.0, 147.0, 267.0, 609.0, 1355.0, 563.0, 281.0, 130.0, 91.0, 56.0, 52.0, 30.0, 28.0, 25.0, 16.0, 12.0, 13.0, 7.0, 8.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046417236328125, -0.04452180862426758, -0.042626380920410156, -0.040730953216552734, -0.03883552551269531, -0.03694009780883789, -0.03504467010498047, -0.03314924240112305, -0.031253814697265625, -0.029358386993408203, -0.02746295928955078, -0.02556753158569336, -0.023672103881835938, -0.021776676177978516, -0.019881248474121094, -0.017985820770263672, -0.01609039306640625, -0.014194965362548828, -0.012299537658691406, -0.010404109954833984, -0.008508682250976562, -0.006613254547119141, -0.004717826843261719, -0.002822399139404297, -0.000926971435546875, 0.0009684562683105469, 0.0028638839721679688, 0.004759311676025391, 0.0066547393798828125, 0.008550167083740234, 0.010445594787597656, 0.012341022491455078, 0.0142364501953125, 0.016131877899169922, 0.018027305603027344, 0.019922733306884766, 0.021818161010742188, 0.02371358871459961, 0.02560901641845703, 0.027504444122314453, 0.029399871826171875, 0.0312952995300293, 0.03319072723388672, 0.03508615493774414, 0.03698158264160156, 0.038877010345458984, 0.040772438049316406, 0.04266786575317383, 0.04456329345703125, 0.04645872116088867, 0.048354148864746094, 0.050249576568603516, 0.05214500427246094, 0.05404043197631836, 0.05593585968017578, 0.0578312873840332, 0.059726715087890625, 0.06162214279174805, 0.06351757049560547, 0.06541299819946289, 0.06730842590332031, 0.06920385360717773, 0.07109928131103516, 0.07299470901489258, 0.07489013671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 8.0, 9.0, 22.0, 52.0, 73.0, 118.0, 153.0, 161.0, 135.0, 103.0, 72.0, 44.0, 21.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5998169183731079, -0.5819693803787231, -0.5641219019889832, -0.5462743639945984, -0.5284268856048584, -0.5105793476104736, -0.49273183941841125, -0.4748843312263489, -0.4570368230342865, -0.4391893148422241, -0.42134180665016174, -0.40349429845809937, -0.3856467604637146, -0.3677992820739746, -0.34995174407958984, -0.33210423588752747, -0.3142567276954651, -0.2964092195034027, -0.27856171131134033, -0.26071420311927795, -0.24286668002605438, -0.225019171833992, -0.20717164874076843, -0.18932414054870605, -0.17147663235664368, -0.1536291241645813, -0.13578161597251892, -0.11793409287929535, -0.10008658468723297, -0.0822390764951706, -0.06439156085252762, -0.046544045209884644, -0.028696537017822266, -0.01084902510046959, 0.006998486816883087, 0.024845998734235764, 0.04269351065158844, 0.06054101884365082, 0.07838853448629379, 0.09623605012893677, 0.11408355832099915, 0.13193106651306152, 0.1497785747051239, 0.16762609779834747, 0.18547360599040985, 0.20332111418247223, 0.2211686372756958, 0.23901614546775818, 0.25686365365982056, 0.27471116185188293, 0.2925586700439453, 0.3104061782360077, 0.32825368642807007, 0.34610122442245483, 0.3639487326145172, 0.3817962408065796, 0.39964374899864197, 0.41749125719070435, 0.4353387653827667, 0.4531862735748291, 0.47103381156921387, 0.48888128995895386, 0.5067288279533386, 0.5245763063430786, 0.5424238443374634]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 12.0, 8.0, 19.0, 12.0, 18.0, 25.0, 35.0, 37.0, 36.0, 55.0, 52.0, 47.0, 46.0, 53.0, 62.0, 45.0, 53.0, 44.0, 42.0, 33.0, 35.0, 40.0, 30.0, 25.0, 33.0, 26.0, 10.0, 10.0, 12.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29416346549987793, -0.28543680906295776, -0.2767101526260376, -0.26798349618911743, -0.25925686955451965, -0.2505302131175995, -0.24180355668067932, -0.23307690024375916, -0.224350243806839, -0.21562358736991882, -0.20689694583415985, -0.19817028939723969, -0.18944363296031952, -0.18071699142456055, -0.17199033498764038, -0.16326367855072021, -0.15453703701496124, -0.14581038057804108, -0.1370837390422821, -0.12835708260536194, -0.11963042616844177, -0.1109037771821022, -0.10217712819576263, -0.09345047175884247, -0.0847238227725029, -0.07599717378616333, -0.06727051734924316, -0.058543868362903595, -0.04981721565127373, -0.04109056293964386, -0.03236391395330429, -0.023637261241674423, -0.014910608530044556, -0.006183956749737263, 0.00254269503057003, 0.011269345879554749, 0.019995998591184616, 0.028722651302814484, 0.03744930028915405, 0.04617595300078392, 0.05490260571241379, 0.06362925469875336, 0.07235591113567352, 0.08108256012201309, 0.08980920910835266, 0.09853586554527283, 0.1072625145316124, 0.11598916351795197, 0.12471581995487213, 0.1334424763917923, 0.14216911792755127, 0.15089577436447144, 0.1596224308013916, 0.16834908723831177, 0.17707572877407074, 0.1858023852109909, 0.19452902674674988, 0.20325568318367004, 0.21198232471942902, 0.22070898115634918, 0.22943563759326935, 0.23816227912902832, 0.2468889355659485, 0.25561559200286865, 0.2643422484397888]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 16.0, 10.0, 27.0, 35.0, 51.0, 68.0, 127.0, 148.0, 272.0, 471.0, 871.0, 1823.0, 4366.0, 11561.0, 34540.0, 127757.0, 531695.0, 246043.0, 58908.0, 17974.0, 6456.0, 2602.0, 1182.0, 590.0, 318.0, 207.0, 125.0, 84.0, 58.0, 43.0, 23.0, 19.0, 17.0, 14.0, 5.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.233154296875, -0.22623825073242188, -0.21932220458984375, -0.21240615844726562, -0.2054901123046875, -0.19857406616210938, -0.19165802001953125, -0.18474197387695312, -0.177825927734375, -0.17090988159179688, -0.16399383544921875, -0.15707778930664062, -0.1501617431640625, -0.14324569702148438, -0.13632965087890625, -0.12941360473632812, -0.12249755859375, -0.11558151245117188, -0.10866546630859375, -0.10174942016601562, -0.0948333740234375, -0.08791732788085938, -0.08100128173828125, -0.07408523559570312, -0.067169189453125, -0.060253143310546875, -0.05333709716796875, -0.046421051025390625, -0.0395050048828125, -0.032588958740234375, -0.02567291259765625, -0.018756866455078125, -0.0118408203125, -0.004924774169921875, 0.00199127197265625, 0.008907318115234375, 0.0158233642578125, 0.022739410400390625, 0.02965545654296875, 0.036571502685546875, 0.043487548828125, 0.050403594970703125, 0.05731964111328125, 0.06423568725585938, 0.0711517333984375, 0.07806777954101562, 0.08498382568359375, 0.09189987182617188, 0.09881591796875, 0.10573196411132812, 0.11264801025390625, 0.11956405639648438, 0.1264801025390625, 0.13339614868164062, 0.14031219482421875, 0.14722824096679688, 0.154144287109375, 0.16106033325195312, 0.16797637939453125, 0.17489242553710938, 0.1818084716796875, 0.18872451782226562, 0.19564056396484375, 0.20255661010742188, 0.20947265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 11.0, 13.0, 12.0, 25.0, 59.0, 53.0, 71.0, 81.0, 94.0, 89.0, 105.0, 83.0, 93.0, 57.0, 53.0, 26.0, 26.0, 8.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053558349609375, -0.05197334289550781, -0.050388336181640625, -0.04880332946777344, -0.04721832275390625, -0.04563331604003906, -0.044048309326171875, -0.04246330261230469, -0.0408782958984375, -0.03929328918457031, -0.037708282470703125, -0.03612327575683594, -0.03453826904296875, -0.03295326232910156, -0.031368255615234375, -0.029783248901367188, -0.0281982421875, -0.026613235473632812, -0.025028228759765625, -0.023443222045898438, -0.02185821533203125, -0.020273208618164062, -0.018688201904296875, -0.017103195190429688, -0.0155181884765625, -0.013933181762695312, -0.012348175048828125, -0.010763168334960938, -0.00917816162109375, -0.0075931549072265625, -0.006008148193359375, -0.0044231414794921875, -0.002838134765625, -0.0012531280517578125, 0.000331878662109375, 0.0019168853759765625, 0.00350189208984375, 0.0050868988037109375, 0.006671905517578125, 0.008256912231445312, 0.0098419189453125, 0.011426925659179688, 0.013011932373046875, 0.014596939086914062, 0.01618194580078125, 0.017766952514648438, 0.019351959228515625, 0.020936965942382812, 0.02252197265625, 0.024106979370117188, 0.025691986083984375, 0.027276992797851562, 0.02886199951171875, 0.030447006225585938, 0.032032012939453125, 0.03361701965332031, 0.0352020263671875, 0.03678703308105469, 0.038372039794921875, 0.03995704650878906, 0.04154205322265625, 0.04312705993652344, 0.044712066650390625, 0.04629707336425781, 0.047882080078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 11.0, 15.0, 21.0, 32.0, 51.0, 57.0, 86.0, 126.0, 158.0, 250.0, 409.0, 634.0, 999.0, 1620.0, 3030.0, 5454.0, 10959.0, 25133.0, 60753.0, 160726.0, 392742.0, 234775.0, 85844.0, 34184.0, 14697.0, 6975.0, 3489.0, 1961.0, 1157.0, 746.0, 449.0, 301.0, 207.0, 149.0, 82.0, 85.0, 55.0, 41.0, 24.0, 11.0, 12.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11004638671875, -0.10620975494384766, -0.10237312316894531, -0.09853649139404297, -0.09469985961914062, -0.09086322784423828, -0.08702659606933594, -0.0831899642944336, -0.07935333251953125, -0.0755167007446289, -0.07168006896972656, -0.06784343719482422, -0.06400680541992188, -0.06017017364501953, -0.05633354187011719, -0.052496910095214844, -0.0486602783203125, -0.044823646545410156, -0.04098701477050781, -0.03715038299560547, -0.033313751220703125, -0.02947711944580078, -0.025640487670898438, -0.021803855895996094, -0.01796722412109375, -0.014130592346191406, -0.010293960571289062, -0.006457328796386719, -0.002620697021484375, 0.0012159347534179688, 0.0050525665283203125, 0.008889198303222656, 0.012725830078125, 0.016562461853027344, 0.020399093627929688, 0.02423572540283203, 0.028072357177734375, 0.03190898895263672, 0.03574562072753906, 0.039582252502441406, 0.04341888427734375, 0.047255516052246094, 0.05109214782714844, 0.05492877960205078, 0.058765411376953125, 0.06260204315185547, 0.06643867492675781, 0.07027530670166016, 0.0741119384765625, 0.07794857025146484, 0.08178520202636719, 0.08562183380126953, 0.08945846557617188, 0.09329509735107422, 0.09713172912597656, 0.1009683609008789, 0.10480499267578125, 0.1086416244506836, 0.11247825622558594, 0.11631488800048828, 0.12015151977539062, 0.12398815155029297, 0.1278247833251953, 0.13166141510009766, 0.135498046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 12.0, 14.0, 6.0, 12.0, 12.0, 25.0, 17.0, 22.0, 20.0, 26.0, 38.0, 36.0, 38.0, 36.0, 49.0, 54.0, 48.0, 54.0, 52.0, 41.0, 40.0, 48.0, 39.0, 37.0, 40.0, 37.0, 27.0, 32.0, 21.0, 11.0, 13.0, 14.0, 11.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1583251953125, -0.15381431579589844, -0.14930343627929688, -0.1447925567626953, -0.14028167724609375, -0.1357707977294922, -0.13125991821289062, -0.12674903869628906, -0.1222381591796875, -0.11772727966308594, -0.11321640014648438, -0.10870552062988281, -0.10419464111328125, -0.09968376159667969, -0.09517288208007812, -0.09066200256347656, -0.086151123046875, -0.08164024353027344, -0.07712936401367188, -0.07261848449707031, -0.06810760498046875, -0.06359672546386719, -0.059085845947265625, -0.05457496643066406, -0.0500640869140625, -0.04555320739746094, -0.041042327880859375, -0.03653144836425781, -0.03202056884765625, -0.027509689331054688, -0.022998809814453125, -0.018487930297851562, -0.01397705078125, -0.009466171264648438, -0.004955291748046875, -0.0004444122314453125, 0.00406646728515625, 0.008577346801757812, 0.013088226318359375, 0.017599105834960938, 0.0221099853515625, 0.026620864868164062, 0.031131744384765625, 0.03564262390136719, 0.04015350341796875, 0.04466438293457031, 0.049175262451171875, 0.05368614196777344, 0.058197021484375, 0.06270790100097656, 0.06721878051757812, 0.07172966003417969, 0.07624053955078125, 0.08075141906738281, 0.08526229858398438, 0.08977317810058594, 0.0942840576171875, 0.09879493713378906, 0.10330581665039062, 0.10781669616699219, 0.11232757568359375, 0.11683845520019531, 0.12134933471679688, 0.12586021423339844, 0.13037109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 8.0, 19.0, 16.0, 21.0, 42.0, 77.0, 140.0, 269.0, 456.0, 863.0, 1595.0, 3412.0, 7972.0, 22199.0, 95983.0, 586159.0, 263334.0, 43231.0, 12686.0, 5011.0, 2356.0, 1237.0, 634.0, 320.0, 174.0, 117.0, 76.0, 47.0, 33.0, 14.0, 7.0, 13.0, 12.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.13231277465820312, -0.12827301025390625, -0.12423324584960938, -0.1201934814453125, -0.11615371704101562, -0.11211395263671875, -0.10807418823242188, -0.104034423828125, -0.09999465942382812, -0.09595489501953125, -0.09191513061523438, -0.0878753662109375, -0.08383560180664062, -0.07979583740234375, -0.07575607299804688, -0.07171630859375, -0.06767654418945312, -0.06363677978515625, -0.059597015380859375, -0.0555572509765625, -0.051517486572265625, -0.04747772216796875, -0.043437957763671875, -0.039398193359375, -0.035358428955078125, -0.03131866455078125, -0.027278900146484375, -0.0232391357421875, -0.019199371337890625, -0.01515960693359375, -0.011119842529296875, -0.007080078125, -0.003040313720703125, 0.00099945068359375, 0.005039215087890625, 0.0090789794921875, 0.013118743896484375, 0.01715850830078125, 0.021198272705078125, 0.025238037109375, 0.029277801513671875, 0.03331756591796875, 0.037357330322265625, 0.0413970947265625, 0.045436859130859375, 0.04947662353515625, 0.053516387939453125, 0.05755615234375, 0.061595916748046875, 0.06563568115234375, 0.06967544555664062, 0.0737152099609375, 0.07775497436523438, 0.08179473876953125, 0.08583450317382812, 0.089874267578125, 0.09391403198242188, 0.09795379638671875, 0.10199356079101562, 0.1060333251953125, 0.11007308959960938, 0.11411285400390625, 0.11815261840820312, 0.1221923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 8.0, 2.0, 7.0, 7.0, 15.0, 25.0, 32.0, 46.0, 45.0, 73.0, 94.0, 88.0, 87.0, 87.0, 84.0, 60.0, 51.0, 54.0, 48.0, 22.0, 15.0, 20.0, 12.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.64320182800293e-05, -4.516635090112686e-05, -4.3900683522224426e-05, -4.263501614332199e-05, -4.1369348764419556e-05, -4.010368138551712e-05, -3.8838014006614685e-05, -3.757234662771225e-05, -3.6306679248809814e-05, -3.504101186990738e-05, -3.3775344491004944e-05, -3.250967711210251e-05, -3.124400973320007e-05, -2.9978342354297638e-05, -2.8712674975395203e-05, -2.7447007596492767e-05, -2.6181340217590332e-05, -2.4915672838687897e-05, -2.365000545978546e-05, -2.2384338080883026e-05, -2.111867070198059e-05, -1.9853003323078156e-05, -1.858733594417572e-05, -1.7321668565273285e-05, -1.605600118637085e-05, -1.4790333807468414e-05, -1.3524666428565979e-05, -1.2258999049663544e-05, -1.0993331670761108e-05, -9.727664291858673e-06, -8.461996912956238e-06, -7.1963295340538025e-06, -5.930662155151367e-06, -4.664994776248932e-06, -3.3993273973464966e-06, -2.1336600184440613e-06, -8.67992639541626e-07, 3.976747393608093e-07, 1.6633421182632446e-06, 2.92900949716568e-06, 4.194676876068115e-06, 5.4603442549705505e-06, 6.726011633872986e-06, 7.991679012775421e-06, 9.257346391677856e-06, 1.0523013770580292e-05, 1.1788681149482727e-05, 1.3054348528385162e-05, 1.4320015907287598e-05, 1.5585683286190033e-05, 1.6851350665092468e-05, 1.8117018043994904e-05, 1.938268542289734e-05, 2.0648352801799774e-05, 2.191402018070221e-05, 2.3179687559604645e-05, 2.444535493850708e-05, 2.5711022317409515e-05, 2.697668969631195e-05, 2.8242357075214386e-05, 2.950802445411682e-05, 3.0773691833019257e-05, 3.203935921192169e-05, 3.330502659082413e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 13.0, 13.0, 20.0, 29.0, 46.0, 45.0, 80.0, 118.0, 199.0, 347.0, 602.0, 1313.0, 2903.0, 7025.0, 21087.0, 87356.0, 557240.0, 298482.0, 48954.0, 13447.0, 4935.0, 2085.0, 961.0, 519.0, 267.0, 175.0, 92.0, 67.0, 38.0, 30.0, 15.0, 20.0, 10.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1343994140625, -0.13074874877929688, -0.12709808349609375, -0.12344741821289062, -0.1197967529296875, -0.11614608764648438, -0.11249542236328125, -0.10884475708007812, -0.105194091796875, -0.10154342651367188, -0.09789276123046875, -0.09424209594726562, -0.0905914306640625, -0.08694076538085938, -0.08329010009765625, -0.07963943481445312, -0.07598876953125, -0.07233810424804688, -0.06868743896484375, -0.06503677368164062, -0.0613861083984375, -0.057735443115234375, -0.05408477783203125, -0.050434112548828125, -0.046783447265625, -0.043132781982421875, -0.03948211669921875, -0.035831451416015625, -0.0321807861328125, -0.028530120849609375, -0.02487945556640625, -0.021228790283203125, -0.017578125, -0.013927459716796875, -0.01027679443359375, -0.006626129150390625, -0.0029754638671875, 0.000675201416015625, 0.00432586669921875, 0.007976531982421875, 0.011627197265625, 0.015277862548828125, 0.01892852783203125, 0.022579193115234375, 0.0262298583984375, 0.029880523681640625, 0.03353118896484375, 0.037181854248046875, 0.04083251953125, 0.044483184814453125, 0.04813385009765625, 0.051784515380859375, 0.0554351806640625, 0.059085845947265625, 0.06273651123046875, 0.06638717651367188, 0.070037841796875, 0.07368850708007812, 0.07733917236328125, 0.08098983764648438, 0.0846405029296875, 0.08829116821289062, 0.09194183349609375, 0.09559249877929688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 8.0, 12.0, 12.0, 12.0, 23.0, 27.0, 39.0, 65.0, 103.0, 141.0, 148.0, 125.0, 76.0, 53.0, 31.0, 21.0, 20.0, 15.0, 11.0, 13.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.08706188201904297, -0.08397483825683594, -0.0808877944946289, -0.07780075073242188, -0.07471370697021484, -0.07162666320800781, -0.06853961944580078, -0.06545257568359375, -0.06236553192138672, -0.05927848815917969, -0.056191444396972656, -0.053104400634765625, -0.050017356872558594, -0.04693031311035156, -0.04384326934814453, -0.0407562255859375, -0.03766918182373047, -0.03458213806152344, -0.031495094299316406, -0.028408050537109375, -0.025321006774902344, -0.022233963012695312, -0.01914691925048828, -0.01605987548828125, -0.012972831726074219, -0.009885787963867188, -0.006798744201660156, -0.003711700439453125, -0.0006246566772460938, 0.0024623870849609375, 0.005549430847167969, 0.008636474609375, 0.011723518371582031, 0.014810562133789062, 0.017897605895996094, 0.020984649658203125, 0.024071693420410156, 0.027158737182617188, 0.03024578094482422, 0.03333282470703125, 0.03641986846923828, 0.03950691223144531, 0.042593955993652344, 0.045680999755859375, 0.048768043518066406, 0.05185508728027344, 0.05494213104248047, 0.0580291748046875, 0.06111621856689453, 0.06420326232910156, 0.0672903060913086, 0.07037734985351562, 0.07346439361572266, 0.07655143737792969, 0.07963848114013672, 0.08272552490234375, 0.08581256866455078, 0.08889961242675781, 0.09198665618896484, 0.09507369995117188, 0.0981607437133789, 0.10124778747558594, 0.10433483123779297, 0.107421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 17.0, 17.0, 42.0, 49.0, 73.0, 111.0, 155.0, 161.0, 135.0, 82.0, 59.0, 26.0, 23.0, 17.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6204460859298706, -1.5788004398345947, -1.5371546745300293, -1.4955090284347534, -1.4538633823394775, -1.4122177362442017, -1.3705719709396362, -1.3289263248443604, -1.2872806787490845, -1.2456350326538086, -1.2039892673492432, -1.1623436212539673, -1.1206979751586914, -1.0790523290634155, -1.03740656375885, -0.9957609176635742, -0.9541152119636536, -0.9124695062637329, -0.870823860168457, -0.8291781544685364, -0.7875325083732605, -0.7458868026733398, -0.704241156578064, -0.6625954508781433, -0.6209497451782227, -0.579304039478302, -0.5376583933830261, -0.49601268768310547, -0.4543670415878296, -0.41272133588790894, -0.37107565999031067, -0.3294299840927124, -0.2877843379974365, -0.24613866209983826, -0.20449298620224, -0.16284729540348053, -0.12120161950588226, -0.079555943608284, -0.037910252809524536, 0.0037354230880737305, 0.045381098985672, 0.08702677488327026, 0.12867245078086853, 0.170318141579628, 0.21196381747722626, 0.25360947847366333, 0.295255184173584, 0.33690086007118225, 0.3785465359687805, 0.4201922118663788, 0.46183788776397705, 0.5034835934638977, 0.5451292395591736, 0.5867749452590942, 0.6284205913543701, 0.6700662970542908, 0.7117120027542114, 0.7533577084541321, 0.795003354549408, 0.8366490602493286, 0.8782947063446045, 0.9199404120445251, 0.9615861177444458, 1.0032317638397217, 1.0448774099349976]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 2.0, 5.0, 10.0, 7.0, 16.0, 17.0, 17.0, 19.0, 21.0, 25.0, 20.0, 37.0, 31.0, 35.0, 43.0, 53.0, 43.0, 44.0, 49.0, 50.0, 51.0, 58.0, 47.0, 29.0, 33.0, 20.0, 28.0, 23.0, 26.0, 15.0, 23.0, 10.0, 13.0, 12.0, 11.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.834596574306488, -0.8115134835243225, -0.788430392742157, -0.7653473019599915, -0.7422642111778259, -0.7191811203956604, -0.6960979700088501, -0.6730148792266846, -0.649931788444519, -0.6268486976623535, -0.603765606880188, -0.5806825160980225, -0.5575994253158569, -0.5345163345336914, -0.5114332437515259, -0.48835012316703796, -0.4652670621871948, -0.4421839714050293, -0.41910088062286377, -0.39601778984069824, -0.3729346990585327, -0.3498516082763672, -0.3267684876918793, -0.30368539690971375, -0.2806023061275482, -0.2575192153453827, -0.23443612456321716, -0.21135301887989044, -0.18826992809772491, -0.1651868373155594, -0.14210373163223267, -0.11902064085006714, -0.09593760967254639, -0.07285451889038086, -0.049771420657634735, -0.02668832242488861, -0.0036052316427230835, 0.019477859139442444, 0.042560964822769165, 0.06564405560493469, 0.08872714638710022, 0.11181023716926575, 0.13489332795143127, 0.157976433634758, 0.18105952441692352, 0.20414261519908905, 0.22722572088241577, 0.2503088116645813, 0.2733919024467468, 0.29647499322891235, 0.3195580840110779, 0.3426411747932434, 0.36572426557540894, 0.38880735635757446, 0.4118904769420624, 0.4349735677242279, 0.45805665850639343, 0.48113974928855896, 0.5042228698730469, 0.5273059606552124, 0.5503890514373779, 0.5734721422195435, 0.596555233001709, 0.6196383237838745, 0.64272141456604]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 24.0, 27.0, 36.0, 89.0, 142.0, 224.0, 392.0, 735.0, 1417.0, 3398.0, 10741.0, 49887.0, 2565261.0, 1497441.0, 46888.0, 10646.0, 3518.0, 1538.0, 790.0, 416.0, 243.0, 143.0, 96.0, 58.0, 31.0, 26.0, 19.0, 8.0, 9.0, 6.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.286865234375, -0.27889442443847656, -0.2709236145019531, -0.2629528045654297, -0.25498199462890625, -0.2470111846923828, -0.23904037475585938, -0.23106956481933594, -0.2230987548828125, -0.21512794494628906, -0.20715713500976562, -0.1991863250732422, -0.19121551513671875, -0.1832447052001953, -0.17527389526367188, -0.16730308532714844, -0.159332275390625, -0.15136146545410156, -0.14339065551757812, -0.1354198455810547, -0.12744903564453125, -0.11947822570800781, -0.11150741577148438, -0.10353660583496094, -0.0955657958984375, -0.08759498596191406, -0.07962417602539062, -0.07165336608886719, -0.06368255615234375, -0.05571174621582031, -0.047740936279296875, -0.03977012634277344, -0.03179931640625, -0.023828506469726562, -0.015857696533203125, -0.007886886596679688, 8.392333984375e-05, 0.008054733276367188, 0.016025543212890625, 0.023996353149414062, 0.0319671630859375, 0.03993797302246094, 0.047908782958984375, 0.05587959289550781, 0.06385040283203125, 0.07182121276855469, 0.07979202270507812, 0.08776283264160156, 0.095733642578125, 0.10370445251464844, 0.11167526245117188, 0.11964607238769531, 0.12761688232421875, 0.1355876922607422, 0.14355850219726562, 0.15152931213378906, 0.1595001220703125, 0.16747093200683594, 0.17544174194335938, 0.1834125518798828, 0.19138336181640625, 0.1993541717529297, 0.20732498168945312, 0.21529579162597656, 0.2232666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 18.0, 23.0, 24.0, 30.0, 47.0, 79.0, 68.0, 87.0, 86.0, 82.0, 75.0, 81.0, 75.0, 57.0, 34.0, 30.0, 31.0, 13.0, 15.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.048645973205566406, -0.04715156555175781, -0.04565715789794922, -0.044162750244140625, -0.04266834259033203, -0.04117393493652344, -0.039679527282714844, -0.03818511962890625, -0.036690711975097656, -0.03519630432128906, -0.03370189666748047, -0.032207489013671875, -0.03071308135986328, -0.029218673706054688, -0.027724266052246094, -0.0262298583984375, -0.024735450744628906, -0.023241043090820312, -0.02174663543701172, -0.020252227783203125, -0.01875782012939453, -0.017263412475585938, -0.015769004821777344, -0.01427459716796875, -0.012780189514160156, -0.011285781860351562, -0.009791374206542969, -0.008296966552734375, -0.006802558898925781, -0.0053081512451171875, -0.0038137435913085938, -0.0023193359375, -0.0008249282836914062, 0.0006694793701171875, 0.0021638870239257812, 0.003658294677734375, 0.005152702331542969, 0.0066471099853515625, 0.008141517639160156, 0.00963592529296875, 0.011130332946777344, 0.012624740600585938, 0.014119148254394531, 0.015613555908203125, 0.01710796356201172, 0.018602371215820312, 0.020096778869628906, 0.0215911865234375, 0.023085594177246094, 0.024580001831054688, 0.02607440948486328, 0.027568817138671875, 0.02906322479248047, 0.030557632446289062, 0.032052040100097656, 0.03354644775390625, 0.035040855407714844, 0.03653526306152344, 0.03802967071533203, 0.039524078369140625, 0.04101848602294922, 0.04251289367675781, 0.044007301330566406, 0.045501708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 9.0, 9.0, 11.0, 21.0, 17.0, 37.0, 53.0, 67.0, 109.0, 152.0, 296.0, 514.0, 1062.0, 2448.0, 7246.0, 31867.0, 283341.0, 3710269.0, 128691.0, 19264.0, 5036.0, 1842.0, 800.0, 421.0, 264.0, 133.0, 86.0, 64.0, 36.0, 32.0, 29.0, 18.0, 10.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.23976898193359375, -0.2310028076171875, -0.22223663330078125, -0.213470458984375, -0.20470428466796875, -0.1959381103515625, -0.18717193603515625, -0.17840576171875, -0.16963958740234375, -0.1608734130859375, -0.15210723876953125, -0.143341064453125, -0.13457489013671875, -0.1258087158203125, -0.11704254150390625, -0.1082763671875, -0.09951019287109375, -0.0907440185546875, -0.08197784423828125, -0.073211669921875, -0.06444549560546875, -0.0556793212890625, -0.04691314697265625, -0.03814697265625, -0.02938079833984375, -0.0206146240234375, -0.01184844970703125, -0.003082275390625, 0.00568389892578125, 0.0144500732421875, 0.02321624755859375, 0.031982421875, 0.04074859619140625, 0.0495147705078125, 0.05828094482421875, 0.067047119140625, 0.07581329345703125, 0.0845794677734375, 0.09334564208984375, 0.10211181640625, 0.11087799072265625, 0.1196441650390625, 0.12841033935546875, 0.137176513671875, 0.14594268798828125, 0.1547088623046875, 0.16347503662109375, 0.1722412109375, 0.18100738525390625, 0.1897735595703125, 0.19853973388671875, 0.207305908203125, 0.21607208251953125, 0.2248382568359375, 0.23360443115234375, 0.24237060546875, 0.25113677978515625, 0.2599029541015625, 0.26866912841796875, 0.277435302734375, 0.28620147705078125, 0.2949676513671875, 0.30373382568359375, 0.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 8.0, 10.0, 35.0, 44.0, 74.0, 156.0, 383.0, 2331.0, 609.0, 178.0, 107.0, 68.0, 25.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13791370391845703, -0.13434791564941406, -0.1307821273803711, -0.12721633911132812, -0.12365055084228516, -0.12008476257324219, -0.11651897430419922, -0.11295318603515625, -0.10938739776611328, -0.10582160949707031, -0.10225582122802734, -0.09869003295898438, -0.0951242446899414, -0.09155845642089844, -0.08799266815185547, -0.0844268798828125, -0.08086109161376953, -0.07729530334472656, -0.0737295150756836, -0.07016372680664062, -0.06659793853759766, -0.06303215026855469, -0.05946636199951172, -0.05590057373046875, -0.05233478546142578, -0.04876899719238281, -0.045203208923339844, -0.041637420654296875, -0.038071632385253906, -0.03450584411621094, -0.03094005584716797, -0.027374267578125, -0.02380847930908203, -0.020242691040039062, -0.016676902770996094, -0.013111114501953125, -0.009545326232910156, -0.0059795379638671875, -0.0024137496948242188, 0.00115203857421875, 0.004717826843261719, 0.008283615112304688, 0.011849403381347656, 0.015415191650390625, 0.018980979919433594, 0.022546768188476562, 0.02611255645751953, 0.0296783447265625, 0.03324413299560547, 0.03680992126464844, 0.040375709533691406, 0.043941497802734375, 0.047507286071777344, 0.05107307434082031, 0.05463886260986328, 0.05820465087890625, 0.06177043914794922, 0.06533622741699219, 0.06890201568603516, 0.07246780395507812, 0.0760335922241211, 0.07959938049316406, 0.08316516876220703, 0.08673095703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 17.0, 15.0, 40.0, 60.0, 89.0, 117.0, 162.0, 144.0, 111.0, 98.0, 68.0, 28.0, 11.0, 15.0, 10.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5916775465011597, -0.5743805766105652, -0.5570836663246155, -0.539786696434021, -0.5224897861480713, -0.5051928162574768, -0.4878958463668823, -0.47059890627861023, -0.45330196619033813, -0.43600502610206604, -0.41870808601379395, -0.40141111612319946, -0.38411417603492737, -0.3668172359466553, -0.3495202660560608, -0.3322233259677887, -0.3149263858795166, -0.2976294457912445, -0.2803325057029724, -0.26303553581237793, -0.24573859572410583, -0.22844165563583374, -0.21114470064640045, -0.19384774565696716, -0.17655080556869507, -0.15925386548042297, -0.14195691049098969, -0.124659962952137, -0.1073630154132843, -0.09006606787443161, -0.07276912033557892, -0.05547217279672623, -0.03817516565322876, -0.020878218114376068, -0.0035812705755233765, 0.013715676963329315, 0.031012624502182007, 0.0483095720410347, 0.06560651957988739, 0.08290346711874008, 0.10020041465759277, 0.11749736219644547, 0.13479430973529816, 0.15209126472473145, 0.16938820481300354, 0.18668514490127563, 0.20398209989070892, 0.2212790548801422, 0.2385759949684143, 0.2558729350566864, 0.2731698751449585, 0.290466845035553, 0.3077637851238251, 0.32506072521209717, 0.34235769510269165, 0.35965463519096375, 0.37695157527923584, 0.39424851536750793, 0.41154545545578003, 0.4288424253463745, 0.4461393654346466, 0.4634363055229187, 0.4807332754135132, 0.4980302155017853, 0.5153271555900574]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 5.0, 9.0, 10.0, 9.0, 11.0, 13.0, 12.0, 22.0, 38.0, 31.0, 26.0, 27.0, 31.0, 36.0, 43.0, 43.0, 45.0, 26.0, 47.0, 35.0, 49.0, 41.0, 42.0, 46.0, 32.0, 40.0, 37.0, 41.0, 23.0, 22.0, 13.0, 17.0, 11.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25157982110977173, -0.24420452117919922, -0.2368292212486267, -0.2294539213180542, -0.2220786213874817, -0.21470332145690918, -0.20732800662517548, -0.19995270669460297, -0.19257740676403046, -0.18520210683345795, -0.17782680690288544, -0.17045150697231293, -0.16307619214057922, -0.1557008922100067, -0.1483255922794342, -0.1409502923488617, -0.13357499241828918, -0.12619969248771667, -0.11882439255714417, -0.11144908517599106, -0.10407378524541855, -0.09669848531484604, -0.08932317793369293, -0.08194787800312042, -0.07457257807254791, -0.0671972781419754, -0.059821974486112595, -0.052446670830249786, -0.04507137089967728, -0.03769607096910477, -0.03032076731324196, -0.02294546365737915, -0.01557016372680664, -0.008194861933588982, -0.0008195601403713226, 0.006555741652846336, 0.013931043446063995, 0.021306343376636505, 0.028681647032499313, 0.03605695068836212, 0.04343225061893463, 0.05080755054950714, 0.05818285420536995, 0.06555815786123276, 0.07293345779180527, 0.08030875772237778, 0.08768406510353088, 0.0950593650341034, 0.1024346649646759, 0.10980996489524841, 0.11718526482582092, 0.12456057220697403, 0.13193586468696594, 0.13931116461753845, 0.14668647944927216, 0.15406177937984467, 0.16143707931041718, 0.16881237924098969, 0.1761876791715622, 0.1835629791021347, 0.1909382939338684, 0.19831359386444092, 0.20568889379501343, 0.21306419372558594, 0.22043949365615845]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 8.0, 15.0, 20.0, 20.0, 34.0, 52.0, 68.0, 106.0, 175.0, 289.0, 433.0, 764.0, 1373.0, 2550.0, 5088.0, 10433.0, 23842.0, 59217.0, 156533.0, 389954.0, 244034.0, 89509.0, 34881.0, 14815.0, 6811.0, 3336.0, 1723.0, 1022.0, 551.0, 285.0, 199.0, 145.0, 81.0, 49.0, 38.0, 27.0, 13.0, 18.0, 11.0, 3.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1456298828125, -0.14055824279785156, -0.13548660278320312, -0.1304149627685547, -0.12534332275390625, -0.12027168273925781, -0.11520004272460938, -0.11012840270996094, -0.1050567626953125, -0.09998512268066406, -0.09491348266601562, -0.08984184265136719, -0.08477020263671875, -0.07969856262207031, -0.07462692260742188, -0.06955528259277344, -0.064483642578125, -0.05941200256347656, -0.054340362548828125, -0.04926872253417969, -0.04419708251953125, -0.03912544250488281, -0.034053802490234375, -0.028982162475585938, -0.0239105224609375, -0.018838882446289062, -0.013767242431640625, -0.008695602416992188, -0.00362396240234375, 0.0014476776123046875, 0.006519317626953125, 0.011590957641601562, 0.01666259765625, 0.021734237670898438, 0.026805877685546875, 0.03187751770019531, 0.03694915771484375, 0.04202079772949219, 0.047092437744140625, 0.05216407775878906, 0.0572357177734375, 0.06230735778808594, 0.06737899780273438, 0.07245063781738281, 0.07752227783203125, 0.08259391784667969, 0.08766555786132812, 0.09273719787597656, 0.097808837890625, 0.10288047790527344, 0.10795211791992188, 0.11302375793457031, 0.11809539794921875, 0.12316703796386719, 0.12823867797851562, 0.13331031799316406, 0.1383819580078125, 0.14345359802246094, 0.14852523803710938, 0.1535968780517578, 0.15866851806640625, 0.1637401580810547, 0.16881179809570312, 0.17388343811035156, 0.178955078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 8.0, 21.0, 31.0, 34.0, 37.0, 55.0, 67.0, 58.0, 78.0, 84.0, 73.0, 71.0, 73.0, 53.0, 53.0, 48.0, 37.0, 28.0, 24.0, 16.0, 11.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04705810546875, -0.045607566833496094, -0.04415702819824219, -0.04270648956298828, -0.041255950927734375, -0.03980541229248047, -0.03835487365722656, -0.036904335021972656, -0.03545379638671875, -0.034003257751464844, -0.03255271911621094, -0.03110218048095703, -0.029651641845703125, -0.02820110321044922, -0.026750564575195312, -0.025300025939941406, -0.0238494873046875, -0.022398948669433594, -0.020948410034179688, -0.01949787139892578, -0.018047332763671875, -0.01659679412841797, -0.015146255493164062, -0.013695716857910156, -0.01224517822265625, -0.010794639587402344, -0.009344100952148438, -0.007893562316894531, -0.006443023681640625, -0.004992485046386719, -0.0035419464111328125, -0.0020914077758789062, -0.000640869140625, 0.0008096694946289062, 0.0022602081298828125, 0.0037107467651367188, 0.005161285400390625, 0.006611824035644531, 0.008062362670898438, 0.009512901306152344, 0.01096343994140625, 0.012413978576660156, 0.013864517211914062, 0.015315055847167969, 0.016765594482421875, 0.01821613311767578, 0.019666671752929688, 0.021117210388183594, 0.0225677490234375, 0.024018287658691406, 0.025468826293945312, 0.02691936492919922, 0.028369903564453125, 0.02982044219970703, 0.03127098083496094, 0.032721519470214844, 0.03417205810546875, 0.035622596740722656, 0.03707313537597656, 0.03852367401123047, 0.039974212646484375, 0.04142475128173828, 0.04287528991699219, 0.044325828552246094, 0.0457763671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 10.0, 4.0, 11.0, 13.0, 13.0, 17.0, 25.0, 41.0, 71.0, 79.0, 128.0, 146.0, 246.0, 344.0, 589.0, 1089.0, 2063.0, 4242.0, 9920.0, 25412.0, 71432.0, 212906.0, 424781.0, 190478.0, 63769.0, 23199.0, 9085.0, 3919.0, 1767.0, 989.0, 612.0, 372.0, 226.0, 156.0, 117.0, 81.0, 60.0, 44.0, 24.0, 21.0, 20.0, 15.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.12974929809570312, -0.12534332275390625, -0.12093734741210938, -0.1165313720703125, -0.11212539672851562, -0.10771942138671875, -0.10331344604492188, -0.098907470703125, -0.09450149536132812, -0.09009552001953125, -0.08568954467773438, -0.0812835693359375, -0.07687759399414062, -0.07247161865234375, -0.06806564331054688, -0.06365966796875, -0.059253692626953125, -0.05484771728515625, -0.050441741943359375, -0.0460357666015625, -0.041629791259765625, -0.03722381591796875, -0.032817840576171875, -0.028411865234375, -0.024005889892578125, -0.01959991455078125, -0.015193939208984375, -0.0107879638671875, -0.006381988525390625, -0.00197601318359375, 0.002429962158203125, 0.0068359375, 0.011241912841796875, 0.01564788818359375, 0.020053863525390625, 0.0244598388671875, 0.028865814208984375, 0.03327178955078125, 0.037677764892578125, 0.042083740234375, 0.046489715576171875, 0.05089569091796875, 0.055301666259765625, 0.0597076416015625, 0.06411361694335938, 0.06851959228515625, 0.07292556762695312, 0.07733154296875, 0.08173751831054688, 0.08614349365234375, 0.09054946899414062, 0.0949554443359375, 0.09936141967773438, 0.10376739501953125, 0.10817337036132812, 0.112579345703125, 0.11698532104492188, 0.12139129638671875, 0.12579727172851562, 0.1302032470703125, 0.13460922241210938, 0.13901519775390625, 0.14342117309570312, 0.1478271484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 9.0, 10.0, 14.0, 15.0, 29.0, 18.0, 22.0, 25.0, 27.0, 37.0, 32.0, 20.0, 31.0, 37.0, 44.0, 40.0, 48.0, 47.0, 39.0, 36.0, 39.0, 27.0, 39.0, 36.0, 24.0, 22.0, 20.0, 23.0, 28.0, 21.0, 22.0, 12.0, 13.0, 9.0, 14.0, 10.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 4.0], "bins": [-0.1370849609375, -0.13332366943359375, -0.1295623779296875, -0.12580108642578125, -0.122039794921875, -0.11827850341796875, -0.1145172119140625, -0.11075592041015625, -0.10699462890625, -0.10323333740234375, -0.0994720458984375, -0.09571075439453125, -0.091949462890625, -0.08818817138671875, -0.0844268798828125, -0.08066558837890625, -0.076904296875, -0.07314300537109375, -0.0693817138671875, -0.06562042236328125, -0.061859130859375, -0.05809783935546875, -0.0543365478515625, -0.05057525634765625, -0.04681396484375, -0.04305267333984375, -0.0392913818359375, -0.03553009033203125, -0.031768798828125, -0.02800750732421875, -0.0242462158203125, -0.02048492431640625, -0.0167236328125, -0.01296234130859375, -0.0092010498046875, -0.00543975830078125, -0.001678466796875, 0.00208282470703125, 0.0058441162109375, 0.00960540771484375, 0.01336669921875, 0.01712799072265625, 0.0208892822265625, 0.02465057373046875, 0.028411865234375, 0.03217315673828125, 0.0359344482421875, 0.03969573974609375, 0.04345703125, 0.04721832275390625, 0.0509796142578125, 0.05474090576171875, 0.058502197265625, 0.06226348876953125, 0.0660247802734375, 0.06978607177734375, 0.07354736328125, 0.07730865478515625, 0.0810699462890625, 0.08483123779296875, 0.088592529296875, 0.09235382080078125, 0.0961151123046875, 0.09987640380859375, 0.1036376953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 6.0, 17.0, 14.0, 25.0, 38.0, 65.0, 94.0, 151.0, 267.0, 512.0, 1005.0, 2017.0, 4531.0, 10589.0, 28232.0, 88856.0, 331504.0, 408122.0, 114465.0, 34774.0, 12975.0, 5323.0, 2386.0, 1205.0, 601.0, 320.0, 191.0, 87.0, 66.0, 39.0, 30.0, 14.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09196853637695312, -0.08927154541015625, -0.08657455444335938, -0.0838775634765625, -0.08118057250976562, -0.07848358154296875, -0.07578659057617188, -0.073089599609375, -0.07039260864257812, -0.06769561767578125, -0.06499862670898438, -0.0623016357421875, -0.059604644775390625, -0.05690765380859375, -0.054210662841796875, -0.051513671875, -0.048816680908203125, -0.04611968994140625, -0.043422698974609375, -0.0407257080078125, -0.038028717041015625, -0.03533172607421875, -0.032634735107421875, -0.029937744140625, -0.027240753173828125, -0.02454376220703125, -0.021846771240234375, -0.0191497802734375, -0.016452789306640625, -0.01375579833984375, -0.011058807373046875, -0.00836181640625, -0.005664825439453125, -0.00296783447265625, -0.000270843505859375, 0.0024261474609375, 0.005123138427734375, 0.00782012939453125, 0.010517120361328125, 0.013214111328125, 0.015911102294921875, 0.01860809326171875, 0.021305084228515625, 0.0240020751953125, 0.026699066162109375, 0.02939605712890625, 0.032093048095703125, 0.0347900390625, 0.037487030029296875, 0.04018402099609375, 0.042881011962890625, 0.0455780029296875, 0.048274993896484375, 0.05097198486328125, 0.053668975830078125, 0.056365966796875, 0.059062957763671875, 0.06175994873046875, 0.06445693969726562, 0.0671539306640625, 0.06985092163085938, 0.07254791259765625, 0.07524490356445312, 0.07794189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 7.0, 12.0, 22.0, 24.0, 28.0, 25.0, 30.0, 47.0, 49.0, 58.0, 61.0, 74.0, 53.0, 58.0, 66.0, 69.0, 50.0, 29.0, 28.0, 26.0, 27.0, 22.0, 25.0, 13.0, 11.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-05, -2.2427178919315338e-05, -2.1608546376228333e-05, -2.0789913833141327e-05, -1.997128129005432e-05, -1.9152648746967316e-05, -1.833401620388031e-05, -1.7515383660793304e-05, -1.66967511177063e-05, -1.5878118574619293e-05, -1.5059486031532288e-05, -1.4240853488445282e-05, -1.3422220945358276e-05, -1.260358840227127e-05, -1.1784955859184265e-05, -1.096632331609726e-05, -1.0147690773010254e-05, -9.329058229923248e-06, -8.510425686836243e-06, -7.691793143749237e-06, -6.8731606006622314e-06, -6.054528057575226e-06, -5.23589551448822e-06, -4.417262971401215e-06, -3.598630428314209e-06, -2.7799978852272034e-06, -1.9613653421401978e-06, -1.1427327990531921e-06, -3.241002559661865e-07, 4.945322871208191e-07, 1.3131648302078247e-06, 2.1317973732948303e-06, 2.950429916381836e-06, 3.7690624594688416e-06, 4.587695002555847e-06, 5.406327545642853e-06, 6.224960088729858e-06, 7.043592631816864e-06, 7.86222517490387e-06, 8.680857717990875e-06, 9.499490261077881e-06, 1.0318122804164886e-05, 1.1136755347251892e-05, 1.1955387890338898e-05, 1.2774020433425903e-05, 1.3592652976512909e-05, 1.4411285519599915e-05, 1.522991806268692e-05, 1.6048550605773926e-05, 1.686718314886093e-05, 1.7685815691947937e-05, 1.8504448235034943e-05, 1.9323080778121948e-05, 2.0141713321208954e-05, 2.096034586429596e-05, 2.1778978407382965e-05, 2.259761095046997e-05, 2.3416243493556976e-05, 2.4234876036643982e-05, 2.5053508579730988e-05, 2.5872141122817993e-05, 2.6690773665905e-05, 2.7509406208992004e-05, 2.832803875207901e-05, 2.9146671295166016e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 16.0, 27.0, 29.0, 51.0, 60.0, 106.0, 178.0, 298.0, 527.0, 958.0, 1897.0, 4298.0, 10687.0, 30707.0, 111962.0, 443395.0, 328322.0, 77061.0, 22753.0, 8177.0, 3413.0, 1654.0, 808.0, 424.0, 238.0, 162.0, 109.0, 70.0, 50.0, 25.0, 20.0, 21.0, 8.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07940673828125, -0.07655715942382812, -0.07370758056640625, -0.07085800170898438, -0.0680084228515625, -0.06515884399414062, -0.06230926513671875, -0.059459686279296875, -0.056610107421875, -0.053760528564453125, -0.05091094970703125, -0.048061370849609375, -0.0452117919921875, -0.042362213134765625, -0.03951263427734375, -0.036663055419921875, -0.0338134765625, -0.030963897705078125, -0.02811431884765625, -0.025264739990234375, -0.0224151611328125, -0.019565582275390625, -0.01671600341796875, -0.013866424560546875, -0.011016845703125, -0.008167266845703125, -0.00531768798828125, -0.002468109130859375, 0.0003814697265625, 0.003231048583984375, 0.00608062744140625, 0.008930206298828125, 0.01177978515625, 0.014629364013671875, 0.01747894287109375, 0.020328521728515625, 0.0231781005859375, 0.026027679443359375, 0.02887725830078125, 0.031726837158203125, 0.034576416015625, 0.037425994873046875, 0.04027557373046875, 0.043125152587890625, 0.0459747314453125, 0.048824310302734375, 0.05167388916015625, 0.054523468017578125, 0.057373046875, 0.060222625732421875, 0.06307220458984375, 0.06592178344726562, 0.0687713623046875, 0.07162094116210938, 0.07447052001953125, 0.07732009887695312, 0.080169677734375, 0.08301925659179688, 0.08586883544921875, 0.08871841430664062, 0.0915679931640625, 0.09441757202148438, 0.09726715087890625, 0.10011672973632812, 0.10296630859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 8.0, 12.0, 17.0, 18.0, 20.0, 23.0, 45.0, 40.0, 62.0, 53.0, 49.0, 58.0, 63.0, 77.0, 59.0, 61.0, 54.0, 46.0, 41.0, 32.0, 33.0, 24.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06341552734375, -0.06151771545410156, -0.059619903564453125, -0.05772209167480469, -0.05582427978515625, -0.05392646789550781, -0.052028656005859375, -0.05013084411621094, -0.0482330322265625, -0.04633522033691406, -0.044437408447265625, -0.04253959655761719, -0.04064178466796875, -0.03874397277832031, -0.036846160888671875, -0.03494834899902344, -0.033050537109375, -0.031152725219726562, -0.029254913330078125, -0.027357101440429688, -0.02545928955078125, -0.023561477661132812, -0.021663665771484375, -0.019765853881835938, -0.0178680419921875, -0.015970230102539062, -0.014072418212890625, -0.012174606323242188, -0.01027679443359375, -0.008378982543945312, -0.006481170654296875, -0.0045833587646484375, -0.002685546875, -0.0007877349853515625, 0.001110076904296875, 0.0030078887939453125, 0.00490570068359375, 0.0068035125732421875, 0.008701324462890625, 0.010599136352539062, 0.0124969482421875, 0.014394760131835938, 0.016292572021484375, 0.018190383911132812, 0.02008819580078125, 0.021986007690429688, 0.023883819580078125, 0.025781631469726562, 0.027679443359375, 0.029577255249023438, 0.031475067138671875, 0.03337287902832031, 0.03527069091796875, 0.03716850280761719, 0.039066314697265625, 0.04096412658691406, 0.0428619384765625, 0.04475975036621094, 0.046657562255859375, 0.04855537414550781, 0.05045318603515625, 0.05235099792480469, 0.054248809814453125, 0.05614662170410156, 0.05804443359375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 20.0, 32.0, 60.0, 94.0, 111.0, 162.0, 147.0, 127.0, 91.0, 70.0, 33.0, 20.0, 9.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5653105974197388, -1.519366979598999, -1.4734232425689697, -1.4274795055389404, -1.3815358877182007, -1.335592269897461, -1.2896485328674316, -1.2437047958374023, -1.1977611780166626, -1.1518175601959229, -1.1058738231658936, -1.0599300861358643, -1.0139864683151245, -0.96804279088974, -0.9220991134643555, -0.876155436038971, -0.8302117586135864, -0.7842680811882019, -0.7383244037628174, -0.6923807263374329, -0.6464370489120483, -0.6004933714866638, -0.5545496940612793, -0.5086060166358948, -0.46266233921051025, -0.41671866178512573, -0.3707749843597412, -0.3248313069343567, -0.27888762950897217, -0.23294395208358765, -0.18700027465820312, -0.1410565972328186, -0.09511303901672363, -0.04916936159133911, -0.00322568416595459, 0.04271799325942993, 0.08866167068481445, 0.13460534811019897, 0.1805490255355835, 0.22649270296096802, 0.27243638038635254, 0.31838005781173706, 0.3643237352371216, 0.4102674126625061, 0.4562110900878906, 0.5021547675132751, 0.5480984449386597, 0.5940421223640442, 0.6399857997894287, 0.6859294772148132, 0.7318731546401978, 0.7778168320655823, 0.8237605094909668, 0.8697041869163513, 0.9156478643417358, 0.9615915417671204, 1.0075352191925049, 1.0534789562225342, 1.099422574043274, 1.1453661918640137, 1.191309928894043, 1.2372536659240723, 1.283197283744812, 1.3291409015655518, 1.375084638595581]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 14.0, 23.0, 24.0, 35.0, 35.0, 36.0, 36.0, 36.0, 48.0, 49.0, 51.0, 47.0, 48.0, 41.0, 46.0, 47.0, 34.0, 34.0, 34.0, 34.0, 32.0, 29.0, 23.0, 20.0, 13.0, 14.0, 9.0, 7.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8134320974349976, -0.7879867553710938, -0.7625414133071899, -0.7370960712432861, -0.7116507291793823, -0.6862053871154785, -0.6607600450515747, -0.6353147029876709, -0.6098693609237671, -0.5844240188598633, -0.5589786767959595, -0.5335333347320557, -0.5080879926681519, -0.48264265060424805, -0.4571973383426666, -0.4317519962787628, -0.4063066840171814, -0.3808613419532776, -0.3554159998893738, -0.32997065782546997, -0.30452531576156616, -0.27907997369766235, -0.25363466143608093, -0.22818931937217712, -0.20274397730827332, -0.1772986352443695, -0.1518532931804657, -0.12640796601772308, -0.10096262395381927, -0.07551728188991547, -0.05007195472717285, -0.024626612663269043, 0.000818789005279541, 0.02626412734389305, 0.05170946568250656, 0.07715480029582977, 0.10260014235973358, 0.1280454844236374, 0.15349081158638, 0.1789361536502838, 0.20438149571418762, 0.22982683777809143, 0.25527217984199524, 0.28071749210357666, 0.30616283416748047, 0.3316081762313843, 0.3570535182952881, 0.3824988603591919, 0.4079442024230957, 0.4333895444869995, 0.4588348865509033, 0.48428022861480713, 0.5097255706787109, 0.5351709127426147, 0.5606162548065186, 0.5860615968704224, 0.6115069389343262, 0.63695228099823, 0.6623976230621338, 0.6878429651260376, 0.7132883071899414, 0.7387336492538452, 0.764178991317749, 0.7896243333816528, 0.8150696158409119]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 18.0, 16.0, 27.0, 36.0, 55.0, 85.0, 142.0, 237.0, 389.0, 664.0, 1113.0, 2017.0, 3946.0, 8124.0, 18769.0, 53958.0, 266129.0, 3533598.0, 222291.0, 48472.0, 17263.0, 7733.0, 3820.0, 2037.0, 1126.0, 746.0, 474.0, 294.0, 208.0, 130.0, 77.0, 78.0, 60.0, 33.0, 21.0, 23.0, 18.0, 8.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.1678466796875, -0.16283035278320312, -0.15781402587890625, -0.15279769897460938, -0.1477813720703125, -0.14276504516601562, -0.13774871826171875, -0.13273239135742188, -0.127716064453125, -0.12269973754882812, -0.11768341064453125, -0.11266708374023438, -0.1076507568359375, -0.10263442993164062, -0.09761810302734375, -0.09260177612304688, -0.08758544921875, -0.08256912231445312, -0.07755279541015625, -0.07253646850585938, -0.0675201416015625, -0.06250381469726562, -0.05748748779296875, -0.052471160888671875, -0.047454833984375, -0.042438507080078125, -0.03742218017578125, -0.032405853271484375, -0.0273895263671875, -0.022373199462890625, -0.01735687255859375, -0.012340545654296875, -0.00732421875, -0.002307891845703125, 0.00270843505859375, 0.007724761962890625, 0.0127410888671875, 0.017757415771484375, 0.02277374267578125, 0.027790069580078125, 0.032806396484375, 0.037822723388671875, 0.04283905029296875, 0.047855377197265625, 0.0528717041015625, 0.057888031005859375, 0.06290435791015625, 0.06792068481445312, 0.07293701171875, 0.07795333862304688, 0.08296966552734375, 0.08798599243164062, 0.0930023193359375, 0.09801864624023438, 0.10303497314453125, 0.10805130004882812, 0.113067626953125, 0.11808395385742188, 0.12310028076171875, 0.12811660766601562, 0.1331329345703125, 0.13814926147460938, 0.14316558837890625, 0.14818191528320312, 0.1531982421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 11.0, 8.0, 15.0, 25.0, 37.0, 33.0, 68.0, 59.0, 67.0, 67.0, 91.0, 69.0, 67.0, 61.0, 71.0, 41.0, 55.0, 39.0, 25.0, 21.0, 15.0, 8.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.04212760925292969, -0.040645599365234375, -0.03916358947753906, -0.03768157958984375, -0.03619956970214844, -0.034717559814453125, -0.03323554992675781, -0.0317535400390625, -0.030271530151367188, -0.028789520263671875, -0.027307510375976562, -0.02582550048828125, -0.024343490600585938, -0.022861480712890625, -0.021379470825195312, -0.0198974609375, -0.018415451049804688, -0.016933441162109375, -0.015451431274414062, -0.01396942138671875, -0.012487411499023438, -0.011005401611328125, -0.009523391723632812, -0.0080413818359375, -0.0065593719482421875, -0.005077362060546875, -0.0035953521728515625, -0.00211334228515625, -0.0006313323974609375, 0.000850677490234375, 0.0023326873779296875, 0.003814697265625, 0.0052967071533203125, 0.006778717041015625, 0.008260726928710938, 0.00974273681640625, 0.011224746704101562, 0.012706756591796875, 0.014188766479492188, 0.0156707763671875, 0.017152786254882812, 0.018634796142578125, 0.020116806030273438, 0.02159881591796875, 0.023080825805664062, 0.024562835693359375, 0.026044845581054688, 0.02752685546875, 0.029008865356445312, 0.030490875244140625, 0.03197288513183594, 0.03345489501953125, 0.03493690490722656, 0.036418914794921875, 0.03790092468261719, 0.0393829345703125, 0.04086494445800781, 0.042346954345703125, 0.04382896423339844, 0.04531097412109375, 0.04679298400878906, 0.048274993896484375, 0.04975700378417969, 0.051239013671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 8.0, 9.0, 17.0, 23.0, 36.0, 49.0, 89.0, 128.0, 199.0, 334.0, 559.0, 958.0, 1670.0, 3036.0, 6347.0, 14384.0, 36850.0, 119816.0, 1028056.0, 2739306.0, 163639.0, 45781.0, 17267.0, 7518.0, 3621.0, 1919.0, 1029.0, 620.0, 369.0, 235.0, 153.0, 78.0, 61.0, 24.0, 32.0, 12.0, 13.0, 16.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.177734375, -0.17281150817871094, -0.16788864135742188, -0.1629657745361328, -0.15804290771484375, -0.1531200408935547, -0.14819717407226562, -0.14327430725097656, -0.1383514404296875, -0.13342857360839844, -0.12850570678710938, -0.12358283996582031, -0.11865997314453125, -0.11373710632324219, -0.10881423950195312, -0.10389137268066406, -0.098968505859375, -0.09404563903808594, -0.08912277221679688, -0.08419990539550781, -0.07927703857421875, -0.07435417175292969, -0.06943130493164062, -0.06450843811035156, -0.0595855712890625, -0.05466270446777344, -0.049739837646484375, -0.04481697082519531, -0.03989410400390625, -0.03497123718261719, -0.030048370361328125, -0.025125503540039062, -0.02020263671875, -0.015279769897460938, -0.010356903076171875, -0.0054340362548828125, -0.00051116943359375, 0.0044116973876953125, 0.009334564208984375, 0.014257431030273438, 0.0191802978515625, 0.024103164672851562, 0.029026031494140625, 0.03394889831542969, 0.03887176513671875, 0.04379463195800781, 0.048717498779296875, 0.05364036560058594, 0.058563232421875, 0.06348609924316406, 0.06840896606445312, 0.07333183288574219, 0.07825469970703125, 0.08317756652832031, 0.08810043334960938, 0.09302330017089844, 0.0979461669921875, 0.10286903381347656, 0.10779190063476562, 0.11271476745605469, 0.11763763427734375, 0.12256050109863281, 0.12748336791992188, 0.13240623474121094, 0.1373291015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 8.0, 9.0, 14.0, 9.0, 22.0, 28.0, 41.0, 56.0, 71.0, 145.0, 244.0, 674.0, 1650.0, 475.0, 206.0, 139.0, 64.0, 56.0, 41.0, 22.0, 24.0, 15.0, 12.0, 9.0, 5.0, 10.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09368896484375, -0.09118175506591797, -0.08867454528808594, -0.0861673355102539, -0.08366012573242188, -0.08115291595458984, -0.07864570617675781, -0.07613849639892578, -0.07363128662109375, -0.07112407684326172, -0.06861686706542969, -0.06610965728759766, -0.06360244750976562, -0.061095237731933594, -0.05858802795410156, -0.05608081817626953, -0.0535736083984375, -0.05106639862060547, -0.04855918884277344, -0.046051979064941406, -0.043544769287109375, -0.041037559509277344, -0.03853034973144531, -0.03602313995361328, -0.03351593017578125, -0.03100872039794922, -0.028501510620117188, -0.025994300842285156, -0.023487091064453125, -0.020979881286621094, -0.018472671508789062, -0.01596546173095703, -0.013458251953125, -0.010951042175292969, -0.008443832397460938, -0.005936622619628906, -0.003429412841796875, -0.0009222030639648438, 0.0015850067138671875, 0.004092216491699219, 0.00659942626953125, 0.009106636047363281, 0.011613845825195312, 0.014121055603027344, 0.016628265380859375, 0.019135475158691406, 0.021642684936523438, 0.02414989471435547, 0.0266571044921875, 0.02916431427001953, 0.03167152404785156, 0.034178733825683594, 0.036685943603515625, 0.039193153381347656, 0.04170036315917969, 0.04420757293701172, 0.04671478271484375, 0.04922199249267578, 0.05172920227050781, 0.054236412048339844, 0.056743621826171875, 0.059250831604003906, 0.06175804138183594, 0.06426525115966797, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 19.0, 11.0, 21.0, 39.0, 39.0, 78.0, 87.0, 94.0, 119.0, 114.0, 111.0, 83.0, 55.0, 38.0, 30.0, 20.0, 14.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5666863918304443, -0.5516281723976135, -0.5365700125694275, -0.5215117931365967, -0.5064535737037659, -0.49139538407325745, -0.476337194442749, -0.4612789750099182, -0.4462207853794098, -0.43116259574890137, -0.41610437631607056, -0.40104618668556213, -0.3859879970550537, -0.3709297776222229, -0.3558715879917145, -0.34081339836120605, -0.32575517892837524, -0.3106969892978668, -0.295638769865036, -0.2805805802345276, -0.2655223608016968, -0.25046417117118835, -0.23540598154067993, -0.22034777700901031, -0.2052895724773407, -0.19023136794567108, -0.17517316341400146, -0.16011497378349304, -0.14505676925182343, -0.1299985647201538, -0.11494036763906479, -0.09988217055797577, -0.08482396602630615, -0.06976576149463654, -0.054707564413547516, -0.0396493636071682, -0.02459116280078888, -0.009532958269119263, 0.005525238811969757, 0.020583435893058777, 0.035641640424728394, 0.05069984123110771, 0.06575804203748703, 0.08081623911857605, 0.09587444365024567, 0.11093264818191528, 0.1259908378124237, 0.14104904234409332, 0.15610724687576294, 0.17116545140743256, 0.18622365593910217, 0.2012818455696106, 0.2163400501012802, 0.23139825463294983, 0.24645644426345825, 0.26151466369628906, 0.2765728533267975, 0.2916310429573059, 0.3066892623901367, 0.32174745202064514, 0.33680564165115356, 0.3518638610839844, 0.3669220507144928, 0.3819802403450012, 0.39703845977783203]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 10.0, 9.0, 13.0, 19.0, 30.0, 33.0, 21.0, 34.0, 42.0, 45.0, 34.0, 40.0, 37.0, 48.0, 40.0, 40.0, 50.0, 44.0, 34.0, 44.0, 33.0, 54.0, 32.0, 21.0, 25.0, 24.0, 13.0, 20.0, 11.0, 12.0, 9.0, 6.0, 6.0, 11.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2719373106956482, -0.26371222734451294, -0.2554871439933777, -0.24726206064224243, -0.23903697729110718, -0.23081189393997192, -0.22258679568767548, -0.21436171233654022, -0.20613662898540497, -0.19791154563426971, -0.18968646228313446, -0.1814613789319992, -0.17323628067970276, -0.1650111973285675, -0.15678611397743225, -0.148561030626297, -0.14033594727516174, -0.1321108639240265, -0.12388578057289124, -0.11566068977117538, -0.10743560642004013, -0.09921052306890488, -0.09098543226718903, -0.08276034891605377, -0.07453526556491852, -0.06631018221378326, -0.05808509513735771, -0.04986000806093216, -0.041634924709796906, -0.03340984135866165, -0.0251847542822361, -0.016959667205810547, -0.008734583854675293, -0.0005094986408948898, 0.007715586572885513, 0.015940671786665916, 0.02416575700044632, 0.032390840351581573, 0.040615927428007126, 0.04884101450443268, 0.05706609785556793, 0.06529118120670319, 0.07351626455783844, 0.08174135535955429, 0.08996643871068954, 0.0981915220618248, 0.10641661286354065, 0.1146416962146759, 0.12286677956581116, 0.1310918629169464, 0.13931694626808167, 0.14754202961921692, 0.15576711297035217, 0.16399219632148743, 0.17221729457378387, 0.18044237792491913, 0.18866746127605438, 0.19689254462718964, 0.2051176279783249, 0.21334271132946014, 0.2215678095817566, 0.22979289293289185, 0.2380179762840271, 0.24624305963516235, 0.2544681429862976]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 13.0, 14.0, 21.0, 36.0, 65.0, 132.0, 220.0, 356.0, 761.0, 1626.0, 3701.0, 9836.0, 28742.0, 103420.0, 655218.0, 180032.0, 41640.0, 13604.0, 5064.0, 2061.0, 945.0, 491.0, 224.0, 113.0, 86.0, 42.0, 34.0, 22.0, 13.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24778366088867188, -0.24019622802734375, -0.23260879516601562, -0.2250213623046875, -0.21743392944335938, -0.20984649658203125, -0.20225906372070312, -0.194671630859375, -0.18708419799804688, -0.17949676513671875, -0.17190933227539062, -0.1643218994140625, -0.15673446655273438, -0.14914703369140625, -0.14155960083007812, -0.13397216796875, -0.12638473510742188, -0.11879730224609375, -0.11120986938476562, -0.1036224365234375, -0.09603500366210938, -0.08844757080078125, -0.08086013793945312, -0.073272705078125, -0.06568527221679688, -0.05809783935546875, -0.050510406494140625, -0.0429229736328125, -0.035335540771484375, -0.02774810791015625, -0.020160675048828125, -0.0125732421875, -0.004985809326171875, 0.00260162353515625, 0.010189056396484375, 0.0177764892578125, 0.025363922119140625, 0.03295135498046875, 0.040538787841796875, 0.048126220703125, 0.055713653564453125, 0.06330108642578125, 0.07088851928710938, 0.0784759521484375, 0.08606338500976562, 0.09365081787109375, 0.10123825073242188, 0.10882568359375, 0.11641311645507812, 0.12400054931640625, 0.13158798217773438, 0.1391754150390625, 0.14676284790039062, 0.15435028076171875, 0.16193771362304688, 0.169525146484375, 0.17711257934570312, 0.18470001220703125, 0.19228744506835938, 0.1998748779296875, 0.20746231079101562, 0.21504974365234375, 0.22263717651367188, 0.230224609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 9.0, 25.0, 22.0, 30.0, 54.0, 57.0, 86.0, 79.0, 87.0, 79.0, 85.0, 70.0, 71.0, 54.0, 47.0, 32.0, 28.0, 21.0, 10.0, 9.0, 9.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0537109375, -0.0520625114440918, -0.050414085388183594, -0.04876565933227539, -0.04711723327636719, -0.045468807220458984, -0.04382038116455078, -0.04217195510864258, -0.040523529052734375, -0.03887510299682617, -0.03722667694091797, -0.035578250885009766, -0.03392982482910156, -0.03228139877319336, -0.030632972717285156, -0.028984546661376953, -0.02733612060546875, -0.025687694549560547, -0.024039268493652344, -0.02239084243774414, -0.020742416381835938, -0.019093990325927734, -0.01744556427001953, -0.015797138214111328, -0.014148712158203125, -0.012500286102294922, -0.010851860046386719, -0.009203433990478516, -0.0075550079345703125, -0.005906581878662109, -0.004258155822753906, -0.002609729766845703, -0.0009613037109375, 0.0006871223449707031, 0.0023355484008789062, 0.003983974456787109, 0.0056324005126953125, 0.007280826568603516, 0.008929252624511719, 0.010577678680419922, 0.012226104736328125, 0.013874530792236328, 0.015522956848144531, 0.017171382904052734, 0.018819808959960938, 0.02046823501586914, 0.022116661071777344, 0.023765087127685547, 0.02541351318359375, 0.027061939239501953, 0.028710365295410156, 0.03035879135131836, 0.03200721740722656, 0.033655643463134766, 0.03530406951904297, 0.03695249557495117, 0.038600921630859375, 0.04024934768676758, 0.04189777374267578, 0.043546199798583984, 0.04519462585449219, 0.04684305191040039, 0.048491477966308594, 0.0501399040222168, 0.051788330078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 5.0, 9.0, 8.0, 11.0, 14.0, 26.0, 16.0, 36.0, 64.0, 105.0, 134.0, 196.0, 309.0, 564.0, 937.0, 1689.0, 3060.0, 6924.0, 18865.0, 68212.0, 492802.0, 368684.0, 56488.0, 16322.0, 6233.0, 3060.0, 1501.0, 877.0, 483.0, 307.0, 197.0, 120.0, 79.0, 55.0, 40.0, 39.0, 19.0, 13.0, 13.0, 7.0, 12.0, 1.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.2152099609375, -0.20922088623046875, -0.2032318115234375, -0.19724273681640625, -0.191253662109375, -0.18526458740234375, -0.1792755126953125, -0.17328643798828125, -0.16729736328125, -0.16130828857421875, -0.1553192138671875, -0.14933013916015625, -0.143341064453125, -0.13735198974609375, -0.1313629150390625, -0.12537384033203125, -0.119384765625, -0.11339569091796875, -0.1074066162109375, -0.10141754150390625, -0.095428466796875, -0.08943939208984375, -0.0834503173828125, -0.07746124267578125, -0.07147216796875, -0.06548309326171875, -0.0594940185546875, -0.05350494384765625, -0.047515869140625, -0.04152679443359375, -0.0355377197265625, -0.02954864501953125, -0.0235595703125, -0.01757049560546875, -0.0115814208984375, -0.00559234619140625, 0.000396728515625, 0.00638580322265625, 0.0123748779296875, 0.01836395263671875, 0.02435302734375, 0.03034210205078125, 0.0363311767578125, 0.04232025146484375, 0.048309326171875, 0.05429840087890625, 0.0602874755859375, 0.06627655029296875, 0.072265625, 0.07825469970703125, 0.0842437744140625, 0.09023284912109375, 0.096221923828125, 0.10221099853515625, 0.1082000732421875, 0.11418914794921875, 0.12017822265625, 0.12616729736328125, 0.1321563720703125, 0.13814544677734375, 0.144134521484375, 0.15012359619140625, 0.1561126708984375, 0.16210174560546875, 0.1680908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 1.0, 7.0, 10.0, 10.0, 20.0, 21.0, 19.0, 24.0, 28.0, 48.0, 44.0, 51.0, 52.0, 64.0, 70.0, 63.0, 66.0, 57.0, 50.0, 44.0, 52.0, 38.0, 35.0, 32.0, 23.0, 21.0, 10.0, 8.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.15790748596191406, -0.15211868286132812, -0.1463298797607422, -0.14054107666015625, -0.1347522735595703, -0.12896347045898438, -0.12317466735839844, -0.1173858642578125, -0.11159706115722656, -0.10580825805664062, -0.10001945495605469, -0.09423065185546875, -0.08844184875488281, -0.08265304565429688, -0.07686424255371094, -0.071075439453125, -0.06528663635253906, -0.059497833251953125, -0.05370903015136719, -0.04792022705078125, -0.04213142395019531, -0.036342620849609375, -0.030553817749023438, -0.0247650146484375, -0.018976211547851562, -0.013187408447265625, -0.0073986053466796875, -0.00160980224609375, 0.0041790008544921875, 0.009967803955078125, 0.015756607055664062, 0.02154541015625, 0.027334213256835938, 0.033123016357421875, 0.03891181945800781, 0.04470062255859375, 0.05048942565917969, 0.056278228759765625, 0.06206703186035156, 0.0678558349609375, 0.07364463806152344, 0.07943344116210938, 0.08522224426269531, 0.09101104736328125, 0.09679985046386719, 0.10258865356445312, 0.10837745666503906, 0.114166259765625, 0.11995506286621094, 0.12574386596679688, 0.1315326690673828, 0.13732147216796875, 0.1431102752685547, 0.14889907836914062, 0.15468788146972656, 0.1604766845703125, 0.16626548767089844, 0.17205429077148438, 0.1778430938720703, 0.18363189697265625, 0.1894207000732422, 0.19520950317382812, 0.20099830627441406, 0.206787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 18.0, 25.0, 33.0, 57.0, 113.0, 198.0, 341.0, 757.0, 1688.0, 4978.0, 17465.0, 84205.0, 786537.0, 120351.0, 22052.0, 5862.0, 2028.0, 881.0, 409.0, 205.0, 138.0, 65.0, 36.0, 27.0, 18.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.1829833984375, -0.17824077606201172, -0.17349815368652344, -0.16875553131103516, -0.16401290893554688, -0.1592702865600586, -0.1545276641845703, -0.14978504180908203, -0.14504241943359375, -0.14029979705810547, -0.1355571746826172, -0.1308145523071289, -0.12607192993164062, -0.12132930755615234, -0.11658668518066406, -0.11184406280517578, -0.1071014404296875, -0.10235881805419922, -0.09761619567871094, -0.09287357330322266, -0.08813095092773438, -0.0833883285522461, -0.07864570617675781, -0.07390308380126953, -0.06916046142578125, -0.06441783905029297, -0.05967521667480469, -0.054932594299316406, -0.050189971923828125, -0.045447349548339844, -0.04070472717285156, -0.03596210479736328, -0.031219482421875, -0.02647686004638672, -0.021734237670898438, -0.016991615295410156, -0.012248992919921875, -0.007506370544433594, -0.0027637481689453125, 0.0019788742065429688, 0.00672149658203125, 0.011464118957519531, 0.016206741333007812, 0.020949363708496094, 0.025691986083984375, 0.030434608459472656, 0.03517723083496094, 0.03991985321044922, 0.0446624755859375, 0.04940509796142578, 0.05414772033691406, 0.058890342712402344, 0.06363296508789062, 0.0683755874633789, 0.07311820983886719, 0.07786083221435547, 0.08260345458984375, 0.08734607696533203, 0.09208869934082031, 0.0968313217163086, 0.10157394409179688, 0.10631656646728516, 0.11105918884277344, 0.11580181121826172, 0.12054443359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 15.0, 11.0, 17.0, 35.0, 36.0, 66.0, 88.0, 119.0, 135.0, 125.0, 91.0, 69.0, 46.0, 46.0, 30.0, 16.0, 9.0, 14.0, 6.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.37905502319336e-05, -7.21421092748642e-05, -7.04936683177948e-05, -6.88452273607254e-05, -6.7196786403656e-05, -6.554834544658661e-05, -6.389990448951721e-05, -6.225146353244781e-05, -6.060302257537842e-05, -5.895458161830902e-05, -5.7306140661239624e-05, -5.565769970417023e-05, -5.400925874710083e-05, -5.236081779003143e-05, -5.0712376832962036e-05, -4.906393587589264e-05, -4.741549491882324e-05, -4.5767053961753845e-05, -4.411861300468445e-05, -4.247017204761505e-05, -4.0821731090545654e-05, -3.917329013347626e-05, -3.752484917640686e-05, -3.587640821933746e-05, -3.4227967262268066e-05, -3.257952630519867e-05, -3.093108534812927e-05, -2.9282644391059875e-05, -2.763420343399048e-05, -2.598576247692108e-05, -2.4337321519851685e-05, -2.2688880562782288e-05, -2.104043960571289e-05, -1.9391998648643494e-05, -1.7743557691574097e-05, -1.60951167345047e-05, -1.4446675777435303e-05, -1.2798234820365906e-05, -1.1149793863296509e-05, -9.501352906227112e-06, -7.852911949157715e-06, -6.204470992088318e-06, -4.556030035018921e-06, -2.907589077949524e-06, -1.259148120880127e-06, 3.8929283618927e-07, 2.037733793258667e-06, 3.686174750328064e-06, 5.334615707397461e-06, 6.983056664466858e-06, 8.631497621536255e-06, 1.0279938578605652e-05, 1.1928379535675049e-05, 1.3576820492744446e-05, 1.5225261449813843e-05, 1.687370240688324e-05, 1.8522143363952637e-05, 2.0170584321022034e-05, 2.181902527809143e-05, 2.3467466235160828e-05, 2.5115907192230225e-05, 2.676434814929962e-05, 2.841278910636902e-05, 3.0061230063438416e-05, 3.170967102050781e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 10.0, 10.0, 7.0, 14.0, 17.0, 21.0, 50.0, 60.0, 75.0, 128.0, 230.0, 378.0, 763.0, 1654.0, 3824.0, 10677.0, 37318.0, 289773.0, 626041.0, 54570.0, 14077.0, 4716.0, 2033.0, 957.0, 466.0, 272.0, 133.0, 83.0, 52.0, 34.0, 24.0, 34.0, 16.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1181640625, -0.11410713195800781, -0.11005020141601562, -0.10599327087402344, -0.10193634033203125, -0.09787940979003906, -0.09382247924804688, -0.08976554870605469, -0.0857086181640625, -0.08165168762207031, -0.07759475708007812, -0.07353782653808594, -0.06948089599609375, -0.06542396545410156, -0.061367034912109375, -0.05731010437011719, -0.053253173828125, -0.04919624328613281, -0.045139312744140625, -0.04108238220214844, -0.03702545166015625, -0.03296852111816406, -0.028911590576171875, -0.024854660034179688, -0.0207977294921875, -0.016740798950195312, -0.012683868408203125, -0.008626937866210938, -0.00457000732421875, -0.0005130767822265625, 0.003543853759765625, 0.0076007843017578125, 0.01165771484375, 0.015714645385742188, 0.019771575927734375, 0.023828506469726562, 0.02788543701171875, 0.03194236755371094, 0.035999298095703125, 0.04005622863769531, 0.0441131591796875, 0.04817008972167969, 0.052227020263671875, 0.05628395080566406, 0.06034088134765625, 0.06439781188964844, 0.06845474243164062, 0.07251167297363281, 0.076568603515625, 0.08062553405761719, 0.08468246459960938, 0.08873939514160156, 0.09279632568359375, 0.09685325622558594, 0.10091018676757812, 0.10496711730957031, 0.1090240478515625, 0.11308097839355469, 0.11713790893554688, 0.12119483947753906, 0.12525177001953125, 0.12930870056152344, 0.13336563110351562, 0.1374225616455078, 0.1414794921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 15.0, 17.0, 23.0, 30.0, 60.0, 110.0, 218.0, 203.0, 125.0, 59.0, 47.0, 16.0, 21.0, 10.0, 6.0, 11.0, 5.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.1105508804321289, -0.10721015930175781, -0.10386943817138672, -0.10052871704101562, -0.09718799591064453, -0.09384727478027344, -0.09050655364990234, -0.08716583251953125, -0.08382511138916016, -0.08048439025878906, -0.07714366912841797, -0.07380294799804688, -0.07046222686767578, -0.06712150573730469, -0.0637807846069336, -0.0604400634765625, -0.057099342346191406, -0.05375862121582031, -0.05041790008544922, -0.047077178955078125, -0.04373645782470703, -0.04039573669433594, -0.037055015563964844, -0.03371429443359375, -0.030373573303222656, -0.027032852172851562, -0.02369213104248047, -0.020351409912109375, -0.01701068878173828, -0.013669967651367188, -0.010329246520996094, -0.006988525390625, -0.0036478042602539062, -0.0003070831298828125, 0.0030336380004882812, 0.006374359130859375, 0.009715080261230469, 0.013055801391601562, 0.016396522521972656, 0.01973724365234375, 0.023077964782714844, 0.026418685913085938, 0.02975940704345703, 0.033100128173828125, 0.03644084930419922, 0.03978157043457031, 0.043122291564941406, 0.0464630126953125, 0.049803733825683594, 0.05314445495605469, 0.05648517608642578, 0.059825897216796875, 0.06316661834716797, 0.06650733947753906, 0.06984806060791016, 0.07318878173828125, 0.07652950286865234, 0.07987022399902344, 0.08321094512939453, 0.08655166625976562, 0.08989238739013672, 0.09323310852050781, 0.0965738296508789, 0.09991455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 22.0, 35.0, 118.0, 195.0, 223.0, 219.0, 109.0, 46.0, 23.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.665393352508545, -3.5882980823516846, -3.511202573776245, -3.4341073036193848, -3.3570117950439453, -3.279916524887085, -3.2028210163116455, -3.125725746154785, -3.0486302375793457, -2.9715349674224854, -2.894439458847046, -2.8173441886901855, -2.740248680114746, -2.6631534099578857, -2.5860579013824463, -2.508962631225586, -2.4318673610687256, -2.3547720909118652, -2.277676582336426, -2.2005813121795654, -2.123485803604126, -2.0463905334472656, -1.9692951440811157, -1.8921997547149658, -1.815104365348816, -1.738008975982666, -1.6609135866165161, -1.5838181972503662, -1.5067229270935059, -1.4296274185180664, -1.352532148361206, -1.2754367589950562, -1.1983413696289062, -1.1212459802627563, -1.0441505908966064, -0.9670552611351013, -0.8899598717689514, -0.8128644824028015, -0.7357691526412964, -0.6586737632751465, -0.5815783739089966, -0.5044829845428467, -0.42738762497901917, -0.35029226541519165, -0.27319687604904175, -0.19610148668289185, -0.11900612711906433, -0.041910767555236816, 0.035184621810913086, 0.1122799962759018, 0.1893753707408905, 0.266470730304718, 0.3435661196708679, 0.4206615090370178, 0.49775686860084534, 0.5748522281646729, 0.6519476175308228, 0.7290430068969727, 0.8061383962631226, 0.8832337260246277, 0.9603291153907776, 1.0374245643615723, 1.1145198345184326, 1.1916152238845825, 1.2687106132507324]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 8.0, 7.0, 13.0, 14.0, 11.0, 18.0, 30.0, 18.0, 27.0, 25.0, 26.0, 36.0, 28.0, 46.0, 37.0, 44.0, 38.0, 46.0, 30.0, 33.0, 45.0, 40.0, 33.0, 29.0, 28.0, 34.0, 23.0, 35.0, 19.0, 24.0, 23.0, 21.0, 21.0, 12.0, 14.0, 18.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6341946125030518, -0.6144767999649048, -0.5947589874267578, -0.5750411748886108, -0.5553233027458191, -0.5356054902076721, -0.5158876776695251, -0.4961698651313782, -0.4764520525932312, -0.45673424005508423, -0.43701639771461487, -0.4172985851764679, -0.3975807726383209, -0.37786293029785156, -0.3581451177597046, -0.3384273052215576, -0.31870946288108826, -0.2989916503429413, -0.2792738080024719, -0.25955599546432495, -0.23983818292617798, -0.2201203554868698, -0.20040252804756165, -0.18068471550941467, -0.1609668880701065, -0.14124906063079834, -0.12153124809265137, -0.1018134206533432, -0.08209560066461563, -0.06237778067588806, -0.042659953236579895, -0.022942140698432922, -0.003224313259124756, 0.016493508592247963, 0.03621133044362068, 0.05592915415763855, 0.07564697414636612, 0.09536479413509369, 0.11508262157440186, 0.13480043411254883, 0.154518261551857, 0.17423608899116516, 0.19395390152931213, 0.2136717289686203, 0.23338955640792847, 0.25310736894607544, 0.2728251814842224, 0.2925429940223694, 0.31226083636283875, 0.3319786489009857, 0.3516964912414551, 0.37141430377960205, 0.391132116317749, 0.410849928855896, 0.43056777119636536, 0.45028558373451233, 0.4700034260749817, 0.48972123861312866, 0.5094390511512756, 0.5291569232940674, 0.5488747358322144, 0.5685925483703613, 0.5883103609085083, 0.6080281734466553, 0.6277459859848022]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 12.0, 6.0, 8.0, 10.0, 30.0, 32.0, 46.0, 63.0, 119.0, 189.0, 268.0, 515.0, 936.0, 1744.0, 3344.0, 7053.0, 17439.0, 56789.0, 483919.0, 3480138.0, 97432.0, 24990.0, 9582.0, 4376.0, 2267.0, 1163.0, 724.0, 386.0, 224.0, 153.0, 106.0, 65.0, 59.0, 32.0, 14.0, 14.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17600440979003906, -0.16975784301757812, -0.1635112762451172, -0.15726470947265625, -0.1510181427001953, -0.14477157592773438, -0.13852500915527344, -0.1322784423828125, -0.12603187561035156, -0.11978530883789062, -0.11353874206542969, -0.10729217529296875, -0.10104560852050781, -0.09479904174804688, -0.08855247497558594, -0.082305908203125, -0.07605934143066406, -0.06981277465820312, -0.06356620788574219, -0.05731964111328125, -0.05107307434082031, -0.044826507568359375, -0.03857994079589844, -0.0323333740234375, -0.026086807250976562, -0.019840240478515625, -0.013593673706054688, -0.00734710693359375, -0.0011005401611328125, 0.005146026611328125, 0.011392593383789062, 0.01763916015625, 0.023885726928710938, 0.030132293701171875, 0.03637886047363281, 0.04262542724609375, 0.04887199401855469, 0.055118560791015625, 0.06136512756347656, 0.0676116943359375, 0.07385826110839844, 0.08010482788085938, 0.08635139465332031, 0.09259796142578125, 0.09884452819824219, 0.10509109497070312, 0.11133766174316406, 0.117584228515625, 0.12383079528808594, 0.13007736206054688, 0.1363239288330078, 0.14257049560546875, 0.1488170623779297, 0.15506362915039062, 0.16131019592285156, 0.1675567626953125, 0.17380332946777344, 0.18004989624023438, 0.1862964630126953, 0.19254302978515625, 0.1987895965576172, 0.20503616333007812, 0.21128273010253906, 0.217529296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 7.0, 12.0, 24.0, 20.0, 27.0, 57.0, 69.0, 69.0, 67.0, 71.0, 88.0, 64.0, 67.0, 74.0, 69.0, 46.0, 39.0, 43.0, 26.0, 12.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054901123046875, -0.05318927764892578, -0.05147743225097656, -0.049765586853027344, -0.048053741455078125, -0.046341896057128906, -0.04463005065917969, -0.04291820526123047, -0.04120635986328125, -0.03949451446533203, -0.03778266906738281, -0.036070823669433594, -0.034358978271484375, -0.032647132873535156, -0.030935287475585938, -0.02922344207763672, -0.0275115966796875, -0.02579975128173828, -0.024087905883789062, -0.022376060485839844, -0.020664215087890625, -0.018952369689941406, -0.017240524291992188, -0.015528678894042969, -0.01381683349609375, -0.012104988098144531, -0.010393142700195312, -0.008681297302246094, -0.006969451904296875, -0.005257606506347656, -0.0035457611083984375, -0.0018339157104492188, -0.0001220703125, 0.0015897750854492188, 0.0033016204833984375, 0.005013465881347656, 0.006725311279296875, 0.008437156677246094, 0.010149002075195312, 0.011860847473144531, 0.01357269287109375, 0.015284538269042969, 0.016996383666992188, 0.018708229064941406, 0.020420074462890625, 0.022131919860839844, 0.023843765258789062, 0.02555561065673828, 0.0272674560546875, 0.02897930145263672, 0.030691146850585938, 0.032402992248535156, 0.034114837646484375, 0.035826683044433594, 0.03753852844238281, 0.03925037384033203, 0.04096221923828125, 0.04267406463623047, 0.04438591003417969, 0.046097755432128906, 0.047809600830078125, 0.049521446228027344, 0.05123329162597656, 0.05294513702392578, 0.054656982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 14.0, 14.0, 17.0, 28.0, 45.0, 51.0, 80.0, 91.0, 131.0, 212.0, 287.0, 455.0, 687.0, 1176.0, 2066.0, 3939.0, 9040.0, 23641.0, 77256.0, 793258.0, 3117565.0, 111864.0, 29770.0, 11495.0, 4957.0, 2401.0, 1371.0, 816.0, 513.0, 310.0, 223.0, 142.0, 102.0, 72.0, 38.0, 40.0, 28.0, 22.0, 15.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.2106800079345703, -0.20431900024414062, -0.19795799255371094, -0.19159698486328125, -0.18523597717285156, -0.17887496948242188, -0.1725139617919922, -0.1661529541015625, -0.1597919464111328, -0.15343093872070312, -0.14706993103027344, -0.14070892333984375, -0.13434791564941406, -0.12798690795898438, -0.12162590026855469, -0.115264892578125, -0.10890388488769531, -0.10254287719726562, -0.09618186950683594, -0.08982086181640625, -0.08345985412597656, -0.07709884643554688, -0.07073783874511719, -0.0643768310546875, -0.05801582336425781, -0.051654815673828125, -0.04529380798339844, -0.03893280029296875, -0.03257179260253906, -0.026210784912109375, -0.019849777221679688, -0.01348876953125, -0.0071277618408203125, -0.000766754150390625, 0.0055942535400390625, 0.01195526123046875, 0.018316268920898438, 0.024677276611328125, 0.031038284301757812, 0.0373992919921875, 0.04376029968261719, 0.050121307373046875, 0.05648231506347656, 0.06284332275390625, 0.06920433044433594, 0.07556533813476562, 0.08192634582519531, 0.088287353515625, 0.09464836120605469, 0.10100936889648438, 0.10737037658691406, 0.11373138427734375, 0.12009239196777344, 0.12645339965820312, 0.1328144073486328, 0.1391754150390625, 0.1455364227294922, 0.15189743041992188, 0.15825843811035156, 0.16461944580078125, 0.17098045349121094, 0.17734146118164062, 0.1837024688720703, 0.1900634765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 11.0, 11.0, 11.0, 26.0, 27.0, 43.0, 62.0, 164.0, 392.0, 2082.0, 747.0, 218.0, 98.0, 49.0, 38.0, 23.0, 16.0, 8.0, 12.0, 9.0, 6.0, 6.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.1113576889038086, -0.10815238952636719, -0.10494709014892578, -0.10174179077148438, -0.09853649139404297, -0.09533119201660156, -0.09212589263916016, -0.08892059326171875, -0.08571529388427734, -0.08250999450683594, -0.07930469512939453, -0.07609939575195312, -0.07289409637451172, -0.06968879699707031, -0.0664834976196289, -0.0632781982421875, -0.060072898864746094, -0.05686759948730469, -0.05366230010986328, -0.050457000732421875, -0.04725170135498047, -0.04404640197753906, -0.040841102600097656, -0.03763580322265625, -0.034430503845214844, -0.031225204467773438, -0.02801990509033203, -0.024814605712890625, -0.02160930633544922, -0.018404006958007812, -0.015198707580566406, -0.011993408203125, -0.008788108825683594, -0.0055828094482421875, -0.0023775100708007812, 0.000827789306640625, 0.004033088684082031, 0.0072383880615234375, 0.010443687438964844, 0.01364898681640625, 0.016854286193847656, 0.020059585571289062, 0.02326488494873047, 0.026470184326171875, 0.02967548370361328, 0.03288078308105469, 0.036086082458496094, 0.0392913818359375, 0.042496681213378906, 0.04570198059082031, 0.04890727996826172, 0.052112579345703125, 0.05531787872314453, 0.05852317810058594, 0.061728477478027344, 0.06493377685546875, 0.06813907623291016, 0.07134437561035156, 0.07454967498779297, 0.07775497436523438, 0.08096027374267578, 0.08416557312011719, 0.0873708724975586, 0.090576171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 13.0, 15.0, 21.0, 45.0, 64.0, 88.0, 112.0, 141.0, 144.0, 118.0, 104.0, 45.0, 31.0, 25.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5436254143714905, -0.526502788066864, -0.5093802213668823, -0.49225762486457825, -0.47513502836227417, -0.4580124020576477, -0.44088980555534363, -0.42376720905303955, -0.4066446125507355, -0.3895220160484314, -0.3723994195461273, -0.35527682304382324, -0.3381541967391968, -0.3210316300392151, -0.3039090037345886, -0.28678640723228455, -0.26966381072998047, -0.2525412142276764, -0.23541861772537231, -0.21829600632190704, -0.20117340981960297, -0.1840508133172989, -0.16692820191383362, -0.14980560541152954, -0.13268300890922546, -0.11556041240692139, -0.09843780845403671, -0.08131520450115204, -0.06419260799884796, -0.047070011496543884, -0.02994740754365921, -0.012824803590774536, 0.004297852516174316, 0.021420452743768692, 0.03854305297136307, 0.05566565319895744, 0.07278825342655182, 0.0899108499288559, 0.10703345388174057, 0.12415605783462524, 0.14127865433692932, 0.1584012508392334, 0.17552384734153748, 0.19264645874500275, 0.20976905524730682, 0.2268916517496109, 0.24401426315307617, 0.26113685965538025, 0.2782594561576843, 0.2953820526599884, 0.3125046491622925, 0.32962724566459656, 0.34674984216690063, 0.3638724684715271, 0.3809950649738312, 0.39811766147613525, 0.41524025797843933, 0.4323628544807434, 0.4494854509830475, 0.46660804748535156, 0.483730673789978, 0.5008532404899597, 0.5179758667945862, 0.5350984334945679, 0.5522210597991943]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 10.0, 16.0, 14.0, 10.0, 18.0, 23.0, 34.0, 26.0, 24.0, 28.0, 36.0, 40.0, 34.0, 28.0, 28.0, 47.0, 32.0, 38.0, 43.0, 46.0, 40.0, 22.0, 39.0, 31.0, 30.0, 41.0, 30.0, 20.0, 28.0, 17.0, 15.0, 18.0, 14.0, 11.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.20087182521820068, -0.19409941136837006, -0.18732699751853943, -0.1805545836687088, -0.17378216981887817, -0.16700975596904755, -0.16023734211921692, -0.1534649133682251, -0.14669251441955566, -0.13992010056972504, -0.1331476867198944, -0.12637527287006378, -0.11960285902023315, -0.11283044517040253, -0.1060580238699913, -0.09928561002016068, -0.09251318871974945, -0.08574077486991882, -0.0789683610200882, -0.07219594717025757, -0.06542353332042694, -0.058651115745306015, -0.05187869817018509, -0.04510628432035446, -0.038333870470523834, -0.03156145662069321, -0.02478904090821743, -0.018016625195741653, -0.011244211345911026, -0.0044717974960803986, 0.0023006200790405273, 0.009073033928871155, 0.015845447778701782, 0.02261786162853241, 0.029390277341008186, 0.03616269305348396, 0.04293510690331459, 0.04970752075314522, 0.056479938328266144, 0.06325235217809677, 0.0700247660279274, 0.07679717987775803, 0.08356959372758865, 0.09034201502799988, 0.0971144288778305, 0.10388684272766113, 0.11065925657749176, 0.11743167042732239, 0.12420408427715302, 0.13097649812698364, 0.13774891197681427, 0.1445213258266449, 0.15129373967647552, 0.15806615352630615, 0.16483858227729797, 0.1716109812259674, 0.17838340997695923, 0.18515582382678986, 0.19192823767662048, 0.1987006515264511, 0.20547306537628174, 0.21224547922611237, 0.219017893075943, 0.22579032182693481, 0.23256272077560425]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 12.0, 35.0, 53.0, 79.0, 140.0, 315.0, 619.0, 1513.0, 3970.0, 11566.0, 39863.0, 219009.0, 650165.0, 87400.0, 22470.0, 7053.0, 2485.0, 879.0, 426.0, 204.0, 115.0, 64.0, 37.0, 30.0, 15.0, 11.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.2386474609375, -0.23168373107910156, -0.22472000122070312, -0.2177562713623047, -0.21079254150390625, -0.2038288116455078, -0.19686508178710938, -0.18990135192871094, -0.1829376220703125, -0.17597389221191406, -0.16901016235351562, -0.1620464324951172, -0.15508270263671875, -0.1481189727783203, -0.14115524291992188, -0.13419151306152344, -0.127227783203125, -0.12026405334472656, -0.11330032348632812, -0.10633659362792969, -0.09937286376953125, -0.09240913391113281, -0.08544540405273438, -0.07848167419433594, -0.0715179443359375, -0.06455421447753906, -0.057590484619140625, -0.05062675476074219, -0.04366302490234375, -0.03669929504394531, -0.029735565185546875, -0.022771835327148438, -0.01580810546875, -0.008844375610351562, -0.001880645751953125, 0.0050830841064453125, 0.01204681396484375, 0.019010543823242188, 0.025974273681640625, 0.03293800354003906, 0.0399017333984375, 0.04686546325683594, 0.053829193115234375, 0.06079292297363281, 0.06775665283203125, 0.07472038269042969, 0.08168411254882812, 0.08864784240722656, 0.095611572265625, 0.10257530212402344, 0.10953903198242188, 0.11650276184082031, 0.12346649169921875, 0.1304302215576172, 0.13739395141601562, 0.14435768127441406, 0.1513214111328125, 0.15828514099121094, 0.16524887084960938, 0.1722126007080078, 0.17917633056640625, 0.1861400604248047, 0.19310379028320312, 0.20006752014160156, 0.20703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 24.0, 19.0, 27.0, 50.0, 54.0, 60.0, 55.0, 88.0, 77.0, 65.0, 82.0, 77.0, 73.0, 46.0, 52.0, 35.0, 23.0, 16.0, 14.0, 13.0, 6.0, 5.0, 7.0, 0.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.060821533203125, -0.059103965759277344, -0.05738639831542969, -0.05566883087158203, -0.053951263427734375, -0.05223369598388672, -0.05051612854003906, -0.048798561096191406, -0.04708099365234375, -0.045363426208496094, -0.04364585876464844, -0.04192829132080078, -0.040210723876953125, -0.03849315643310547, -0.03677558898925781, -0.035058021545410156, -0.0333404541015625, -0.031622886657714844, -0.029905319213867188, -0.02818775177001953, -0.026470184326171875, -0.02475261688232422, -0.023035049438476562, -0.021317481994628906, -0.01959991455078125, -0.017882347106933594, -0.016164779663085938, -0.014447212219238281, -0.012729644775390625, -0.011012077331542969, -0.009294509887695312, -0.007576942443847656, -0.005859375, -0.004141807556152344, -0.0024242401123046875, -0.0007066726684570312, 0.001010894775390625, 0.0027284622192382812, 0.0044460296630859375, 0.006163597106933594, 0.00788116455078125, 0.009598731994628906, 0.011316299438476562, 0.013033866882324219, 0.014751434326171875, 0.01646900177001953, 0.018186569213867188, 0.019904136657714844, 0.0216217041015625, 0.023339271545410156, 0.025056838989257812, 0.02677440643310547, 0.028491973876953125, 0.03020954132080078, 0.03192710876464844, 0.033644676208496094, 0.03536224365234375, 0.037079811096191406, 0.03879737854003906, 0.04051494598388672, 0.042232513427734375, 0.04395008087158203, 0.04566764831542969, 0.047385215759277344, 0.049102783203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 19.0, 27.0, 50.0, 107.0, 148.0, 324.0, 704.0, 1514.0, 3723.0, 9594.0, 28763.0, 121474.0, 753297.0, 90183.0, 24438.0, 8393.0, 3203.0, 1320.0, 573.0, 283.0, 158.0, 90.0, 59.0, 29.0, 24.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.22017860412597656, -0.21269607543945312, -0.2052135467529297, -0.19773101806640625, -0.1902484893798828, -0.18276596069335938, -0.17528343200683594, -0.1678009033203125, -0.16031837463378906, -0.15283584594726562, -0.1453533172607422, -0.13787078857421875, -0.1303882598876953, -0.12290573120117188, -0.11542320251464844, -0.107940673828125, -0.10045814514160156, -0.09297561645507812, -0.08549308776855469, -0.07801055908203125, -0.07052803039550781, -0.06304550170898438, -0.05556297302246094, -0.0480804443359375, -0.04059791564941406, -0.033115386962890625, -0.025632858276367188, -0.01815032958984375, -0.010667800903320312, -0.003185272216796875, 0.0042972564697265625, 0.01177978515625, 0.019262313842773438, 0.026744842529296875, 0.03422737121582031, 0.04170989990234375, 0.04919242858886719, 0.056674957275390625, 0.06415748596191406, 0.0716400146484375, 0.07912254333496094, 0.08660507202148438, 0.09408760070800781, 0.10157012939453125, 0.10905265808105469, 0.11653518676757812, 0.12401771545410156, 0.131500244140625, 0.13898277282714844, 0.14646530151367188, 0.1539478302001953, 0.16143035888671875, 0.1689128875732422, 0.17639541625976562, 0.18387794494628906, 0.1913604736328125, 0.19884300231933594, 0.20632553100585938, 0.2138080596923828, 0.22129058837890625, 0.2287731170654297, 0.23625564575195312, 0.24373817443847656, 0.251220703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 8.0, 11.0, 20.0, 23.0, 37.0, 30.0, 46.0, 42.0, 63.0, 63.0, 78.0, 75.0, 65.0, 67.0, 62.0, 63.0, 41.0, 46.0, 22.0, 27.0, 24.0, 23.0, 12.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.277587890625, -0.2702445983886719, -0.26290130615234375, -0.2555580139160156, -0.2482147216796875, -0.24087142944335938, -0.23352813720703125, -0.22618484497070312, -0.218841552734375, -0.21149826049804688, -0.20415496826171875, -0.19681167602539062, -0.1894683837890625, -0.18212509155273438, -0.17478179931640625, -0.16743850708007812, -0.16009521484375, -0.15275192260742188, -0.14540863037109375, -0.13806533813476562, -0.1307220458984375, -0.12337875366210938, -0.11603546142578125, -0.10869216918945312, -0.101348876953125, -0.09400558471679688, -0.08666229248046875, -0.07931900024414062, -0.0719757080078125, -0.06463241577148438, -0.05728912353515625, -0.049945831298828125, -0.0426025390625, -0.035259246826171875, -0.02791595458984375, -0.020572662353515625, -0.0132293701171875, -0.005886077880859375, 0.00145721435546875, 0.008800506591796875, 0.016143798828125, 0.023487091064453125, 0.03083038330078125, 0.038173675537109375, 0.0455169677734375, 0.052860260009765625, 0.06020355224609375, 0.06754684448242188, 0.07489013671875, 0.08223342895507812, 0.08957672119140625, 0.09692001342773438, 0.1042633056640625, 0.11160659790039062, 0.11894989013671875, 0.12629318237304688, 0.133636474609375, 0.14097976684570312, 0.14832305908203125, 0.15566635131835938, 0.1630096435546875, 0.17035293579101562, 0.17769622802734375, 0.18503952026367188, 0.1923828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 5.0, 9.0, 17.0, 17.0, 23.0, 31.0, 56.0, 102.0, 122.0, 203.0, 287.0, 505.0, 931.0, 1755.0, 3780.0, 9428.0, 30452.0, 245933.0, 688643.0, 43933.0, 12698.0, 4802.0, 2144.0, 1053.0, 628.0, 341.0, 208.0, 134.0, 99.0, 64.0, 39.0, 32.0, 23.0, 13.0, 19.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14453125, -0.1395702362060547, -0.13460922241210938, -0.12964820861816406, -0.12468719482421875, -0.11972618103027344, -0.11476516723632812, -0.10980415344238281, -0.1048431396484375, -0.09988212585449219, -0.09492111206054688, -0.08996009826660156, -0.08499908447265625, -0.08003807067871094, -0.07507705688476562, -0.07011604309082031, -0.065155029296875, -0.06019401550292969, -0.055233001708984375, -0.05027198791503906, -0.04531097412109375, -0.04034996032714844, -0.035388946533203125, -0.030427932739257812, -0.0254669189453125, -0.020505905151367188, -0.015544891357421875, -0.010583877563476562, -0.00562286376953125, -0.0006618499755859375, 0.004299163818359375, 0.009260177612304688, 0.01422119140625, 0.019182205200195312, 0.024143218994140625, 0.029104232788085938, 0.03406524658203125, 0.03902626037597656, 0.043987274169921875, 0.04894828796386719, 0.0539093017578125, 0.05887031555175781, 0.06383132934570312, 0.06879234313964844, 0.07375335693359375, 0.07871437072753906, 0.08367538452148438, 0.08863639831542969, 0.093597412109375, 0.09855842590332031, 0.10351943969726562, 0.10848045349121094, 0.11344146728515625, 0.11840248107910156, 0.12336349487304688, 0.1283245086669922, 0.1332855224609375, 0.1382465362548828, 0.14320755004882812, 0.14816856384277344, 0.15312957763671875, 0.15809059143066406, 0.16305160522460938, 0.1680126190185547, 0.1729736328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 6.0, 17.0, 22.0, 37.0, 56.0, 59.0, 81.0, 120.0, 91.0, 103.0, 110.0, 60.0, 52.0, 36.0, 28.0, 25.0, 26.0, 13.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-05, -2.7223490178585052e-05, -2.5836750864982605e-05, -2.4450011551380157e-05, -2.306327223777771e-05, -2.1676532924175262e-05, -2.0289793610572815e-05, -1.8903054296970367e-05, -1.751631498336792e-05, -1.6129575669765472e-05, -1.4742836356163025e-05, -1.3356097042560577e-05, -1.196935772895813e-05, -1.0582618415355682e-05, -9.195879101753235e-06, -7.809139788150787e-06, -6.42240047454834e-06, -5.035661160945892e-06, -3.648921847343445e-06, -2.2621825337409973e-06, -8.754432201385498e-07, 5.112960934638977e-07, 1.8980354070663452e-06, 3.2847747206687927e-06, 4.67151403427124e-06, 6.058253347873688e-06, 7.444992661476135e-06, 8.831731975078583e-06, 1.021847128868103e-05, 1.1605210602283478e-05, 1.2991949915885925e-05, 1.4378689229488373e-05, 1.576542854309082e-05, 1.7152167856693268e-05, 1.8538907170295715e-05, 1.9925646483898163e-05, 2.131238579750061e-05, 2.2699125111103058e-05, 2.4085864424705505e-05, 2.5472603738307953e-05, 2.68593430519104e-05, 2.8246082365512848e-05, 2.9632821679115295e-05, 3.101956099271774e-05, 3.240630030632019e-05, 3.379303961992264e-05, 3.5179778933525085e-05, 3.656651824712753e-05, 3.795325756072998e-05, 3.933999687433243e-05, 4.0726736187934875e-05, 4.211347550153732e-05, 4.350021481513977e-05, 4.488695412874222e-05, 4.6273693442344666e-05, 4.766043275594711e-05, 4.904717206954956e-05, 5.043391138315201e-05, 5.1820650696754456e-05, 5.32073900103569e-05, 5.459412932395935e-05, 5.59808686375618e-05, 5.7367607951164246e-05, 5.875434726476669e-05, 6.014108657836914e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 18.0, 14.0, 23.0, 42.0, 63.0, 88.0, 174.0, 258.0, 483.0, 1031.0, 2180.0, 5203.0, 14883.0, 53522.0, 780202.0, 149692.0, 26030.0, 8193.0, 3275.0, 1515.0, 678.0, 407.0, 217.0, 130.0, 80.0, 52.0, 26.0, 22.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.1596698760986328, -0.15430068969726562, -0.14893150329589844, -0.14356231689453125, -0.13819313049316406, -0.13282394409179688, -0.1274547576904297, -0.1220855712890625, -0.11671638488769531, -0.11134719848632812, -0.10597801208496094, -0.10060882568359375, -0.09523963928222656, -0.08987045288085938, -0.08450126647949219, -0.079132080078125, -0.07376289367675781, -0.06839370727539062, -0.06302452087402344, -0.05765533447265625, -0.05228614807128906, -0.046916961669921875, -0.04154777526855469, -0.0361785888671875, -0.030809402465820312, -0.025440216064453125, -0.020071029663085938, -0.01470184326171875, -0.009332656860351562, -0.003963470458984375, 0.0014057159423828125, 0.00677490234375, 0.012144088745117188, 0.017513275146484375, 0.022882461547851562, 0.02825164794921875, 0.03362083435058594, 0.038990020751953125, 0.04435920715332031, 0.0497283935546875, 0.05509757995605469, 0.060466766357421875, 0.06583595275878906, 0.07120513916015625, 0.07657432556152344, 0.08194351196289062, 0.08731269836425781, 0.092681884765625, 0.09805107116699219, 0.10342025756835938, 0.10878944396972656, 0.11415863037109375, 0.11952781677246094, 0.12489700317382812, 0.1302661895751953, 0.1356353759765625, 0.1410045623779297, 0.14637374877929688, 0.15174293518066406, 0.15711212158203125, 0.16248130798339844, 0.16785049438476562, 0.1732196807861328, 0.1785888671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 26.0, 32.0, 53.0, 110.0, 264.0, 219.0, 103.0, 36.0, 18.0, 21.0, 18.0, 14.0, 5.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.08849048614501953, -0.08378028869628906, -0.0790700912475586, -0.07435989379882812, -0.06964969635009766, -0.06493949890136719, -0.06022930145263672, -0.05551910400390625, -0.05080890655517578, -0.04609870910644531, -0.041388511657714844, -0.036678314208984375, -0.031968116760253906, -0.027257919311523438, -0.02254772186279297, -0.0178375244140625, -0.013127326965332031, -0.008417129516601562, -0.0037069320678710938, 0.001003265380859375, 0.005713462829589844, 0.010423660278320312, 0.015133857727050781, 0.01984405517578125, 0.02455425262451172, 0.029264450073242188, 0.033974647521972656, 0.038684844970703125, 0.043395042419433594, 0.04810523986816406, 0.05281543731689453, 0.057525634765625, 0.06223583221435547, 0.06694602966308594, 0.0716562271118164, 0.07636642456054688, 0.08107662200927734, 0.08578681945800781, 0.09049701690673828, 0.09520721435546875, 0.09991741180419922, 0.10462760925292969, 0.10933780670166016, 0.11404800415039062, 0.1187582015991211, 0.12346839904785156, 0.12817859649658203, 0.1328887939453125, 0.13759899139404297, 0.14230918884277344, 0.1470193862915039, 0.15172958374023438, 0.15643978118896484, 0.1611499786376953, 0.16586017608642578, 0.17057037353515625, 0.17528057098388672, 0.1799907684326172, 0.18470096588134766, 0.18941116333007812, 0.1941213607788086, 0.19883155822753906, 0.20354175567626953, 0.208251953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 18.0, 21.0, 26.0, 40.0, 60.0, 98.0, 95.0, 115.0, 109.0, 108.0, 92.0, 69.0, 40.0, 27.0, 26.0, 14.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2618948221206665, -1.2237956523895264, -1.1856964826583862, -1.1475971937179565, -1.1094980239868164, -1.0713988542556763, -1.0332996845245361, -0.995200514793396, -0.9571012854576111, -0.919002115726471, -0.880902886390686, -0.8428037166595459, -0.8047045469284058, -0.7666053175926208, -0.7285061478614807, -0.6904069185256958, -0.6523077487945557, -0.6142085790634155, -0.5761093497276306, -0.5380101799964905, -0.49991098046302795, -0.46181178092956543, -0.4237126111984253, -0.38561341166496277, -0.34751421213150024, -0.3094150125980377, -0.2713158130645752, -0.23321664333343506, -0.19511744379997253, -0.15701824426651, -0.11891905963420868, -0.08081987500190735, -0.042720675468444824, -0.004621483385562897, 0.03347770869731903, 0.07157690078020096, 0.10967609286308289, 0.1477752923965454, 0.18587447702884674, 0.22397366166114807, 0.2620728611946106, 0.3001720607280731, 0.33827126026153564, 0.3763704299926758, 0.4144696295261383, 0.45256882905960083, 0.49066799879074097, 0.5287672281265259, 0.566866397857666, 0.6049655675888062, 0.6430647969245911, 0.6811639666557312, 0.7192631959915161, 0.7573623657226562, 0.7954615354537964, 0.8335607051849365, 0.8716599345207214, 0.9097591042518616, 0.9478583335876465, 0.9859575033187866, 1.0240566730499268, 1.0621559619903564, 1.1002551317214966, 1.1383543014526367, 1.1764534711837769]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 8.0, 8.0, 18.0, 25.0, 25.0, 13.0, 25.0, 29.0, 23.0, 29.0, 41.0, 30.0, 40.0, 39.0, 36.0, 43.0, 37.0, 41.0, 38.0, 42.0, 40.0, 35.0, 30.0, 34.0, 27.0, 24.0, 29.0, 20.0, 22.0, 18.0, 14.0, 20.0, 17.0, 8.0, 10.0, 10.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.7505302429199219, -0.727845311164856, -0.7051604390144348, -0.6824755072593689, -0.659790575504303, -0.6371057033538818, -0.6144207715988159, -0.59173583984375, -0.5690509080886841, -0.5463659763336182, -0.523681104183197, -0.5009961724281311, -0.4783112406730652, -0.45562633872032166, -0.4329414367675781, -0.4102565050125122, -0.38757163286209106, -0.36488673090934753, -0.3422017991542816, -0.3195168972015381, -0.29683196544647217, -0.27414706349372864, -0.2514621615409851, -0.22877724468708038, -0.20609232783317566, -0.18340741097927094, -0.1607224941253662, -0.13803759217262268, -0.11535267531871796, -0.09266775846481323, -0.0699828565120697, -0.04729793965816498, -0.024613022804260254, -0.0019281096756458282, 0.020756803452968597, 0.043441712856292725, 0.06612662971019745, 0.08881154656410217, 0.1114964485168457, 0.13418136537075043, 0.15686628222465515, 0.17955119907855988, 0.2022361159324646, 0.22492101788520813, 0.24760593473911285, 0.2702908515930176, 0.2929757535457611, 0.31566065549850464, 0.33834558725357056, 0.3610304892063141, 0.38371542096138, 0.40640032291412354, 0.42908525466918945, 0.451770156621933, 0.4744550585746765, 0.49713999032974243, 0.5198248624801636, 0.5425097942352295, 0.5651946663856506, 0.5878795981407166, 0.6105645298957825, 0.6332494020462036, 0.6559343338012695, 0.6786192655563354, 0.7013041973114014]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 12.0, 18.0, 21.0, 41.0, 52.0, 84.0, 159.0, 239.0, 391.0, 648.0, 1203.0, 2378.0, 5116.0, 11864.0, 31627.0, 123389.0, 3584981.0, 344376.0, 54658.0, 17906.0, 7440.0, 3432.0, 1784.0, 937.0, 558.0, 361.0, 212.0, 140.0, 81.0, 69.0, 33.0, 26.0, 21.0, 7.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2828559875488281, -0.27494049072265625, -0.2670249938964844, -0.2591094970703125, -0.2511940002441406, -0.24327850341796875, -0.23536300659179688, -0.227447509765625, -0.21953201293945312, -0.21161651611328125, -0.20370101928710938, -0.1957855224609375, -0.18787002563476562, -0.17995452880859375, -0.17203903198242188, -0.16412353515625, -0.15620803833007812, -0.14829254150390625, -0.14037704467773438, -0.1324615478515625, -0.12454605102539062, -0.11663055419921875, -0.10871505737304688, -0.100799560546875, -0.09288406372070312, -0.08496856689453125, -0.07705307006835938, -0.0691375732421875, -0.061222076416015625, -0.05330657958984375, -0.045391082763671875, -0.0374755859375, -0.029560089111328125, -0.02164459228515625, -0.013729095458984375, -0.0058135986328125, 0.002101898193359375, 0.01001739501953125, 0.017932891845703125, 0.025848388671875, 0.033763885498046875, 0.04167938232421875, 0.049594879150390625, 0.0575103759765625, 0.06542587280273438, 0.07334136962890625, 0.08125686645507812, 0.08917236328125, 0.09708786010742188, 0.10500335693359375, 0.11291885375976562, 0.1208343505859375, 0.12874984741210938, 0.13666534423828125, 0.14458084106445312, 0.152496337890625, 0.16041183471679688, 0.16832733154296875, 0.17624282836914062, 0.1841583251953125, 0.19207382202148438, 0.19998931884765625, 0.20790481567382812, 0.2158203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 9.0, 19.0, 23.0, 30.0, 35.0, 49.0, 53.0, 61.0, 71.0, 64.0, 69.0, 77.0, 63.0, 57.0, 63.0, 61.0, 45.0, 32.0, 22.0, 21.0, 25.0, 10.0, 8.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0576171875, -0.05589008331298828, -0.05416297912597656, -0.052435874938964844, -0.050708770751953125, -0.048981666564941406, -0.04725456237792969, -0.04552745819091797, -0.04380035400390625, -0.04207324981689453, -0.04034614562988281, -0.038619041442871094, -0.036891937255859375, -0.035164833068847656, -0.03343772888183594, -0.03171062469482422, -0.0299835205078125, -0.02825641632080078, -0.026529312133789062, -0.024802207946777344, -0.023075103759765625, -0.021347999572753906, -0.019620895385742188, -0.01789379119873047, -0.01616668701171875, -0.014439582824707031, -0.012712478637695312, -0.010985374450683594, -0.009258270263671875, -0.007531166076660156, -0.0058040618896484375, -0.004076957702636719, -0.002349853515625, -0.0006227493286132812, 0.0011043548583984375, 0.0028314590454101562, 0.004558563232421875, 0.006285667419433594, 0.008012771606445312, 0.009739875793457031, 0.01146697998046875, 0.013194084167480469, 0.014921188354492188, 0.016648292541503906, 0.018375396728515625, 0.020102500915527344, 0.021829605102539062, 0.02355670928955078, 0.0252838134765625, 0.02701091766357422, 0.028738021850585938, 0.030465126037597656, 0.032192230224609375, 0.033919334411621094, 0.03564643859863281, 0.03737354278564453, 0.03910064697265625, 0.04082775115966797, 0.04255485534667969, 0.044281959533691406, 0.046009063720703125, 0.047736167907714844, 0.04946327209472656, 0.05119037628173828, 0.05291748046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 13.0, 21.0, 33.0, 48.0, 60.0, 69.0, 126.0, 145.0, 217.0, 266.0, 432.0, 621.0, 919.0, 1389.0, 2478.0, 4353.0, 8451.0, 17294.0, 39472.0, 113366.0, 743228.0, 3003607.0, 163094.0, 50243.0, 21279.0, 9958.0, 5121.0, 2954.0, 1634.0, 1085.0, 733.0, 451.0, 323.0, 213.0, 174.0, 115.0, 83.0, 68.0, 41.0, 36.0, 16.0, 17.0, 8.0, 12.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2142333984375, -0.2075672149658203, -0.20090103149414062, -0.19423484802246094, -0.18756866455078125, -0.18090248107910156, -0.17423629760742188, -0.1675701141357422, -0.1609039306640625, -0.1542377471923828, -0.14757156372070312, -0.14090538024902344, -0.13423919677734375, -0.12757301330566406, -0.12090682983398438, -0.11424064636230469, -0.107574462890625, -0.10090827941894531, -0.09424209594726562, -0.08757591247558594, -0.08090972900390625, -0.07424354553222656, -0.06757736206054688, -0.06091117858886719, -0.0542449951171875, -0.04757881164550781, -0.040912628173828125, -0.03424644470214844, -0.02758026123046875, -0.020914077758789062, -0.014247894287109375, -0.0075817108154296875, -0.00091552734375, 0.0057506561279296875, 0.012416839599609375, 0.019083023071289062, 0.02574920654296875, 0.03241539001464844, 0.039081573486328125, 0.04574775695800781, 0.0524139404296875, 0.05908012390136719, 0.06574630737304688, 0.07241249084472656, 0.07907867431640625, 0.08574485778808594, 0.09241104125976562, 0.09907722473144531, 0.105743408203125, 0.11240959167480469, 0.11907577514648438, 0.12574195861816406, 0.13240814208984375, 0.13907432556152344, 0.14574050903320312, 0.1524066925048828, 0.1590728759765625, 0.1657390594482422, 0.17240524291992188, 0.17907142639160156, 0.18573760986328125, 0.19240379333496094, 0.19906997680664062, 0.2057361602783203, 0.21240234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 12.0, 17.0, 10.0, 26.0, 30.0, 34.0, 50.0, 92.0, 142.0, 318.0, 2118.0, 687.0, 215.0, 101.0, 63.0, 43.0, 27.0, 21.0, 21.0, 13.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12115478515625, -0.11722278594970703, -0.11329078674316406, -0.1093587875366211, -0.10542678833007812, -0.10149478912353516, -0.09756278991699219, -0.09363079071044922, -0.08969879150390625, -0.08576679229736328, -0.08183479309082031, -0.07790279388427734, -0.07397079467773438, -0.0700387954711914, -0.06610679626464844, -0.06217479705810547, -0.0582427978515625, -0.05431079864501953, -0.05037879943847656, -0.046446800231933594, -0.042514801025390625, -0.038582801818847656, -0.03465080261230469, -0.03071880340576172, -0.02678680419921875, -0.02285480499267578, -0.018922805786132812, -0.014990806579589844, -0.011058807373046875, -0.007126808166503906, -0.0031948089599609375, 0.0007371902465820312, 0.004669189453125, 0.008601188659667969, 0.012533187866210938, 0.016465187072753906, 0.020397186279296875, 0.024329185485839844, 0.028261184692382812, 0.03219318389892578, 0.03612518310546875, 0.04005718231201172, 0.04398918151855469, 0.047921180725097656, 0.051853179931640625, 0.055785179138183594, 0.05971717834472656, 0.06364917755126953, 0.0675811767578125, 0.07151317596435547, 0.07544517517089844, 0.0793771743774414, 0.08330917358398438, 0.08724117279052734, 0.09117317199707031, 0.09510517120361328, 0.09903717041015625, 0.10296916961669922, 0.10690116882324219, 0.11083316802978516, 0.11476516723632812, 0.1186971664428711, 0.12262916564941406, 0.12656116485595703, 0.1304931640625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 12.0, 23.0, 32.0, 58.0, 68.0, 149.0, 152.0, 155.0, 128.0, 93.0, 50.0, 34.0, 20.0, 12.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.161692500114441, -1.1336348056793213, -1.1055772304534912, -1.0775195360183716, -1.0494619607925415, -1.0214042663574219, -0.9933466911315918, -0.9652889966964722, -0.9372313618659973, -0.9091737270355225, -0.8811160922050476, -0.8530584573745728, -0.8250008225440979, -0.796943187713623, -0.7688854932785034, -0.7408278584480286, -0.7127702236175537, -0.6847125887870789, -0.656654953956604, -0.6285973191261292, -0.6005396842956543, -0.5724819898605347, -0.5444244146347046, -0.516366720199585, -0.4883091449737549, -0.46025151014328003, -0.4321938753128052, -0.4041362404823303, -0.3760785758495331, -0.3480209410190582, -0.3199633061885834, -0.29190564155578613, -0.2638480067253113, -0.23579037189483643, -0.20773272216320038, -0.17967508733272552, -0.15161743760108948, -0.12355980277061462, -0.09550216794013977, -0.06744451820850372, -0.03938688337802887, -0.011329242959618568, 0.016728397458791733, 0.044786036014556885, 0.07284367829561234, 0.10090132057666779, 0.12895895540714264, 0.1570166051387787, 0.18507423996925354, 0.2131318747997284, 0.24118952453136444, 0.2692471742630005, 0.29730480909347534, 0.3253624439239502, 0.35342007875442505, 0.3814777135848999, 0.40953534841537476, 0.4375929832458496, 0.46565061807632446, 0.4937082529067993, 0.5217658877372742, 0.549823522567749, 0.5778812170028687, 0.6059388518333435, 0.6339964866638184]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 16.0, 8.0, 13.0, 13.0, 16.0, 18.0, 28.0, 29.0, 30.0, 36.0, 41.0, 30.0, 30.0, 33.0, 44.0, 39.0, 44.0, 24.0, 43.0, 39.0, 41.0, 46.0, 32.0, 32.0, 34.0, 35.0, 27.0, 12.0, 23.0, 20.0, 17.0, 20.0, 11.0, 13.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31650543212890625, -0.3055785298347473, -0.29465165734291077, -0.28372475504875183, -0.2727978527545929, -0.26187095046043396, -0.2509440779685974, -0.24001717567443848, -0.22909027338027954, -0.2181633859872818, -0.20723648369312286, -0.19630959630012512, -0.1853826940059662, -0.17445580661296844, -0.1635289192199707, -0.15260201692581177, -0.14167512953281403, -0.13074824213981628, -0.11982133984565735, -0.1088944524526596, -0.09796755015850067, -0.08704066276550293, -0.07611376792192459, -0.06518687307834625, -0.054259978234767914, -0.043333083391189575, -0.03240618854761124, -0.021479297429323196, -0.010552402585744858, 0.00037449225783348083, 0.011301383376121521, 0.02222827821969986, 0.0331551730632782, 0.04408206790685654, 0.055008962750434875, 0.06593585014343262, 0.07686275243759155, 0.0877896398305893, 0.09871653467416763, 0.10964342951774597, 0.12057032436132431, 0.13149721920490265, 0.1424241065979004, 0.15335100889205933, 0.16427789628505707, 0.175204798579216, 0.18613168597221375, 0.19705858826637268, 0.20798547565937042, 0.21891236305236816, 0.2298392653465271, 0.24076615273952484, 0.2516930401325226, 0.2626199424266815, 0.27354684472084045, 0.284473717212677, 0.29540061950683594, 0.3063275218009949, 0.3172543942928314, 0.32818129658699036, 0.3391081988811493, 0.3500351011753082, 0.3609619736671448, 0.3718888759613037, 0.38281577825546265]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 7.0, 20.0, 35.0, 45.0, 83.0, 114.0, 190.0, 340.0, 628.0, 1089.0, 1839.0, 3468.0, 6724.0, 13066.0, 25445.0, 51796.0, 109006.0, 252804.0, 312747.0, 138824.0, 64764.0, 31834.0, 15997.0, 8267.0, 4160.0, 2236.0, 1230.0, 684.0, 407.0, 237.0, 136.0, 119.0, 62.0, 52.0, 25.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12616539001464844, -0.12183761596679688, -0.11750984191894531, -0.11318206787109375, -0.10885429382324219, -0.10452651977539062, -0.10019874572753906, -0.0958709716796875, -0.09154319763183594, -0.08721542358398438, -0.08288764953613281, -0.07855987548828125, -0.07423210144042969, -0.06990432739257812, -0.06557655334472656, -0.061248779296875, -0.05692100524902344, -0.052593231201171875, -0.04826545715332031, -0.04393768310546875, -0.03960990905761719, -0.035282135009765625, -0.030954360961914062, -0.0266265869140625, -0.022298812866210938, -0.017971038818359375, -0.013643264770507812, -0.00931549072265625, -0.0049877166748046875, -0.000659942626953125, 0.0036678314208984375, 0.00799560546875, 0.012323379516601562, 0.016651153564453125, 0.020978927612304688, 0.02530670166015625, 0.029634475708007812, 0.033962249755859375, 0.03829002380371094, 0.0426177978515625, 0.04694557189941406, 0.051273345947265625, 0.05560111999511719, 0.05992889404296875, 0.06425666809082031, 0.06858444213867188, 0.07291221618652344, 0.077239990234375, 0.08156776428222656, 0.08589553833007812, 0.09022331237792969, 0.09455108642578125, 0.09887886047363281, 0.10320663452148438, 0.10753440856933594, 0.1118621826171875, 0.11618995666503906, 0.12051773071289062, 0.12484550476074219, 0.12917327880859375, 0.1335010528564453, 0.13782882690429688, 0.14215660095214844, 0.146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 26.0, 28.0, 45.0, 32.0, 45.0, 43.0, 42.0, 45.0, 60.0, 59.0, 57.0, 51.0, 50.0, 55.0, 53.0, 50.0, 43.0, 27.0, 31.0, 22.0, 18.0, 25.0, 12.0, 8.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.054351806640625, -0.05274486541748047, -0.05113792419433594, -0.049530982971191406, -0.047924041748046875, -0.046317100524902344, -0.04471015930175781, -0.04310321807861328, -0.04149627685546875, -0.03988933563232422, -0.03828239440917969, -0.036675453186035156, -0.035068511962890625, -0.033461570739746094, -0.03185462951660156, -0.03024768829345703, -0.0286407470703125, -0.02703380584716797, -0.025426864624023438, -0.023819923400878906, -0.022212982177734375, -0.020606040954589844, -0.018999099731445312, -0.01739215850830078, -0.01578521728515625, -0.014178276062011719, -0.012571334838867188, -0.010964393615722656, -0.009357452392578125, -0.007750511169433594, -0.0061435699462890625, -0.004536628723144531, -0.0029296875, -0.0013227462768554688, 0.0002841949462890625, 0.0018911361694335938, 0.003498077392578125, 0.005105018615722656, 0.0067119598388671875, 0.008318901062011719, 0.00992584228515625, 0.011532783508300781, 0.013139724731445312, 0.014746665954589844, 0.016353607177734375, 0.017960548400878906, 0.019567489624023438, 0.02117443084716797, 0.0227813720703125, 0.02438831329345703, 0.025995254516601562, 0.027602195739746094, 0.029209136962890625, 0.030816078186035156, 0.03242301940917969, 0.03402996063232422, 0.03563690185546875, 0.03724384307861328, 0.03885078430175781, 0.040457725524902344, 0.042064666748046875, 0.043671607971191406, 0.04527854919433594, 0.04688549041748047, 0.048492431640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 5.0, 10.0, 14.0, 25.0, 36.0, 53.0, 71.0, 127.0, 210.0, 351.0, 600.0, 1218.0, 2775.0, 7222.0, 24065.0, 91723.0, 486394.0, 334972.0, 69317.0, 18767.0, 5924.0, 2254.0, 970.0, 524.0, 301.0, 214.0, 128.0, 86.0, 50.0, 37.0, 26.0, 22.0, 17.0, 11.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24074363708496094, -0.23319625854492188, -0.2256488800048828, -0.21810150146484375, -0.2105541229248047, -0.20300674438476562, -0.19545936584472656, -0.1879119873046875, -0.18036460876464844, -0.17281723022460938, -0.1652698516845703, -0.15772247314453125, -0.1501750946044922, -0.14262771606445312, -0.13508033752441406, -0.127532958984375, -0.11998558044433594, -0.11243820190429688, -0.10489082336425781, -0.09734344482421875, -0.08979606628417969, -0.08224868774414062, -0.07470130920410156, -0.0671539306640625, -0.05960655212402344, -0.052059173583984375, -0.04451179504394531, -0.03696441650390625, -0.029417037963867188, -0.021869659423828125, -0.014322280883789062, -0.00677490234375, 0.0007724761962890625, 0.008319854736328125, 0.015867233276367188, 0.02341461181640625, 0.030961990356445312, 0.038509368896484375, 0.04605674743652344, 0.0536041259765625, 0.06115150451660156, 0.06869888305664062, 0.07624626159667969, 0.08379364013671875, 0.09134101867675781, 0.09888839721679688, 0.10643577575683594, 0.113983154296875, 0.12153053283691406, 0.12907791137695312, 0.1366252899169922, 0.14417266845703125, 0.1517200469970703, 0.15926742553710938, 0.16681480407714844, 0.1743621826171875, 0.18190956115722656, 0.18945693969726562, 0.1970043182373047, 0.20455169677734375, 0.2120990753173828, 0.21964645385742188, 0.22719383239746094, 0.2347412109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 8.0, 12.0, 10.0, 7.0, 19.0, 12.0, 25.0, 23.0, 26.0, 37.0, 57.0, 40.0, 35.0, 52.0, 58.0, 51.0, 47.0, 45.0, 33.0, 45.0, 40.0, 43.0, 31.0, 49.0, 29.0, 29.0, 24.0, 14.0, 20.0, 14.0, 14.0, 10.0, 5.0, 2.0, 8.0, 4.0, 2.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2196044921875, -0.21320533752441406, -0.20680618286132812, -0.2004070281982422, -0.19400787353515625, -0.1876087188720703, -0.18120956420898438, -0.17481040954589844, -0.1684112548828125, -0.16201210021972656, -0.15561294555664062, -0.1492137908935547, -0.14281463623046875, -0.1364154815673828, -0.13001632690429688, -0.12361717224121094, -0.117218017578125, -0.11081886291503906, -0.10441970825195312, -0.09802055358886719, -0.09162139892578125, -0.08522224426269531, -0.07882308959960938, -0.07242393493652344, -0.0660247802734375, -0.05962562561035156, -0.053226470947265625, -0.04682731628417969, -0.04042816162109375, -0.03402900695800781, -0.027629852294921875, -0.021230697631835938, -0.01483154296875, -0.008432388305664062, -0.002033233642578125, 0.0043659210205078125, 0.01076507568359375, 0.017164230346679688, 0.023563385009765625, 0.029962539672851562, 0.0363616943359375, 0.04276084899902344, 0.049160003662109375, 0.05555915832519531, 0.06195831298828125, 0.06835746765136719, 0.07475662231445312, 0.08115577697753906, 0.087554931640625, 0.09395408630371094, 0.10035324096679688, 0.10675239562988281, 0.11315155029296875, 0.11955070495605469, 0.12594985961914062, 0.13234901428222656, 0.1387481689453125, 0.14514732360839844, 0.15154647827148438, 0.1579456329345703, 0.16434478759765625, 0.1707439422607422, 0.17714309692382812, 0.18354225158691406, 0.18994140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 9.0, 19.0, 27.0, 40.0, 59.0, 106.0, 152.0, 253.0, 388.0, 727.0, 1181.0, 2038.0, 4223.0, 11128.0, 41627.0, 227062.0, 613252.0, 109024.0, 22895.0, 7258.0, 3009.0, 1662.0, 944.0, 541.0, 349.0, 224.0, 121.0, 69.0, 61.0, 29.0, 20.0, 9.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13259315490722656, -0.12773513793945312, -0.12287712097167969, -0.11801910400390625, -0.11316108703613281, -0.10830307006835938, -0.10344505310058594, -0.0985870361328125, -0.09372901916503906, -0.08887100219726562, -0.08401298522949219, -0.07915496826171875, -0.07429695129394531, -0.06943893432617188, -0.06458091735839844, -0.059722900390625, -0.05486488342285156, -0.050006866455078125, -0.04514884948730469, -0.04029083251953125, -0.03543281555175781, -0.030574798583984375, -0.025716781616210938, -0.0208587646484375, -0.016000747680664062, -0.011142730712890625, -0.0062847137451171875, -0.00142669677734375, 0.0034313201904296875, 0.008289337158203125, 0.013147354125976562, 0.01800537109375, 0.022863388061523438, 0.027721405029296875, 0.03257942199707031, 0.03743743896484375, 0.04229545593261719, 0.047153472900390625, 0.05201148986816406, 0.0568695068359375, 0.06172752380371094, 0.06658554077148438, 0.07144355773925781, 0.07630157470703125, 0.08115959167480469, 0.08601760864257812, 0.09087562561035156, 0.095733642578125, 0.10059165954589844, 0.10544967651367188, 0.11030769348144531, 0.11516571044921875, 0.12002372741699219, 0.12488174438476562, 0.12973976135253906, 0.1345977783203125, 0.13945579528808594, 0.14431381225585938, 0.1491718292236328, 0.15402984619140625, 0.1588878631591797, 0.16374588012695312, 0.16860389709472656, 0.1734619140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 9.0, 14.0, 15.0, 23.0, 37.0, 51.0, 43.0, 94.0, 97.0, 148.0, 124.0, 106.0, 73.0, 40.0, 37.0, 33.0, 16.0, 13.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.898143768310547e-05, -3.726687282323837e-05, -3.555230796337128e-05, -3.383774310350418e-05, -3.2123178243637085e-05, -3.040861338376999e-05, -2.8694048523902893e-05, -2.6979483664035797e-05, -2.52649188041687e-05, -2.3550353944301605e-05, -2.183578908443451e-05, -2.0121224224567413e-05, -1.8406659364700317e-05, -1.669209450483322e-05, -1.4977529644966125e-05, -1.326296478509903e-05, -1.1548399925231934e-05, -9.833835065364838e-06, -8.119270205497742e-06, -6.404705345630646e-06, -4.69014048576355e-06, -2.975575625896454e-06, -1.261010766029358e-06, 4.5355409383773804e-07, 2.168118953704834e-06, 3.88268381357193e-06, 5.597248673439026e-06, 7.311813533306122e-06, 9.026378393173218e-06, 1.0740943253040314e-05, 1.245550811290741e-05, 1.4170072972774506e-05, 1.58846378326416e-05, 1.7599202692508698e-05, 1.9313767552375793e-05, 2.102833241224289e-05, 2.2742897272109985e-05, 2.445746213197708e-05, 2.6172026991844177e-05, 2.7886591851711273e-05, 2.960115671157837e-05, 3.1315721571445465e-05, 3.303028643131256e-05, 3.474485129117966e-05, 3.645941615104675e-05, 3.817398101091385e-05, 3.9888545870780945e-05, 4.160311073064804e-05, 4.331767559051514e-05, 4.503224045038223e-05, 4.674680531024933e-05, 4.8461370170116425e-05, 5.017593502998352e-05, 5.1890499889850616e-05, 5.360506474971771e-05, 5.531962960958481e-05, 5.7034194469451904e-05, 5.8748759329319e-05, 6.0463324189186096e-05, 6.217788904905319e-05, 6.389245390892029e-05, 6.560701876878738e-05, 6.732158362865448e-05, 6.903614848852158e-05, 7.075071334838867e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 9.0, 23.0, 36.0, 36.0, 58.0, 95.0, 149.0, 291.0, 466.0, 890.0, 1909.0, 4732.0, 15789.0, 103154.0, 708570.0, 178361.0, 23384.0, 5978.0, 2238.0, 1040.0, 523.0, 284.0, 163.0, 119.0, 63.0, 51.0, 40.0, 28.0, 17.0, 9.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.20532989501953125, -0.1986236572265625, -0.19191741943359375, -0.185211181640625, -0.17850494384765625, -0.1717987060546875, -0.16509246826171875, -0.15838623046875, -0.15167999267578125, -0.1449737548828125, -0.13826751708984375, -0.131561279296875, -0.12485504150390625, -0.1181488037109375, -0.11144256591796875, -0.104736328125, -0.09803009033203125, -0.0913238525390625, -0.08461761474609375, -0.077911376953125, -0.07120513916015625, -0.0644989013671875, -0.05779266357421875, -0.05108642578125, -0.04438018798828125, -0.0376739501953125, -0.03096771240234375, -0.024261474609375, -0.01755523681640625, -0.0108489990234375, -0.00414276123046875, 0.0025634765625, 0.00926971435546875, 0.0159759521484375, 0.02268218994140625, 0.029388427734375, 0.03609466552734375, 0.0428009033203125, 0.04950714111328125, 0.05621337890625, 0.06291961669921875, 0.0696258544921875, 0.07633209228515625, 0.083038330078125, 0.08974456787109375, 0.0964508056640625, 0.10315704345703125, 0.10986328125, 0.11656951904296875, 0.1232757568359375, 0.12998199462890625, 0.136688232421875, 0.14339447021484375, 0.1501007080078125, 0.15680694580078125, 0.16351318359375, 0.17021942138671875, 0.1769256591796875, 0.18363189697265625, 0.190338134765625, 0.19704437255859375, 0.2037506103515625, 0.21045684814453125, 0.2171630859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 9.0, 9.0, 21.0, 32.0, 45.0, 66.0, 111.0, 178.0, 192.0, 117.0, 74.0, 56.0, 20.0, 23.0, 9.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27978515625, -0.2729530334472656, -0.26612091064453125, -0.2592887878417969, -0.2524566650390625, -0.24562454223632812, -0.23879241943359375, -0.23196029663085938, -0.225128173828125, -0.21829605102539062, -0.21146392822265625, -0.20463180541992188, -0.1977996826171875, -0.19096755981445312, -0.18413543701171875, -0.17730331420898438, -0.17047119140625, -0.16363906860351562, -0.15680694580078125, -0.14997482299804688, -0.1431427001953125, -0.13631057739257812, -0.12947845458984375, -0.12264633178710938, -0.115814208984375, -0.10898208618164062, -0.10214996337890625, -0.09531784057617188, -0.0884857177734375, -0.08165359497070312, -0.07482147216796875, -0.06798934936523438, -0.0611572265625, -0.054325103759765625, -0.04749298095703125, -0.040660858154296875, -0.0338287353515625, -0.026996612548828125, -0.02016448974609375, -0.013332366943359375, -0.006500244140625, 0.000331878662109375, 0.00716400146484375, 0.013996124267578125, 0.0208282470703125, 0.027660369873046875, 0.03449249267578125, 0.041324615478515625, 0.04815673828125, 0.054988861083984375, 0.06182098388671875, 0.06865310668945312, 0.0754852294921875, 0.08231735229492188, 0.08914947509765625, 0.09598159790039062, 0.102813720703125, 0.10964584350585938, 0.11647796630859375, 0.12331008911132812, 0.1301422119140625, 0.13697433471679688, 0.14380645751953125, 0.15063858032226562, 0.157470703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 11.0, 4.0, 19.0, 28.0, 68.0, 98.0, 130.0, 153.0, 170.0, 121.0, 97.0, 53.0, 21.0, 17.0, 10.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9270260334014893, -0.8544597625732422, -0.7818934321403503, -0.7093271017074585, -0.6367608308792114, -0.5641945600509644, -0.4916282296180725, -0.41906189918518066, -0.3464956283569336, -0.27392932772636414, -0.20136302709579468, -0.12879672646522522, -0.05623042583465576, 0.016335874795913696, 0.08890217542648315, 0.161468505859375, 0.23403477668762207, 0.30660107731819153, 0.379167377948761, 0.45173367857933044, 0.5242999792098999, 0.596866250038147, 0.6694325804710388, 0.7419989109039307, 0.8145651817321777, 0.8871314525604248, 0.9596977829933167, 1.0322641134262085, 1.1048303842544556, 1.1773966550827026, 1.2499630451202393, 1.3225293159484863, 1.3950955867767334, 1.4676618576049805, 1.5402281284332275, 1.6127945184707642, 1.6853607892990112, 1.7579270601272583, 1.830493450164795, 1.903059720993042, 1.975625991821289, 2.048192262649536, 2.120758533477783, 2.1933248043060303, 2.2658910751342773, 2.3384575843811035, 2.4110238552093506, 2.4835901260375977, 2.5561563968658447, 2.628722667694092, 2.701288938522339, 2.773855209350586, 2.846421718597412, 2.918987989425659, 2.9915542602539062, 3.0641205310821533, 3.1366868019104004, 3.2092530727386475, 3.2818193435668945, 3.3543856143951416, 3.4269518852233887, 3.499518394470215, 3.572084665298462, 3.644650936126709, 3.717217206954956]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 15.0, 7.0, 18.0, 14.0, 17.0, 26.0, 26.0, 24.0, 34.0, 39.0, 42.0, 42.0, 45.0, 37.0, 45.0, 31.0, 43.0, 37.0, 51.0, 45.0, 39.0, 43.0, 31.0, 37.0, 25.0, 29.0, 19.0, 16.0, 13.0, 14.0, 11.0, 8.0, 10.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9620654582977295, -0.9291619658470154, -0.8962584733963013, -0.8633549213409424, -0.8304514288902283, -0.7975479364395142, -0.7646444439888, -0.7317409515380859, -0.698837399482727, -0.6659339070320129, -0.6330304145812988, -0.6001268625259399, -0.5672233700752258, -0.5343198776245117, -0.5014163851737976, -0.4685128927230835, -0.4356094002723694, -0.4027059078216553, -0.3698023855686188, -0.33689889311790466, -0.30399537086486816, -0.27109187841415405, -0.23818838596343994, -0.20528487861156464, -0.17238137125968933, -0.13947786390781403, -0.10657436400651932, -0.07367086410522461, -0.040767356753349304, -0.007863849401473999, 0.025039643049240112, 0.05794315040111542, 0.09084665775299072, 0.12375016510486603, 0.15665367245674133, 0.18955716490745544, 0.22246067225933075, 0.25536417961120605, 0.28826767206192017, 0.3211711645126343, 0.3540746867656708, 0.3869781792163849, 0.4198817014694214, 0.4527851939201355, 0.4856886863708496, 0.5185922384262085, 0.5514956712722778, 0.5843992233276367, 0.6173027157783508, 0.6502062082290649, 0.683109700679779, 0.7160131931304932, 0.748916745185852, 0.7818202376365662, 0.8147237300872803, 0.8476272225379944, 0.8805307149887085, 0.9134342074394226, 0.9463376998901367, 0.9792412519454956, 1.012144684791565, 1.0450482368469238, 1.0779516696929932, 1.110855221748352, 1.143758773803711]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 16.0, 16.0, 17.0, 28.0, 42.0, 56.0, 107.0, 162.0, 234.0, 376.0, 664.0, 1021.0, 1724.0, 3162.0, 6151.0, 12557.0, 28354.0, 82759.0, 571115.0, 3267357.0, 143995.0, 40657.0, 16332.0, 7868.0, 4061.0, 2180.0, 1252.0, 746.0, 436.0, 292.0, 199.0, 104.0, 81.0, 54.0, 35.0, 16.0, 17.0, 15.0, 8.0, 11.0, 4.0, 3.0, 2.0, 4.0], "bins": [-0.255126953125, -0.24861717224121094, -0.24210739135742188, -0.2355976104736328, -0.22908782958984375, -0.2225780487060547, -0.21606826782226562, -0.20955848693847656, -0.2030487060546875, -0.19653892517089844, -0.19002914428710938, -0.1835193634033203, -0.17700958251953125, -0.1704998016357422, -0.16399002075195312, -0.15748023986816406, -0.150970458984375, -0.14446067810058594, -0.13795089721679688, -0.1314411163330078, -0.12493133544921875, -0.11842155456542969, -0.11191177368164062, -0.10540199279785156, -0.0988922119140625, -0.09238243103027344, -0.08587265014648438, -0.07936286926269531, -0.07285308837890625, -0.06634330749511719, -0.059833526611328125, -0.05332374572753906, -0.04681396484375, -0.04030418395996094, -0.033794403076171875, -0.027284622192382812, -0.02077484130859375, -0.014265060424804688, -0.007755279541015625, -0.0012454986572265625, 0.0052642822265625, 0.011774063110351562, 0.018283843994140625, 0.024793624877929688, 0.03130340576171875, 0.03781318664550781, 0.044322967529296875, 0.05083274841308594, 0.057342529296875, 0.06385231018066406, 0.07036209106445312, 0.07687187194824219, 0.08338165283203125, 0.08989143371582031, 0.09640121459960938, 0.10291099548339844, 0.1094207763671875, 0.11593055725097656, 0.12244033813476562, 0.1289501190185547, 0.13545989990234375, 0.1419696807861328, 0.14847946166992188, 0.15498924255371094, 0.1614990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 19.0, 16.0, 25.0, 12.0, 25.0, 40.0, 46.0, 43.0, 63.0, 56.0, 55.0, 49.0, 58.0, 79.0, 64.0, 56.0, 39.0, 42.0, 40.0, 30.0, 36.0, 24.0, 18.0, 11.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061676025390625, -0.05984067916870117, -0.058005332946777344, -0.056169986724853516, -0.05433464050292969, -0.05249929428100586, -0.05066394805908203, -0.0488286018371582, -0.046993255615234375, -0.04515790939331055, -0.04332256317138672, -0.04148721694946289, -0.03965187072753906, -0.037816524505615234, -0.035981178283691406, -0.03414583206176758, -0.03231048583984375, -0.030475139617919922, -0.028639793395996094, -0.026804447174072266, -0.024969100952148438, -0.02313375473022461, -0.02129840850830078, -0.019463062286376953, -0.017627716064453125, -0.015792369842529297, -0.013957023620605469, -0.01212167739868164, -0.010286331176757812, -0.008450984954833984, -0.006615638732910156, -0.004780292510986328, -0.0029449462890625, -0.0011096000671386719, 0.0007257461547851562, 0.0025610923767089844, 0.0043964385986328125, 0.006231784820556641, 0.008067131042480469, 0.009902477264404297, 0.011737823486328125, 0.013573169708251953, 0.015408515930175781, 0.01724386215209961, 0.019079208374023438, 0.020914554595947266, 0.022749900817871094, 0.024585247039794922, 0.02642059326171875, 0.028255939483642578, 0.030091285705566406, 0.031926631927490234, 0.03376197814941406, 0.03559732437133789, 0.03743267059326172, 0.03926801681518555, 0.041103363037109375, 0.0429387092590332, 0.04477405548095703, 0.04660940170288086, 0.04844474792480469, 0.050280094146728516, 0.052115440368652344, 0.05395078659057617, 0.0557861328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 12.0, 10.0, 12.0, 8.0, 16.0, 21.0, 25.0, 42.0, 40.0, 69.0, 131.0, 192.0, 305.0, 625.0, 1363.0, 3455.0, 9920.0, 35411.0, 200222.0, 3631619.0, 252758.0, 40050.0, 11123.0, 3675.0, 1568.0, 657.0, 370.0, 192.0, 128.0, 70.0, 46.0, 29.0, 32.0, 20.0, 9.0, 16.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.455078125, -0.4422760009765625, -0.429473876953125, -0.4166717529296875, -0.40386962890625, -0.3910675048828125, -0.378265380859375, -0.3654632568359375, -0.3526611328125, -0.3398590087890625, -0.327056884765625, -0.3142547607421875, -0.30145263671875, -0.2886505126953125, -0.275848388671875, -0.2630462646484375, -0.250244140625, -0.2374420166015625, -0.224639892578125, -0.2118377685546875, -0.19903564453125, -0.1862335205078125, -0.173431396484375, -0.1606292724609375, -0.1478271484375, -0.1350250244140625, -0.122222900390625, -0.1094207763671875, -0.09661865234375, -0.0838165283203125, -0.071014404296875, -0.0582122802734375, -0.04541015625, -0.0326080322265625, -0.019805908203125, -0.0070037841796875, 0.00579833984375, 0.0186004638671875, 0.031402587890625, 0.0442047119140625, 0.0570068359375, 0.0698089599609375, 0.082611083984375, 0.0954132080078125, 0.10821533203125, 0.1210174560546875, 0.133819580078125, 0.1466217041015625, 0.159423828125, 0.1722259521484375, 0.185028076171875, 0.1978302001953125, 0.21063232421875, 0.2234344482421875, 0.236236572265625, 0.2490386962890625, 0.2618408203125, 0.2746429443359375, 0.287445068359375, 0.3002471923828125, 0.31304931640625, 0.3258514404296875, 0.338653564453125, 0.3514556884765625, 0.3642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 10.0, 17.0, 24.0, 28.0, 37.0, 53.0, 93.0, 226.0, 715.0, 2069.0, 362.0, 173.0, 99.0, 53.0, 37.0, 28.0, 15.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11446571350097656, -0.10820388793945312, -0.10194206237792969, -0.09568023681640625, -0.08941841125488281, -0.08315658569335938, -0.07689476013183594, -0.0706329345703125, -0.06437110900878906, -0.058109283447265625, -0.05184745788574219, -0.04558563232421875, -0.03932380676269531, -0.033061981201171875, -0.026800155639648438, -0.020538330078125, -0.014276504516601562, -0.008014678955078125, -0.0017528533935546875, 0.00450897216796875, 0.010770797729492188, 0.017032623291015625, 0.023294448852539062, 0.0295562744140625, 0.03581809997558594, 0.042079925537109375, 0.04834175109863281, 0.05460357666015625, 0.06086540222167969, 0.06712722778320312, 0.07338905334472656, 0.07965087890625, 0.08591270446777344, 0.09217453002929688, 0.09843635559082031, 0.10469818115234375, 0.11096000671386719, 0.11722183227539062, 0.12348365783691406, 0.1297454833984375, 0.13600730895996094, 0.14226913452148438, 0.1485309600830078, 0.15479278564453125, 0.1610546112060547, 0.16731643676757812, 0.17357826232910156, 0.179840087890625, 0.18610191345214844, 0.19236373901367188, 0.1986255645751953, 0.20488739013671875, 0.2111492156982422, 0.21741104125976562, 0.22367286682128906, 0.2299346923828125, 0.23619651794433594, 0.24245834350585938, 0.2487201690673828, 0.25498199462890625, 0.2612438201904297, 0.2675056457519531, 0.27376747131347656, 0.280029296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 16.0, 24.0, 50.0, 65.0, 96.0, 108.0, 140.0, 148.0, 101.0, 77.0, 41.0, 44.0, 25.0, 20.0, 10.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3025517463684082, -1.2696025371551514, -1.2366533279418945, -1.2037042379379272, -1.1707550287246704, -1.1378058195114136, -1.1048566102981567, -1.0719074010849, -1.0389583110809326, -1.0060091018676758, -0.9730599522590637, -0.9401107430458069, -0.9071615934371948, -0.874212384223938, -0.8412631750106812, -0.8083139657974243, -0.7753647565841675, -0.7424155473709106, -0.7094663977622986, -0.6765171885490417, -0.6435680389404297, -0.6106188297271729, -0.577669620513916, -0.5447204113006592, -0.5117712616920471, -0.47882208228111267, -0.4458729028701782, -0.4129236936569214, -0.37997451424598694, -0.3470253348350525, -0.31407612562179565, -0.2811269462108612, -0.2481778860092163, -0.21522870659828186, -0.18227951228618622, -0.14933031797409058, -0.11638113856315613, -0.08343195915222168, -0.05048276484012604, -0.017533570528030396, 0.015415608882904053, 0.0483647957444191, 0.08131398260593414, 0.11426316946744919, 0.14721235632896423, 0.18016153573989868, 0.21311073005199432, 0.24605992436408997, 0.2790091037750244, 0.31195828318595886, 0.3449074625968933, 0.37785667181015015, 0.4108058512210846, 0.44375503063201904, 0.4767042398452759, 0.5096534490585327, 0.5426025986671448, 0.5755518078804016, 0.6085009574890137, 0.6414501667022705, 0.6743993759155273, 0.7073485255241394, 0.7402977347373962, 0.7732468843460083, 0.8061960935592651]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 14.0, 11.0, 16.0, 27.0, 20.0, 30.0, 19.0, 23.0, 29.0, 30.0, 35.0, 49.0, 46.0, 32.0, 40.0, 44.0, 45.0, 53.0, 36.0, 39.0, 52.0, 40.0, 46.0, 28.0, 18.0, 19.0, 14.0, 17.0, 25.0, 18.0, 12.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5119866728782654, -0.49630919098854065, -0.4806317090988159, -0.4649542570114136, -0.44927677512168884, -0.4335992932319641, -0.41792184114456177, -0.40224435925483704, -0.3865668773651123, -0.3708893954753876, -0.35521191358566284, -0.3395344614982605, -0.32385697960853577, -0.30817949771881104, -0.2925020456314087, -0.27682456374168396, -0.26114708185195923, -0.2454695999622345, -0.22979213297367096, -0.21411466598510742, -0.1984371840953827, -0.18275970220565796, -0.16708223521709442, -0.15140476822853088, -0.13572728633880615, -0.12004981189966202, -0.10437233746051788, -0.08869486302137375, -0.07301738858222961, -0.05733991414308548, -0.041662439703941345, -0.02598496526479721, -0.010307550430297852, 0.005369924008846283, 0.021047398447990417, 0.03672487288713455, 0.052402347326278687, 0.06807982176542282, 0.08375729620456696, 0.09943477064371109, 0.11511224508285522, 0.13078972697257996, 0.1464671939611435, 0.16214466094970703, 0.17782214283943176, 0.1934996247291565, 0.20917709171772003, 0.22485455870628357, 0.2405320405960083, 0.25620952248573303, 0.27188700437545776, 0.2875644564628601, 0.30324193835258484, 0.31891942024230957, 0.3345968723297119, 0.35027435421943665, 0.3659518361091614, 0.3816293179988861, 0.39730679988861084, 0.4129842519760132, 0.4286617338657379, 0.44433921575546265, 0.460016667842865, 0.4756941497325897, 0.49137163162231445]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 10.0, 26.0, 37.0, 65.0, 111.0, 172.0, 314.0, 422.0, 814.0, 1410.0, 2691.0, 5175.0, 10372.0, 21409.0, 46179.0, 104629.0, 225853.0, 295772.0, 181743.0, 80579.0, 36095.0, 16982.0, 8356.0, 4206.0, 2260.0, 1201.0, 674.0, 394.0, 240.0, 140.0, 93.0, 52.0, 31.0, 15.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1383838653564453, -0.13382339477539062, -0.12926292419433594, -0.12470245361328125, -0.12014198303222656, -0.11558151245117188, -0.11102104187011719, -0.1064605712890625, -0.10190010070800781, -0.09733963012695312, -0.09277915954589844, -0.08821868896484375, -0.08365821838378906, -0.07909774780273438, -0.07453727722167969, -0.069976806640625, -0.06541633605957031, -0.060855865478515625, -0.05629539489746094, -0.05173492431640625, -0.04717445373535156, -0.042613983154296875, -0.03805351257324219, -0.0334930419921875, -0.028932571411132812, -0.024372100830078125, -0.019811630249023438, -0.01525115966796875, -0.010690689086914062, -0.006130218505859375, -0.0015697479248046875, 0.00299072265625, 0.0075511932373046875, 0.012111663818359375, 0.016672134399414062, 0.02123260498046875, 0.025793075561523438, 0.030353546142578125, 0.03491401672363281, 0.0394744873046875, 0.04403495788574219, 0.048595428466796875, 0.05315589904785156, 0.05771636962890625, 0.06227684020996094, 0.06683731079101562, 0.07139778137207031, 0.075958251953125, 0.08051872253417969, 0.08507919311523438, 0.08963966369628906, 0.09420013427734375, 0.09876060485839844, 0.10332107543945312, 0.10788154602050781, 0.1124420166015625, 0.11700248718261719, 0.12156295776367188, 0.12612342834472656, 0.13068389892578125, 0.13524436950683594, 0.13980484008789062, 0.1443653106689453, 0.14892578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 9.0, 10.0, 11.0, 18.0, 14.0, 16.0, 22.0, 22.0, 35.0, 44.0, 54.0, 47.0, 47.0, 48.0, 52.0, 64.0, 62.0, 47.0, 52.0, 61.0, 47.0, 29.0, 30.0, 28.0, 22.0, 23.0, 16.0, 22.0, 7.0, 9.0, 11.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053253173828125, -0.0514674186706543, -0.049681663513183594, -0.04789590835571289, -0.04611015319824219, -0.044324398040771484, -0.04253864288330078, -0.04075288772583008, -0.038967132568359375, -0.03718137741088867, -0.03539562225341797, -0.033609867095947266, -0.03182411193847656, -0.03003835678100586, -0.028252601623535156, -0.026466846466064453, -0.02468109130859375, -0.022895336151123047, -0.021109580993652344, -0.01932382583618164, -0.017538070678710938, -0.015752315521240234, -0.013966560363769531, -0.012180805206298828, -0.010395050048828125, -0.008609294891357422, -0.006823539733886719, -0.005037784576416016, -0.0032520294189453125, -0.0014662742614746094, 0.00031948089599609375, 0.002105236053466797, 0.0038909912109375, 0.005676746368408203, 0.007462501525878906, 0.00924825668334961, 0.011034011840820312, 0.012819766998291016, 0.014605522155761719, 0.016391277313232422, 0.018177032470703125, 0.019962787628173828, 0.02174854278564453, 0.023534297943115234, 0.025320053100585938, 0.02710580825805664, 0.028891563415527344, 0.030677318572998047, 0.03246307373046875, 0.03424882888793945, 0.036034584045410156, 0.03782033920288086, 0.03960609436035156, 0.041391849517822266, 0.04317760467529297, 0.04496335983276367, 0.046749114990234375, 0.04853487014770508, 0.05032062530517578, 0.052106380462646484, 0.05389213562011719, 0.05567789077758789, 0.057463645935058594, 0.0592494010925293, 0.06103515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 12.0, 18.0, 11.0, 20.0, 27.0, 34.0, 53.0, 71.0, 118.0, 206.0, 386.0, 593.0, 1374.0, 3443.0, 10386.0, 39918.0, 193196.0, 556755.0, 186670.0, 38916.0, 10153.0, 3300.0, 1325.0, 642.0, 327.0, 209.0, 118.0, 68.0, 53.0, 37.0, 29.0, 10.0, 15.0, 12.0, 3.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.2097339630126953, -0.20181655883789062, -0.19389915466308594, -0.18598175048828125, -0.17806434631347656, -0.17014694213867188, -0.1622295379638672, -0.1543121337890625, -0.1463947296142578, -0.13847732543945312, -0.13055992126464844, -0.12264251708984375, -0.11472511291503906, -0.10680770874023438, -0.09889030456542969, -0.090972900390625, -0.08305549621582031, -0.07513809204101562, -0.06722068786621094, -0.05930328369140625, -0.05138587951660156, -0.043468475341796875, -0.03555107116699219, -0.0276336669921875, -0.019716262817382812, -0.011798858642578125, -0.0038814544677734375, 0.00403594970703125, 0.011953353881835938, 0.019870758056640625, 0.027788162231445312, 0.03570556640625, 0.04362297058105469, 0.051540374755859375, 0.05945777893066406, 0.06737518310546875, 0.07529258728027344, 0.08320999145507812, 0.09112739562988281, 0.0990447998046875, 0.10696220397949219, 0.11487960815429688, 0.12279701232910156, 0.13071441650390625, 0.13863182067871094, 0.14654922485351562, 0.1544666290283203, 0.162384033203125, 0.1703014373779297, 0.17821884155273438, 0.18613624572753906, 0.19405364990234375, 0.20197105407714844, 0.20988845825195312, 0.2178058624267578, 0.2257232666015625, 0.2336406707763672, 0.24155807495117188, 0.24947547912597656, 0.25739288330078125, 0.26531028747558594, 0.2732276916503906, 0.2811450958251953, 0.2890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 15.0, 15.0, 19.0, 20.0, 21.0, 31.0, 29.0, 31.0, 40.0, 40.0, 49.0, 41.0, 49.0, 42.0, 52.0, 46.0, 39.0, 50.0, 30.0, 36.0, 27.0, 40.0, 33.0, 34.0, 27.0, 18.0, 13.0, 11.0, 12.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23513412475585938, -0.22734832763671875, -0.21956253051757812, -0.2117767333984375, -0.20399093627929688, -0.19620513916015625, -0.18841934204101562, -0.180633544921875, -0.17284774780273438, -0.16506195068359375, -0.15727615356445312, -0.1494903564453125, -0.14170455932617188, -0.13391876220703125, -0.12613296508789062, -0.11834716796875, -0.11056137084960938, -0.10277557373046875, -0.09498977661132812, -0.0872039794921875, -0.07941818237304688, -0.07163238525390625, -0.06384658813476562, -0.056060791015625, -0.048274993896484375, -0.04048919677734375, -0.032703399658203125, -0.0249176025390625, -0.017131805419921875, -0.00934600830078125, -0.001560211181640625, 0.0062255859375, 0.014011383056640625, 0.02179718017578125, 0.029582977294921875, 0.0373687744140625, 0.045154571533203125, 0.05294036865234375, 0.060726165771484375, 0.068511962890625, 0.07629776000976562, 0.08408355712890625, 0.09186935424804688, 0.0996551513671875, 0.10744094848632812, 0.11522674560546875, 0.12301254272460938, 0.13079833984375, 0.13858413696289062, 0.14636993408203125, 0.15415573120117188, 0.1619415283203125, 0.16972732543945312, 0.17751312255859375, 0.18529891967773438, 0.193084716796875, 0.20087051391601562, 0.20865631103515625, 0.21644210815429688, 0.2242279052734375, 0.23201370239257812, 0.23979949951171875, 0.24758529663085938, 0.25537109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 4.0, 14.0, 30.0, 40.0, 51.0, 116.0, 145.0, 393.0, 753.0, 2008.0, 7241.0, 71258.0, 848331.0, 105513.0, 8549.0, 2347.0, 897.0, 377.0, 204.0, 91.0, 79.0, 50.0, 14.0, 15.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2839851379394531, -0.27329254150390625, -0.2625999450683594, -0.2519073486328125, -0.24121475219726562, -0.23052215576171875, -0.21982955932617188, -0.209136962890625, -0.19844436645507812, -0.18775177001953125, -0.17705917358398438, -0.1663665771484375, -0.15567398071289062, -0.14498138427734375, -0.13428878784179688, -0.12359619140625, -0.11290359497070312, -0.10221099853515625, -0.09151840209960938, -0.0808258056640625, -0.07013320922851562, -0.05944061279296875, -0.048748016357421875, -0.038055419921875, -0.027362823486328125, -0.01667022705078125, -0.005977630615234375, 0.0047149658203125, 0.015407562255859375, 0.02610015869140625, 0.036792755126953125, 0.0474853515625, 0.058177947998046875, 0.06887054443359375, 0.07956314086914062, 0.0902557373046875, 0.10094833374023438, 0.11164093017578125, 0.12233352661132812, 0.133026123046875, 0.14371871948242188, 0.15441131591796875, 0.16510391235351562, 0.1757965087890625, 0.18648910522460938, 0.19718170166015625, 0.20787429809570312, 0.21856689453125, 0.22925949096679688, 0.23995208740234375, 0.2506446838378906, 0.2613372802734375, 0.2720298767089844, 0.28272247314453125, 0.2934150695800781, 0.304107666015625, 0.3148002624511719, 0.32549285888671875, 0.3361854553222656, 0.3468780517578125, 0.3575706481933594, 0.36826324462890625, 0.3789558410644531, 0.3896484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 14.0, 15.0, 32.0, 35.0, 27.0, 51.0, 47.0, 63.0, 75.0, 80.0, 96.0, 87.0, 68.0, 62.0, 52.0, 38.0, 42.0, 23.0, 18.0, 13.0, 8.0, 11.0, 7.0, 3.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.060434341430664e-05, -4.932191222906113e-05, -4.803948104381561e-05, -4.67570498585701e-05, -4.5474618673324585e-05, -4.419218748807907e-05, -4.290975630283356e-05, -4.162732511758804e-05, -4.034489393234253e-05, -3.9062462747097015e-05, -3.77800315618515e-05, -3.649760037660599e-05, -3.5215169191360474e-05, -3.393273800611496e-05, -3.2650306820869446e-05, -3.136787563562393e-05, -3.0085444450378418e-05, -2.8803013265132904e-05, -2.752058207988739e-05, -2.6238150894641876e-05, -2.4955719709396362e-05, -2.367328852415085e-05, -2.2390857338905334e-05, -2.110842615365982e-05, -1.9825994968414307e-05, -1.8543563783168793e-05, -1.726113259792328e-05, -1.5978701412677765e-05, -1.4696270227432251e-05, -1.3413839042186737e-05, -1.2131407856941223e-05, -1.084897667169571e-05, -9.566545486450195e-06, -8.284114301204681e-06, -7.0016831159591675e-06, -5.7192519307136536e-06, -4.43682074546814e-06, -3.1543895602226257e-06, -1.8719583749771118e-06, -5.895271897315979e-07, 6.92903995513916e-07, 1.97533518075943e-06, 3.257766366004944e-06, 4.540197551250458e-06, 5.822628736495972e-06, 7.105059921741486e-06, 8.387491106987e-06, 9.669922292232513e-06, 1.0952353477478027e-05, 1.2234784662723541e-05, 1.3517215847969055e-05, 1.4799647033214569e-05, 1.6082078218460083e-05, 1.7364509403705597e-05, 1.864694058895111e-05, 1.9929371774196625e-05, 2.121180295944214e-05, 2.2494234144687653e-05, 2.3776665329933167e-05, 2.505909651517868e-05, 2.6341527700424194e-05, 2.7623958885669708e-05, 2.8906390070915222e-05, 3.0188821256160736e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 9.0, 17.0, 24.0, 30.0, 31.0, 59.0, 77.0, 109.0, 170.0, 211.0, 322.0, 439.0, 705.0, 1216.0, 1959.0, 3881.0, 10919.0, 56263.0, 503543.0, 406065.0, 44109.0, 9611.0, 3729.0, 1842.0, 1075.0, 690.0, 445.0, 298.0, 195.0, 121.0, 98.0, 72.0, 41.0, 43.0, 28.0, 15.0, 16.0, 16.0, 11.0, 6.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2283935546875, -0.22124290466308594, -0.21409225463867188, -0.2069416046142578, -0.19979095458984375, -0.1926403045654297, -0.18548965454101562, -0.17833900451660156, -0.1711883544921875, -0.16403770446777344, -0.15688705444335938, -0.1497364044189453, -0.14258575439453125, -0.1354351043701172, -0.12828445434570312, -0.12113380432128906, -0.113983154296875, -0.10683250427246094, -0.09968185424804688, -0.09253120422363281, -0.08538055419921875, -0.07822990417480469, -0.07107925415039062, -0.06392860412597656, -0.0567779541015625, -0.04962730407714844, -0.042476654052734375, -0.03532600402832031, -0.02817535400390625, -0.021024703979492188, -0.013874053955078125, -0.0067234039306640625, 0.00042724609375, 0.0075778961181640625, 0.014728546142578125, 0.021879196166992188, 0.02902984619140625, 0.03618049621582031, 0.043331146240234375, 0.05048179626464844, 0.0576324462890625, 0.06478309631347656, 0.07193374633789062, 0.07908439636230469, 0.08623504638671875, 0.09338569641113281, 0.10053634643554688, 0.10768699645996094, 0.114837646484375, 0.12198829650878906, 0.12913894653320312, 0.1362895965576172, 0.14344024658203125, 0.1505908966064453, 0.15774154663085938, 0.16489219665527344, 0.1720428466796875, 0.17919349670410156, 0.18634414672851562, 0.1934947967529297, 0.20064544677734375, 0.2077960968017578, 0.21494674682617188, 0.22209739685058594, 0.229248046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 29.0, 30.0, 36.0, 55.0, 88.0, 106.0, 151.0, 134.0, 122.0, 68.0, 59.0, 33.0, 19.0, 18.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.16943931579589844, -0.16285324096679688, -0.1562671661376953, -0.14968109130859375, -0.1430950164794922, -0.13650894165039062, -0.12992286682128906, -0.1233367919921875, -0.11675071716308594, -0.11016464233398438, -0.10357856750488281, -0.09699249267578125, -0.09040641784667969, -0.08382034301757812, -0.07723426818847656, -0.070648193359375, -0.06406211853027344, -0.057476043701171875, -0.05088996887207031, -0.04430389404296875, -0.03771781921386719, -0.031131744384765625, -0.024545669555664062, -0.0179595947265625, -0.011373519897460938, -0.004787445068359375, 0.0017986297607421875, 0.00838470458984375, 0.014970779418945312, 0.021556854248046875, 0.028142929077148438, 0.03472900390625, 0.04131507873535156, 0.047901153564453125, 0.05448722839355469, 0.06107330322265625, 0.06765937805175781, 0.07424545288085938, 0.08083152770996094, 0.0874176025390625, 0.09400367736816406, 0.10058975219726562, 0.10717582702636719, 0.11376190185546875, 0.12034797668457031, 0.12693405151367188, 0.13352012634277344, 0.140106201171875, 0.14669227600097656, 0.15327835083007812, 0.1598644256591797, 0.16645050048828125, 0.1730365753173828, 0.17962265014648438, 0.18620872497558594, 0.1927947998046875, 0.19938087463378906, 0.20596694946289062, 0.2125530242919922, 0.21913909912109375, 0.2257251739501953, 0.23231124877929688, 0.23889732360839844, 0.2454833984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 43.0, 66.0, 169.0, 262.0, 242.0, 125.0, 50.0, 27.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.215538501739502, -3.074989080429077, -2.9344396591186523, -2.7938902378082275, -2.6533408164978027, -2.512791395187378, -2.372241973876953, -2.2316925525665283, -2.0911431312561035, -1.9505937099456787, -1.810044288635254, -1.669494867324829, -1.5289454460144043, -1.3883960247039795, -1.2478466033935547, -1.1072971820831299, -0.9667477607727051, -0.8261983394622803, -0.6856489181518555, -0.5450994968414307, -0.40455007553100586, -0.26400065422058105, -0.12345123291015625, 0.017098188400268555, 0.15764760971069336, 0.29819703102111816, 0.43874645233154297, 0.5792958736419678, 0.7198452949523926, 0.8603947162628174, 1.0009441375732422, 1.141493558883667, 1.28204345703125, 1.4225928783416748, 1.5631422996520996, 1.7036917209625244, 1.8442411422729492, 1.984790563583374, 2.125339984893799, 2.2658894062042236, 2.4064388275146484, 2.5469882488250732, 2.687537670135498, 2.828087091445923, 2.9686365127563477, 3.1091859340667725, 3.2497353553771973, 3.390284776687622, 3.530834197998047, 3.6713836193084717, 3.8119330406188965, 3.9524824619293213, 4.093031883239746, 4.23358154296875, 4.374130725860596, 4.514679908752441, 4.655229568481445, 4.795779228210449, 4.936328411102295, 5.076877593994141, 5.2174272537231445, 5.357976913452148, 5.498526096343994, 5.63907527923584, 5.779624938964844]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 10.0, 5.0, 6.0, 14.0, 13.0, 16.0, 11.0, 24.0, 28.0, 16.0, 21.0, 23.0, 19.0, 30.0, 34.0, 25.0, 26.0, 39.0, 34.0, 46.0, 40.0, 41.0, 40.0, 33.0, 37.0, 47.0, 38.0, 28.0, 31.0, 30.0, 30.0, 25.0, 14.0, 17.0, 13.0, 13.0, 8.0, 14.0, 10.0, 8.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0228466987609863, -0.9889925718307495, -0.9551385045051575, -0.9212844371795654, -0.8874303102493286, -0.8535761833190918, -0.8197221159934998, -0.7858680486679077, -0.7520139217376709, -0.7181597948074341, -0.684305727481842, -0.65045166015625, -0.6165975332260132, -0.5827434062957764, -0.5488893389701843, -0.5150352716445923, -0.48118114471435547, -0.44732704758644104, -0.4134729504585266, -0.3796188533306122, -0.34576475620269775, -0.3119106590747833, -0.2780565619468689, -0.24420246481895447, -0.21034836769104004, -0.1764942705631256, -0.14264017343521118, -0.10878607630729675, -0.07493197917938232, -0.041077882051467896, -0.007223784923553467, 0.026630312204360962, 0.06048452854156494, 0.09433862566947937, 0.1281927227973938, 0.16204681992530823, 0.19590091705322266, 0.22975501418113708, 0.2636091113090515, 0.29746320843696594, 0.33131730556488037, 0.3651714026927948, 0.39902549982070923, 0.43287959694862366, 0.4667336940765381, 0.5005878210067749, 0.5344418883323669, 0.568295955657959, 0.6021500825881958, 0.6360042095184326, 0.6698582768440247, 0.7037123441696167, 0.7375664710998535, 0.7714205980300903, 0.8052746653556824, 0.8391287326812744, 0.8729828596115112, 0.906836986541748, 0.9406910538673401, 0.9745451211929321, 1.008399248123169, 1.0422533750534058, 1.0761075019836426, 1.1099615097045898, 1.1438156366348267]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 20.0, 20.0, 23.0, 32.0, 30.0, 59.0, 69.0, 90.0, 115.0, 173.0, 214.0, 289.0, 452.0, 635.0, 1102.0, 2431.0, 6842.0, 32377.0, 4075820.0, 57591.0, 9001.0, 3015.0, 1366.0, 734.0, 467.0, 336.0, 224.0, 172.0, 140.0, 103.0, 63.0, 54.0, 49.0, 38.0, 28.0, 12.0, 12.0, 12.0, 12.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.482421875, -0.4671630859375, -0.451904296875, -0.4366455078125, -0.42138671875, -0.4061279296875, -0.390869140625, -0.3756103515625, -0.3603515625, -0.3450927734375, -0.329833984375, -0.3145751953125, -0.29931640625, -0.2840576171875, -0.268798828125, -0.2535400390625, -0.23828125, -0.2230224609375, -0.207763671875, -0.1925048828125, -0.17724609375, -0.1619873046875, -0.146728515625, -0.1314697265625, -0.1162109375, -0.1009521484375, -0.085693359375, -0.0704345703125, -0.05517578125, -0.0399169921875, -0.024658203125, -0.0093994140625, 0.005859375, 0.0211181640625, 0.036376953125, 0.0516357421875, 0.06689453125, 0.0821533203125, 0.097412109375, 0.1126708984375, 0.1279296875, 0.1431884765625, 0.158447265625, 0.1737060546875, 0.18896484375, 0.2042236328125, 0.219482421875, 0.2347412109375, 0.25, 0.2652587890625, 0.280517578125, 0.2957763671875, 0.31103515625, 0.3262939453125, 0.341552734375, 0.3568115234375, 0.3720703125, 0.3873291015625, 0.402587890625, 0.4178466796875, 0.43310546875, 0.4483642578125, 0.463623046875, 0.4788818359375, 0.494140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 8.0, 13.0, 12.0, 23.0, 16.0, 22.0, 32.0, 41.0, 50.0, 48.0, 39.0, 55.0, 57.0, 69.0, 55.0, 47.0, 52.0, 53.0, 47.0, 40.0, 26.0, 37.0, 35.0, 16.0, 13.0, 18.0, 16.0, 13.0, 12.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.0563507080078125, -0.054351806640625, -0.0523529052734375, -0.05035400390625, -0.0483551025390625, -0.046356201171875, -0.0443572998046875, -0.0423583984375, -0.0403594970703125, -0.038360595703125, -0.0363616943359375, -0.03436279296875, -0.0323638916015625, -0.030364990234375, -0.0283660888671875, -0.0263671875, -0.0243682861328125, -0.022369384765625, -0.0203704833984375, -0.01837158203125, -0.0163726806640625, -0.014373779296875, -0.0123748779296875, -0.0103759765625, -0.0083770751953125, -0.006378173828125, -0.0043792724609375, -0.00238037109375, -0.0003814697265625, 0.001617431640625, 0.0036163330078125, 0.005615234375, 0.0076141357421875, 0.009613037109375, 0.0116119384765625, 0.01361083984375, 0.0156097412109375, 0.017608642578125, 0.0196075439453125, 0.0216064453125, 0.0236053466796875, 0.025604248046875, 0.0276031494140625, 0.02960205078125, 0.0316009521484375, 0.033599853515625, 0.0355987548828125, 0.03759765625, 0.0395965576171875, 0.041595458984375, 0.0435943603515625, 0.04559326171875, 0.0475921630859375, 0.049591064453125, 0.0515899658203125, 0.0535888671875, 0.0555877685546875, 0.057586669921875, 0.0595855712890625, 0.06158447265625, 0.0635833740234375, 0.065582275390625, 0.0675811767578125, 0.069580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 10.0, 12.0, 12.0, 15.0, 19.0, 24.0, 34.0, 39.0, 52.0, 66.0, 76.0, 131.0, 162.0, 248.0, 382.0, 707.0, 1570.0, 4907.0, 33642.0, 4114129.0, 29877.0, 4634.0, 1429.0, 720.0, 407.0, 265.0, 172.0, 113.0, 109.0, 72.0, 53.0, 37.0, 35.0, 22.0, 24.0, 15.0, 10.0, 15.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.82904052734375, -0.7977294921875, -0.76641845703125, -0.735107421875, -0.70379638671875, -0.6724853515625, -0.64117431640625, -0.60986328125, -0.57855224609375, -0.5472412109375, -0.51593017578125, -0.484619140625, -0.45330810546875, -0.4219970703125, -0.39068603515625, -0.359375, -0.32806396484375, -0.2967529296875, -0.26544189453125, -0.234130859375, -0.20281982421875, -0.1715087890625, -0.14019775390625, -0.10888671875, -0.07757568359375, -0.0462646484375, -0.01495361328125, 0.016357421875, 0.04766845703125, 0.0789794921875, 0.11029052734375, 0.1416015625, 0.17291259765625, 0.2042236328125, 0.23553466796875, 0.266845703125, 0.29815673828125, 0.3294677734375, 0.36077880859375, 0.39208984375, 0.42340087890625, 0.4547119140625, 0.48602294921875, 0.517333984375, 0.54864501953125, 0.5799560546875, 0.61126708984375, 0.642578125, 0.67388916015625, 0.7052001953125, 0.73651123046875, 0.767822265625, 0.79913330078125, 0.8304443359375, 0.86175537109375, 0.89306640625, 0.92437744140625, 0.9556884765625, 0.98699951171875, 1.018310546875, 1.04962158203125, 1.0809326171875, 1.11224365234375, 1.1435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 14.0, 20.0, 57.0, 383.0, 3450.0, 81.0, 29.0, 15.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.07790851593017578, -0.07238197326660156, -0.06685543060302734, -0.061328887939453125, -0.055802345275878906, -0.05027580261230469, -0.04474925994873047, -0.03922271728515625, -0.03369617462158203, -0.028169631958007812, -0.022643089294433594, -0.017116546630859375, -0.011590003967285156, -0.0060634613037109375, -0.0005369186401367188, 0.0049896240234375, 0.010516166687011719, 0.016042709350585938, 0.021569252014160156, 0.027095794677734375, 0.032622337341308594, 0.03814888000488281, 0.04367542266845703, 0.04920196533203125, 0.05472850799560547, 0.06025505065917969, 0.0657815933227539, 0.07130813598632812, 0.07683467864990234, 0.08236122131347656, 0.08788776397705078, 0.093414306640625, 0.09894084930419922, 0.10446739196777344, 0.10999393463134766, 0.11552047729492188, 0.1210470199584961, 0.1265735626220703, 0.13210010528564453, 0.13762664794921875, 0.14315319061279297, 0.1486797332763672, 0.1542062759399414, 0.15973281860351562, 0.16525936126708984, 0.17078590393066406, 0.17631244659423828, 0.1818389892578125, 0.18736553192138672, 0.19289207458496094, 0.19841861724853516, 0.20394515991210938, 0.2094717025756836, 0.2149982452392578, 0.22052478790283203, 0.22605133056640625, 0.23157787322998047, 0.2371044158935547, 0.2426309585571289, 0.24815750122070312, 0.25368404388427734, 0.25921058654785156, 0.2647371292114258, 0.270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 23.0, 35.0, 60.0, 93.0, 115.0, 142.0, 145.0, 100.0, 74.0, 47.0, 39.0, 31.0, 19.0, 12.0, 13.0, 10.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5047615766525269, -0.4841006398200989, -0.4634397327899933, -0.4427787959575653, -0.42211785912513733, -0.40145695209503174, -0.38079601526260376, -0.3601350784301758, -0.3394741415977478, -0.3188132047653198, -0.29815229773521423, -0.27749136090278625, -0.2568304240703583, -0.2361695021390915, -0.2155085802078247, -0.19484764337539673, -0.17418673634529114, -0.15352581441402435, -0.13286487758159637, -0.11220395565032959, -0.09154302626848221, -0.07088209688663483, -0.05022117495536804, -0.029560238122940063, -0.008899316191673279, 0.011761611327528954, 0.032422538846731186, 0.05308346450328827, 0.07374439388513565, 0.09440532326698303, 0.11506624519824982, 0.1357271820306778, 0.15638810396194458, 0.17704902589321136, 0.19770996272563934, 0.21837088465690613, 0.2390318214893341, 0.2596927285194397, 0.2803536653518677, 0.30101460218429565, 0.32167553901672363, 0.3423364758491516, 0.3629973828792572, 0.3836583197116852, 0.40431925654411316, 0.42498016357421875, 0.44564110040664673, 0.4663020372390747, 0.4869629442691803, 0.5076238512992859, 0.5282847881317139, 0.5489457249641418, 0.5696066617965698, 0.5902675986289978, 0.6109285354614258, 0.631589412689209, 0.652250349521637, 0.6729112863540649, 0.6935722231864929, 0.7142331600189209, 0.7348940372467041, 0.7555549740791321, 0.7762159109115601, 0.796876847743988, 0.817537784576416]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 11.0, 10.0, 11.0, 14.0, 15.0, 15.0, 20.0, 24.0, 23.0, 13.0, 25.0, 35.0, 23.0, 39.0, 28.0, 34.0, 35.0, 48.0, 37.0, 31.0, 37.0, 35.0, 25.0, 33.0, 28.0, 33.0, 30.0, 19.0, 26.0, 30.0, 24.0, 25.0, 26.0, 24.0, 16.0, 15.0, 19.0, 12.0, 9.0, 9.0, 8.0, 7.0, 3.0, 3.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26647669076919556, -0.2576553225517273, -0.24883392453193665, -0.2400125414133072, -0.23119115829467773, -0.22236977517604828, -0.21354839205741882, -0.20472700893878937, -0.1959056258201599, -0.18708424270153046, -0.178262859582901, -0.16944147646427155, -0.1606200933456421, -0.15179871022701263, -0.14297732710838318, -0.13415594398975372, -0.12533456087112427, -0.11651317775249481, -0.10769179463386536, -0.0988704115152359, -0.09004902839660645, -0.08122764527797699, -0.07240626215934753, -0.06358487904071808, -0.05476349592208862, -0.04594211280345917, -0.03712072968482971, -0.028299346566200256, -0.0194779634475708, -0.010656580328941345, -0.0018351972103118896, 0.006986185908317566, 0.01580756902694702, 0.024628952145576477, 0.03345033526420593, 0.04227171838283539, 0.051093101501464844, 0.0599144846200943, 0.06873586773872375, 0.07755725085735321, 0.08637863397598267, 0.09520001709461212, 0.10402140021324158, 0.11284278333187103, 0.12166416645050049, 0.13048554956912994, 0.1393069326877594, 0.14812831580638885, 0.1569496989250183, 0.16577108204364777, 0.17459246516227722, 0.18341384828090668, 0.19223523139953613, 0.2010566145181656, 0.20987799763679504, 0.2186993807554245, 0.22752076387405396, 0.2363421469926834, 0.24516353011131287, 0.2539849281311035, 0.2628062963485718, 0.27162766456604004, 0.2804490625858307, 0.28927046060562134, 0.2980918288230896]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 6.0, 10.0, 14.0, 16.0, 18.0, 34.0, 41.0, 43.0, 63.0, 101.0, 154.0, 169.0, 218.0, 302.0, 422.0, 567.0, 792.0, 1166.0, 1913.0, 3396.0, 6975.0, 17413.0, 51179.0, 174831.0, 428342.0, 245726.0, 71790.0, 23090.0, 8846.0, 4049.0, 2272.0, 1308.0, 897.0, 634.0, 432.0, 322.0, 266.0, 196.0, 144.0, 91.0, 67.0, 55.0, 44.0, 33.0, 30.0, 18.0, 15.0, 14.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.24755859375, -0.23947906494140625, -0.2313995361328125, -0.22332000732421875, -0.215240478515625, -0.20716094970703125, -0.1990814208984375, -0.19100189208984375, -0.18292236328125, -0.17484283447265625, -0.1667633056640625, -0.15868377685546875, -0.150604248046875, -0.14252471923828125, -0.1344451904296875, -0.12636566162109375, -0.1182861328125, -0.11020660400390625, -0.1021270751953125, -0.09404754638671875, -0.085968017578125, -0.07788848876953125, -0.0698089599609375, -0.06172943115234375, -0.05364990234375, -0.04557037353515625, -0.0374908447265625, -0.02941131591796875, -0.021331787109375, -0.01325225830078125, -0.0051727294921875, 0.00290679931640625, 0.010986328125, 0.01906585693359375, 0.0271453857421875, 0.03522491455078125, 0.043304443359375, 0.05138397216796875, 0.0594635009765625, 0.06754302978515625, 0.07562255859375, 0.08370208740234375, 0.0917816162109375, 0.09986114501953125, 0.107940673828125, 0.11602020263671875, 0.1240997314453125, 0.13217926025390625, 0.1402587890625, 0.14833831787109375, 0.1564178466796875, 0.16449737548828125, 0.172576904296875, 0.18065643310546875, 0.1887359619140625, 0.19681549072265625, 0.20489501953125, 0.21297454833984375, 0.2210540771484375, 0.22913360595703125, 0.237213134765625, 0.24529266357421875, 0.2533721923828125, 0.26145172119140625, 0.26953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 1.0, 4.0, 10.0, 13.0, 7.0, 8.0, 16.0, 19.0, 24.0, 21.0, 26.0, 29.0, 41.0, 29.0, 52.0, 50.0, 59.0, 49.0, 56.0, 53.0, 46.0, 35.0, 48.0, 41.0, 37.0, 40.0, 39.0, 15.0, 29.0, 21.0, 13.0, 11.0, 11.0, 13.0, 5.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06689453125, -0.06449222564697266, -0.06208992004394531, -0.05968761444091797, -0.057285308837890625, -0.05488300323486328, -0.05248069763183594, -0.050078392028808594, -0.04767608642578125, -0.045273780822753906, -0.04287147521972656, -0.04046916961669922, -0.038066864013671875, -0.03566455841064453, -0.03326225280761719, -0.030859947204589844, -0.0284576416015625, -0.026055335998535156, -0.023653030395507812, -0.02125072479248047, -0.018848419189453125, -0.01644611358642578, -0.014043807983398438, -0.011641502380371094, -0.00923919677734375, -0.006836891174316406, -0.0044345855712890625, -0.0020322799682617188, 0.000370025634765625, 0.0027723312377929688, 0.0051746368408203125, 0.007576942443847656, 0.009979248046875, 0.012381553649902344, 0.014783859252929688, 0.01718616485595703, 0.019588470458984375, 0.02199077606201172, 0.024393081665039062, 0.026795387268066406, 0.02919769287109375, 0.031599998474121094, 0.03400230407714844, 0.03640460968017578, 0.038806915283203125, 0.04120922088623047, 0.04361152648925781, 0.046013832092285156, 0.0484161376953125, 0.050818443298339844, 0.05322074890136719, 0.05562305450439453, 0.058025360107421875, 0.06042766571044922, 0.06282997131347656, 0.0652322769165039, 0.06763458251953125, 0.0700368881225586, 0.07243919372558594, 0.07484149932861328, 0.07724380493164062, 0.07964611053466797, 0.08204841613769531, 0.08445072174072266, 0.08685302734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 9.0, 10.0, 18.0, 30.0, 33.0, 61.0, 77.0, 114.0, 157.0, 241.0, 387.0, 667.0, 1085.0, 2051.0, 4188.0, 10835.0, 42503.0, 293717.0, 577867.0, 84894.0, 17471.0, 5859.0, 2651.0, 1446.0, 779.0, 467.0, 276.0, 183.0, 134.0, 92.0, 83.0, 50.0, 33.0, 24.0, 11.0, 8.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.348388671875, -0.336456298828125, -0.32452392578125, -0.312591552734375, -0.3006591796875, -0.288726806640625, -0.27679443359375, -0.264862060546875, -0.2529296875, -0.240997314453125, -0.22906494140625, -0.217132568359375, -0.2052001953125, -0.193267822265625, -0.18133544921875, -0.169403076171875, -0.157470703125, -0.145538330078125, -0.13360595703125, -0.121673583984375, -0.1097412109375, -0.097808837890625, -0.08587646484375, -0.073944091796875, -0.06201171875, -0.050079345703125, -0.03814697265625, -0.026214599609375, -0.0142822265625, -0.002349853515625, 0.00958251953125, 0.021514892578125, 0.033447265625, 0.045379638671875, 0.05731201171875, 0.069244384765625, 0.0811767578125, 0.093109130859375, 0.10504150390625, 0.116973876953125, 0.12890625, 0.140838623046875, 0.15277099609375, 0.164703369140625, 0.1766357421875, 0.188568115234375, 0.20050048828125, 0.212432861328125, 0.224365234375, 0.236297607421875, 0.24822998046875, 0.260162353515625, 0.2720947265625, 0.284027099609375, 0.29595947265625, 0.307891845703125, 0.31982421875, 0.331756591796875, 0.34368896484375, 0.355621337890625, 0.3675537109375, 0.379486083984375, 0.39141845703125, 0.403350830078125, 0.415283203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 1.0, 8.0, 11.0, 10.0, 11.0, 18.0, 22.0, 14.0, 33.0, 36.0, 36.0, 41.0, 49.0, 43.0, 43.0, 45.0, 46.0, 58.0, 56.0, 44.0, 49.0, 52.0, 49.0, 26.0, 39.0, 36.0, 23.0, 22.0, 12.0, 14.0, 8.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40478515625, -0.3912239074707031, -0.37766265869140625, -0.3641014099121094, -0.3505401611328125, -0.3369789123535156, -0.32341766357421875, -0.3098564147949219, -0.296295166015625, -0.2827339172363281, -0.26917266845703125, -0.2556114196777344, -0.2420501708984375, -0.22848892211914062, -0.21492767333984375, -0.20136642456054688, -0.18780517578125, -0.17424392700195312, -0.16068267822265625, -0.14712142944335938, -0.1335601806640625, -0.11999893188476562, -0.10643768310546875, -0.09287643432617188, -0.079315185546875, -0.06575393676757812, -0.05219268798828125, -0.038631439208984375, -0.0250701904296875, -0.011508941650390625, 0.00205230712890625, 0.015613555908203125, 0.0291748046875, 0.042736053466796875, 0.05629730224609375, 0.06985855102539062, 0.0834197998046875, 0.09698104858398438, 0.11054229736328125, 0.12410354614257812, 0.137664794921875, 0.15122604370117188, 0.16478729248046875, 0.17834854125976562, 0.1919097900390625, 0.20547103881835938, 0.21903228759765625, 0.23259353637695312, 0.24615478515625, 0.2597160339355469, 0.27327728271484375, 0.2868385314941406, 0.3003997802734375, 0.3139610290527344, 0.32752227783203125, 0.3410835266113281, 0.354644775390625, 0.3682060241699219, 0.38176727294921875, 0.3953285217285156, 0.4088897705078125, 0.4224510192871094, 0.43601226806640625, 0.4495735168457031, 0.463134765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 11.0, 22.0, 23.0, 35.0, 51.0, 79.0, 111.0, 188.0, 320.0, 589.0, 1358.0, 3203.0, 11584.0, 122810.0, 836472.0, 58445.0, 8056.0, 2714.0, 1123.0, 533.0, 319.0, 152.0, 92.0, 81.0, 41.0, 26.0, 18.0, 18.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3408203125, -0.3302955627441406, -0.31977081298828125, -0.3092460632324219, -0.2987213134765625, -0.2881965637207031, -0.27767181396484375, -0.2671470642089844, -0.256622314453125, -0.24609756469726562, -0.23557281494140625, -0.22504806518554688, -0.2145233154296875, -0.20399856567382812, -0.19347381591796875, -0.18294906616210938, -0.17242431640625, -0.16189956665039062, -0.15137481689453125, -0.14085006713867188, -0.1303253173828125, -0.11980056762695312, -0.10927581787109375, -0.09875106811523438, -0.088226318359375, -0.07770156860351562, -0.06717681884765625, -0.056652069091796875, -0.0461273193359375, -0.035602569580078125, -0.02507781982421875, -0.014553070068359375, -0.0040283203125, 0.006496429443359375, 0.01702117919921875, 0.027545928955078125, 0.0380706787109375, 0.048595428466796875, 0.05912017822265625, 0.06964492797851562, 0.080169677734375, 0.09069442749023438, 0.10121917724609375, 0.11174392700195312, 0.1222686767578125, 0.13279342651367188, 0.14331817626953125, 0.15384292602539062, 0.16436767578125, 0.17489242553710938, 0.18541717529296875, 0.19594192504882812, 0.2064666748046875, 0.21699142456054688, 0.22751617431640625, 0.23804092407226562, 0.248565673828125, 0.2590904235839844, 0.26961517333984375, 0.2801399230957031, 0.2906646728515625, 0.3011894226074219, 0.31171417236328125, 0.3222389221191406, 0.332763671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 21.0, 46.0, 73.0, 135.0, 167.0, 187.0, 135.0, 102.0, 59.0, 28.0, 24.0, 15.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012093782424926758, -0.00011814013123512268, -0.00011534243822097778, -0.00011254474520683289, -0.00010974705219268799, -0.00010694935917854309, -0.0001041516661643982, -0.0001013539731502533, -9.85562801361084e-05, -9.57585871219635e-05, -9.29608941078186e-05, -9.01632010936737e-05, -8.736550807952881e-05, -8.456781506538391e-05, -8.177012205123901e-05, -7.897242903709412e-05, -7.617473602294922e-05, -7.337704300880432e-05, -7.057934999465942e-05, -6.778165698051453e-05, -6.498396396636963e-05, -6.218627095222473e-05, -5.9388577938079834e-05, -5.6590884923934937e-05, -5.379319190979004e-05, -5.099549889564514e-05, -4.8197805881500244e-05, -4.540011286735535e-05, -4.260241985321045e-05, -3.980472683906555e-05, -3.7007033824920654e-05, -3.420934081077576e-05, -3.141164779663086e-05, -2.8613954782485962e-05, -2.5816261768341064e-05, -2.3018568754196167e-05, -2.022087574005127e-05, -1.7423182725906372e-05, -1.4625489711761475e-05, -1.1827796697616577e-05, -9.03010368347168e-06, -6.232410669326782e-06, -3.4347176551818848e-06, -6.370246410369873e-07, 2.16066837310791e-06, 4.958361387252808e-06, 7.756054401397705e-06, 1.0553747415542603e-05, 1.33514404296875e-05, 1.6149133443832397e-05, 1.8946826457977295e-05, 2.1744519472122192e-05, 2.454221248626709e-05, 2.7339905500411987e-05, 3.0137598514556885e-05, 3.293529152870178e-05, 3.573298454284668e-05, 3.853067755699158e-05, 4.1328370571136475e-05, 4.412606358528137e-05, 4.692375659942627e-05, 4.972144961357117e-05, 5.2519142627716064e-05, 5.531683564186096e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 15.0, 11.0, 27.0, 26.0, 45.0, 71.0, 108.0, 178.0, 407.0, 860.0, 2465.0, 10992.0, 242324.0, 764658.0, 20549.0, 3617.0, 1136.0, 489.0, 223.0, 140.0, 72.0, 47.0, 26.0, 24.0, 7.0, 12.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.387451171875, -0.3726387023925781, -0.35782623291015625, -0.3430137634277344, -0.3282012939453125, -0.3133888244628906, -0.29857635498046875, -0.2837638854980469, -0.268951416015625, -0.2541389465332031, -0.23932647705078125, -0.22451400756835938, -0.2097015380859375, -0.19488906860351562, -0.18007659912109375, -0.16526412963867188, -0.15045166015625, -0.13563919067382812, -0.12082672119140625, -0.10601425170898438, -0.0912017822265625, -0.07638931274414062, -0.06157684326171875, -0.046764373779296875, -0.031951904296875, -0.017139434814453125, -0.00232696533203125, 0.012485504150390625, 0.0272979736328125, 0.042110443115234375, 0.05692291259765625, 0.07173538208007812, 0.0865478515625, 0.10136032104492188, 0.11617279052734375, 0.13098526000976562, 0.1457977294921875, 0.16061019897460938, 0.17542266845703125, 0.19023513793945312, 0.205047607421875, 0.21986007690429688, 0.23467254638671875, 0.24948501586914062, 0.2642974853515625, 0.2791099548339844, 0.29392242431640625, 0.3087348937988281, 0.32354736328125, 0.3383598327636719, 0.35317230224609375, 0.3679847717285156, 0.3827972412109375, 0.3976097106933594, 0.41242218017578125, 0.4272346496582031, 0.442047119140625, 0.4568595886230469, 0.47167205810546875, 0.4864845275878906, 0.5012969970703125, 0.5161094665527344, 0.5309219360351562, 0.5457344055175781, 0.560546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 14.0, 23.0, 46.0, 84.0, 149.0, 171.0, 201.0, 129.0, 69.0, 30.0, 17.0, 12.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2186279296875, -0.2075939178466797, -0.19655990600585938, -0.18552589416503906, -0.17449188232421875, -0.16345787048339844, -0.15242385864257812, -0.1413898468017578, -0.1303558349609375, -0.11932182312011719, -0.10828781127929688, -0.09725379943847656, -0.08621978759765625, -0.07518577575683594, -0.06415176391601562, -0.05311775207519531, -0.042083740234375, -0.031049728393554688, -0.020015716552734375, -0.008981704711914062, 0.00205230712890625, 0.013086318969726562, 0.024120330810546875, 0.03515434265136719, 0.0461883544921875, 0.05722236633300781, 0.06825637817382812, 0.07929039001464844, 0.09032440185546875, 0.10135841369628906, 0.11239242553710938, 0.12342643737792969, 0.13446044921875, 0.1454944610595703, 0.15652847290039062, 0.16756248474121094, 0.17859649658203125, 0.18963050842285156, 0.20066452026367188, 0.2116985321044922, 0.2227325439453125, 0.2337665557861328, 0.24480056762695312, 0.25583457946777344, 0.26686859130859375, 0.27790260314941406, 0.2889366149902344, 0.2999706268310547, 0.311004638671875, 0.3220386505126953, 0.3330726623535156, 0.34410667419433594, 0.35514068603515625, 0.36617469787597656, 0.3772087097167969, 0.3882427215576172, 0.3992767333984375, 0.4103107452392578, 0.4213447570800781, 0.43237876892089844, 0.44341278076171875, 0.45444679260253906, 0.4654808044433594, 0.4765148162841797, 0.487548828125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 7.0, 20.0, 32.0, 62.0, 104.0, 171.0, 180.0, 150.0, 116.0, 49.0, 51.0, 21.0, 17.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.660822868347168, -6.519661903381348, -6.3785014152526855, -6.237340927124023, -6.096179962158203, -5.955018997192383, -5.813858509063721, -5.672698020935059, -5.531537055969238, -5.390376091003418, -5.249215602874756, -5.108055114746094, -4.966894149780273, -4.825733184814453, -4.684572696685791, -4.543412208557129, -4.402251243591309, -4.261090278625488, -4.119929790496826, -3.978769063949585, -3.8376083374023438, -3.6964476108551025, -3.5552868843078613, -3.41412615776062, -3.272965431213379, -3.1318047046661377, -2.9906439781188965, -2.8494832515716553, -2.708322525024414, -2.567161798477173, -2.4260010719299316, -2.2848403453826904, -2.143679141998291, -2.00251841545105, -1.8613576889038086, -1.7201969623565674, -1.5790362358093262, -1.437875509262085, -1.2967147827148438, -1.1555540561676025, -1.0143933296203613, -0.8732326030731201, -0.7320718765258789, -0.5909111499786377, -0.4497504234313965, -0.3085896968841553, -0.16742897033691406, -0.02626824378967285, 0.11489248275756836, 0.25605320930480957, 0.3972139358520508, 0.538374662399292, 0.6795353889465332, 0.8206961154937744, 0.9618568420410156, 1.1030175685882568, 1.244178295135498, 1.3853390216827393, 1.5264997482299805, 1.6676604747772217, 1.808821201324463, 1.949981927871704, 2.0911426544189453, 2.2323033809661865, 2.3734641075134277]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 18.0, 8.0, 17.0, 19.0, 33.0, 47.0, 35.0, 31.0, 40.0, 52.0, 58.0, 54.0, 58.0, 64.0, 55.0, 48.0, 51.0, 42.0, 32.0, 30.0, 30.0, 29.0, 18.0, 18.0, 25.0, 10.0, 9.0, 4.0, 5.0, 4.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7773356437683105, -2.6994147300720215, -2.6214938163757324, -2.5435729026794434, -2.4656519889831543, -2.3877310752868652, -2.309810161590576, -2.231889247894287, -2.153968334197998, -2.076047420501709, -1.99812650680542, -1.9202055931091309, -1.8422846794128418, -1.7643637657165527, -1.6864429712295532, -1.6085220575332642, -1.5306012630462646, -1.4526803493499756, -1.3747594356536865, -1.2968385219573975, -1.2189176082611084, -1.1409966945648193, -1.0630759000778198, -0.9851549863815308, -0.9072340726852417, -0.8293131589889526, -0.7513922452926636, -0.6734713912010193, -0.5955504775047302, -0.5176295638084412, -0.4397086799144745, -0.3617877960205078, -0.28386712074279785, -0.20594622194766998, -0.12802532315254211, -0.050104424357414246, 0.027816474437713623, 0.10573738813400269, 0.18365827202796936, 0.26157915592193604, 0.3395000696182251, 0.41742098331451416, 0.49534186720848083, 0.5732627511024475, 0.6511836647987366, 0.7291045784950256, 0.8070254325866699, 0.884946346282959, 0.962867259979248, 1.040788173675537, 1.1187090873718262, 1.1966300010681152, 1.2745509147644043, 1.3524718284606934, 1.4303926229476929, 1.508313536643982, 1.586234450340271, 1.66415536403656, 1.7420762777328491, 1.8199971914291382, 1.8979179859161377, 1.9758388996124268, 2.053759813308716, 2.131680727005005, 2.209601640701294]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 4.0, 12.0, 14.0, 27.0, 30.0, 39.0, 51.0, 85.0, 146.0, 232.0, 564.0, 1616.0, 7209.0, 156395.0, 4014860.0, 9607.0, 2000.0, 636.0, 274.0, 157.0, 101.0, 47.0, 40.0, 36.0, 25.0, 13.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7444839477539062, -0.7179718017578125, -0.6914596557617188, -0.664947509765625, -0.6384353637695312, -0.6119232177734375, -0.5854110717773438, -0.55889892578125, -0.5323867797851562, -0.5058746337890625, -0.47936248779296875, -0.452850341796875, -0.42633819580078125, -0.3998260498046875, -0.37331390380859375, -0.3468017578125, -0.32028961181640625, -0.2937774658203125, -0.26726531982421875, -0.240753173828125, -0.21424102783203125, -0.1877288818359375, -0.16121673583984375, -0.13470458984375, -0.10819244384765625, -0.0816802978515625, -0.05516815185546875, -0.028656005859375, -0.00214385986328125, 0.0243682861328125, 0.05088043212890625, 0.077392578125, 0.10390472412109375, 0.1304168701171875, 0.15692901611328125, 0.183441162109375, 0.20995330810546875, 0.2364654541015625, 0.26297760009765625, 0.28948974609375, 0.31600189208984375, 0.3425140380859375, 0.36902618408203125, 0.395538330078125, 0.42205047607421875, 0.4485626220703125, 0.47507476806640625, 0.5015869140625, 0.5280990600585938, 0.5546112060546875, 0.5811233520507812, 0.607635498046875, 0.6341476440429688, 0.6606597900390625, 0.6871719360351562, 0.71368408203125, 0.7401962280273438, 0.7667083740234375, 0.7932205200195312, 0.819732666015625, 0.8462448120117188, 0.8727569580078125, 0.8992691040039062, 0.92578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 0.0, 10.0, 14.0, 10.0, 31.0, 31.0, 57.0, 61.0, 56.0, 77.0, 77.0, 88.0, 68.0, 76.0, 72.0, 56.0, 47.0, 53.0, 33.0, 25.0, 15.0, 8.0, 7.0, 9.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.10405254364013672, -0.10001182556152344, -0.09597110748291016, -0.09193038940429688, -0.0878896713256836, -0.08384895324707031, -0.07980823516845703, -0.07576751708984375, -0.07172679901123047, -0.06768608093261719, -0.0636453628540039, -0.059604644775390625, -0.055563926696777344, -0.05152320861816406, -0.04748249053955078, -0.0434417724609375, -0.03940105438232422, -0.03536033630371094, -0.031319618225097656, -0.027278900146484375, -0.023238182067871094, -0.019197463989257812, -0.015156745910644531, -0.01111602783203125, -0.007075309753417969, -0.0030345916748046875, 0.0010061264038085938, 0.005046844482421875, 0.009087562561035156, 0.013128280639648438, 0.01716899871826172, 0.021209716796875, 0.02525043487548828, 0.029291152954101562, 0.033331871032714844, 0.037372589111328125, 0.041413307189941406, 0.04545402526855469, 0.04949474334716797, 0.05353546142578125, 0.05757617950439453, 0.06161689758300781, 0.0656576156616211, 0.06969833374023438, 0.07373905181884766, 0.07777976989746094, 0.08182048797607422, 0.0858612060546875, 0.08990192413330078, 0.09394264221191406, 0.09798336029052734, 0.10202407836914062, 0.1060647964477539, 0.11010551452636719, 0.11414623260498047, 0.11818695068359375, 0.12222766876220703, 0.1262683868408203, 0.1303091049194336, 0.13434982299804688, 0.13839054107666016, 0.14243125915527344, 0.14647197723388672, 0.1505126953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 10.0, 5.0, 12.0, 9.0, 18.0, 17.0, 21.0, 33.0, 41.0, 49.0, 57.0, 69.0, 109.0, 222.0, 658.0, 3168.0, 57981.0, 4121619.0, 8057.0, 1211.0, 366.0, 149.0, 96.0, 57.0, 40.0, 35.0, 33.0, 22.0, 23.0, 18.0, 14.0, 13.0, 5.0, 8.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.811676025390625, -1.75714111328125, -1.702606201171875, -1.6480712890625, -1.593536376953125, -1.53900146484375, -1.484466552734375, -1.429931640625, -1.375396728515625, -1.32086181640625, -1.266326904296875, -1.2117919921875, -1.157257080078125, -1.10272216796875, -1.048187255859375, -0.99365234375, -0.939117431640625, -0.88458251953125, -0.830047607421875, -0.7755126953125, -0.720977783203125, -0.66644287109375, -0.611907958984375, -0.557373046875, -0.502838134765625, -0.44830322265625, -0.393768310546875, -0.3392333984375, -0.284698486328125, -0.23016357421875, -0.175628662109375, -0.12109375, -0.066558837890625, -0.01202392578125, 0.042510986328125, 0.0970458984375, 0.151580810546875, 0.20611572265625, 0.260650634765625, 0.315185546875, 0.369720458984375, 0.42425537109375, 0.478790283203125, 0.5333251953125, 0.587860107421875, 0.64239501953125, 0.696929931640625, 0.75146484375, 0.805999755859375, 0.86053466796875, 0.915069580078125, 0.9696044921875, 1.024139404296875, 1.07867431640625, 1.133209228515625, 1.187744140625, 1.242279052734375, 1.29681396484375, 1.351348876953125, 1.4058837890625, 1.460418701171875, 1.51495361328125, 1.569488525390625, 1.6240234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 14.0, 29.0, 119.0, 3786.0, 94.0, 20.0, 9.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.17484474182128906, -0.16279983520507812, -0.1507549285888672, -0.13871002197265625, -0.1266651153564453, -0.11462020874023438, -0.10257530212402344, -0.0905303955078125, -0.07848548889160156, -0.06644058227539062, -0.05439567565917969, -0.04235076904296875, -0.030305862426757812, -0.018260955810546875, -0.0062160491943359375, 0.005828857421875, 0.017873764038085938, 0.029918670654296875, 0.04196357727050781, 0.05400848388671875, 0.06605339050292969, 0.07809829711914062, 0.09014320373535156, 0.1021881103515625, 0.11423301696777344, 0.12627792358398438, 0.1383228302001953, 0.15036773681640625, 0.1624126434326172, 0.17445755004882812, 0.18650245666503906, 0.19854736328125, 0.21059226989746094, 0.22263717651367188, 0.2346820831298828, 0.24672698974609375, 0.2587718963623047, 0.2708168029785156, 0.28286170959472656, 0.2949066162109375, 0.30695152282714844, 0.3189964294433594, 0.3310413360595703, 0.34308624267578125, 0.3551311492919922, 0.3671760559082031, 0.37922096252441406, 0.391265869140625, 0.40331077575683594, 0.4153556823730469, 0.4274005889892578, 0.43944549560546875, 0.4514904022216797, 0.4635353088378906, 0.47558021545410156, 0.4876251220703125, 0.49967002868652344, 0.5117149353027344, 0.5237598419189453, 0.5358047485351562, 0.5478496551513672, 0.5598945617675781, 0.5719394683837891, 0.583984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 11.0, 11.0, 8.0, 11.0, 11.0, 17.0, 40.0, 43.0, 65.0, 98.0, 98.0, 124.0, 108.0, 105.0, 58.0, 51.0, 48.0, 20.0, 27.0, 13.0, 10.0, 2.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6872037649154663, -0.6650705933570862, -0.6429374814033508, -0.6208043098449707, -0.5986711978912354, -0.5765380263328552, -0.5544048547744751, -0.5322717428207397, -0.5101385712623596, -0.4880054295063019, -0.46587228775024414, -0.443739116191864, -0.4216059744358063, -0.39947283267974854, -0.3773396909236908, -0.35520654916763306, -0.3330734074115753, -0.3109402656555176, -0.28880712389945984, -0.2666739821434021, -0.24454081058502197, -0.22240766882896423, -0.2002745270729065, -0.17814137041568756, -0.15600822865962982, -0.13387508690357208, -0.11174193024635315, -0.08960878849029541, -0.06747563928365707, -0.04534249007701874, -0.023209348320961, -0.0010761916637420654, 0.021056950092315674, 0.04319009929895401, 0.06532324850559235, 0.08745639026165009, 0.10958953946828842, 0.13172268867492676, 0.1538558304309845, 0.17598898708820343, 0.19812212884426117, 0.2202552706003189, 0.24238842725753784, 0.2645215690135956, 0.2866547107696533, 0.30878788232803345, 0.3309209942817688, 0.3530541658401489, 0.37518730759620667, 0.3973204493522644, 0.41945359110832214, 0.4415867328643799, 0.46371990442276, 0.48585304617881775, 0.5079861879348755, 0.5301193594932556, 0.552252471446991, 0.5743856430053711, 0.5965187549591064, 0.6186519265174866, 0.6407850384712219, 0.662918210029602, 0.6850513219833374, 0.7071844935417175, 0.7293176651000977]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 7.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 22.0, 26.0, 31.0, 30.0, 24.0, 33.0, 40.0, 30.0, 35.0, 42.0, 41.0, 48.0, 31.0, 34.0, 42.0, 37.0, 39.0, 33.0, 22.0, 32.0, 30.0, 23.0, 26.0, 17.0, 16.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 9.0, 3.0, 7.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3262641429901123, -0.3152258098125458, -0.30418750643730164, -0.2931491732597351, -0.28211086988449097, -0.27107253670692444, -0.2600342035293579, -0.24899590015411377, -0.23795756697654724, -0.2269192487001419, -0.21588093042373657, -0.20484259724617004, -0.1938042789697647, -0.18276596069335938, -0.17172764241695404, -0.1606893241405487, -0.14965100586414337, -0.13861268758773804, -0.1275743693113327, -0.11653604358434677, -0.10549771785736084, -0.0944593995809555, -0.08342108130455017, -0.07238275557756424, -0.061344437301158905, -0.05030611529946327, -0.03926779329776764, -0.028229475021362305, -0.017191153019666672, -0.006152831017971039, 0.004885487258434296, 0.015923812985420227, 0.02696213126182556, 0.038000453263521194, 0.04903877526521683, 0.06007709354162216, 0.0711154192686081, 0.08215373754501343, 0.09319205582141876, 0.1042303815484047, 0.11526869982481003, 0.12630702555179596, 0.1373453438282013, 0.14838366210460663, 0.15942198038101196, 0.1704603135585785, 0.18149861693382263, 0.19253695011138916, 0.2035752683877945, 0.21461358666419983, 0.22565190494060516, 0.2366902232170105, 0.24772855639457703, 0.25876688957214355, 0.2698051929473877, 0.2808435261249542, 0.29188182950019836, 0.3029201626777649, 0.31395846605300903, 0.32499679923057556, 0.3360351026058197, 0.34707343578338623, 0.35811173915863037, 0.3691500723361969, 0.3801884055137634]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 17.0, 24.0, 37.0, 49.0, 99.0, 152.0, 220.0, 387.0, 619.0, 1067.0, 1700.0, 2976.0, 5454.0, 10506.0, 22134.0, 49002.0, 117040.0, 264234.0, 306284.0, 149049.0, 62241.0, 27102.0, 12999.0, 6513.0, 3542.0, 1986.0, 1156.0, 741.0, 423.0, 297.0, 172.0, 105.0, 88.0, 29.0, 28.0, 16.0, 16.0, 6.0, 0.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.224365234375, -0.2181568145751953, -0.21194839477539062, -0.20573997497558594, -0.19953155517578125, -0.19332313537597656, -0.18711471557617188, -0.1809062957763672, -0.1746978759765625, -0.1684894561767578, -0.16228103637695312, -0.15607261657714844, -0.14986419677734375, -0.14365577697753906, -0.13744735717773438, -0.1312389373779297, -0.125030517578125, -0.11882209777832031, -0.11261367797851562, -0.10640525817871094, -0.10019683837890625, -0.09398841857910156, -0.08777999877929688, -0.08157157897949219, -0.0753631591796875, -0.06915473937988281, -0.06294631958007812, -0.05673789978027344, -0.05052947998046875, -0.04432106018066406, -0.038112640380859375, -0.03190422058105469, -0.02569580078125, -0.019487380981445312, -0.013278961181640625, -0.0070705413818359375, -0.00086212158203125, 0.0053462982177734375, 0.011554718017578125, 0.017763137817382812, 0.0239715576171875, 0.030179977416992188, 0.036388397216796875, 0.04259681701660156, 0.04880523681640625, 0.05501365661621094, 0.061222076416015625, 0.06743049621582031, 0.073638916015625, 0.07984733581542969, 0.08605575561523438, 0.09226417541503906, 0.09847259521484375, 0.10468101501464844, 0.11088943481445312, 0.11709785461425781, 0.1233062744140625, 0.1295146942138672, 0.13572311401367188, 0.14193153381347656, 0.14813995361328125, 0.15434837341308594, 0.16055679321289062, 0.1667652130126953, 0.1729736328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 18.0, 24.0, 20.0, 28.0, 38.0, 32.0, 49.0, 43.0, 48.0, 61.0, 48.0, 57.0, 73.0, 73.0, 63.0, 48.0, 52.0, 25.0, 36.0, 26.0, 25.0, 14.0, 14.0, 12.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1474609375, -0.14361858367919922, -0.13977622985839844, -0.13593387603759766, -0.13209152221679688, -0.1282491683959961, -0.12440681457519531, -0.12056446075439453, -0.11672210693359375, -0.11287975311279297, -0.10903739929199219, -0.1051950454711914, -0.10135269165039062, -0.09751033782958984, -0.09366798400878906, -0.08982563018798828, -0.0859832763671875, -0.08214092254638672, -0.07829856872558594, -0.07445621490478516, -0.07061386108398438, -0.0667715072631836, -0.06292915344238281, -0.05908679962158203, -0.05524444580078125, -0.05140209197998047, -0.04755973815917969, -0.043717384338378906, -0.039875030517578125, -0.036032676696777344, -0.03219032287597656, -0.02834796905517578, -0.024505615234375, -0.02066326141357422, -0.016820907592773438, -0.012978553771972656, -0.009136199951171875, -0.005293846130371094, -0.0014514923095703125, 0.0023908615112304688, 0.00623321533203125, 0.010075569152832031, 0.013917922973632812, 0.017760276794433594, 0.021602630615234375, 0.025444984436035156, 0.029287338256835938, 0.03312969207763672, 0.0369720458984375, 0.04081439971923828, 0.04465675354003906, 0.048499107360839844, 0.052341461181640625, 0.056183815002441406, 0.06002616882324219, 0.06386852264404297, 0.06771087646484375, 0.07155323028564453, 0.07539558410644531, 0.0792379379272461, 0.08308029174804688, 0.08692264556884766, 0.09076499938964844, 0.09460735321044922, 0.09844970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 14.0, 22.0, 36.0, 48.0, 81.0, 147.0, 185.0, 294.0, 541.0, 1037.0, 2499.0, 7853.0, 40465.0, 405540.0, 524198.0, 50763.0, 9367.0, 2862.0, 1103.0, 564.0, 320.0, 184.0, 126.0, 76.0, 61.0, 36.0, 31.0, 22.0, 15.0, 7.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.568359375, -0.5525970458984375, -0.536834716796875, -0.5210723876953125, -0.50531005859375, -0.4895477294921875, -0.473785400390625, -0.4580230712890625, -0.4422607421875, -0.4264984130859375, -0.410736083984375, -0.3949737548828125, -0.37921142578125, -0.3634490966796875, -0.347686767578125, -0.3319244384765625, -0.316162109375, -0.3003997802734375, -0.284637451171875, -0.2688751220703125, -0.25311279296875, -0.2373504638671875, -0.221588134765625, -0.2058258056640625, -0.1900634765625, -0.1743011474609375, -0.158538818359375, -0.1427764892578125, -0.12701416015625, -0.1112518310546875, -0.095489501953125, -0.0797271728515625, -0.06396484375, -0.0482025146484375, -0.032440185546875, -0.0166778564453125, -0.00091552734375, 0.0148468017578125, 0.030609130859375, 0.0463714599609375, 0.0621337890625, 0.0778961181640625, 0.093658447265625, 0.1094207763671875, 0.12518310546875, 0.1409454345703125, 0.156707763671875, 0.1724700927734375, 0.188232421875, 0.2039947509765625, 0.219757080078125, 0.2355194091796875, 0.25128173828125, 0.2670440673828125, 0.282806396484375, 0.2985687255859375, 0.3143310546875, 0.3300933837890625, 0.345855712890625, 0.3616180419921875, 0.37738037109375, 0.3931427001953125, 0.408905029296875, 0.4246673583984375, 0.4404296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 18.0, 8.0, 15.0, 25.0, 27.0, 33.0, 27.0, 32.0, 44.0, 34.0, 38.0, 45.0, 46.0, 53.0, 45.0, 54.0, 47.0, 38.0, 44.0, 38.0, 36.0, 38.0, 32.0, 21.0, 22.0, 20.0, 14.0, 18.0, 18.0, 7.0, 15.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5185546875, -0.5017929077148438, -0.4850311279296875, -0.46826934814453125, -0.451507568359375, -0.43474578857421875, -0.4179840087890625, -0.40122222900390625, -0.38446044921875, -0.36769866943359375, -0.3509368896484375, -0.33417510986328125, -0.317413330078125, -0.30065155029296875, -0.2838897705078125, -0.26712799072265625, -0.2503662109375, -0.23360443115234375, -0.2168426513671875, -0.20008087158203125, -0.183319091796875, -0.16655731201171875, -0.1497955322265625, -0.13303375244140625, -0.11627197265625, -0.09951019287109375, -0.0827484130859375, -0.06598663330078125, -0.049224853515625, -0.03246307373046875, -0.0157012939453125, 0.00106048583984375, 0.017822265625, 0.03458404541015625, 0.0513458251953125, 0.06810760498046875, 0.084869384765625, 0.10163116455078125, 0.1183929443359375, 0.13515472412109375, 0.15191650390625, 0.16867828369140625, 0.1854400634765625, 0.20220184326171875, 0.218963623046875, 0.23572540283203125, 0.2524871826171875, 0.26924896240234375, 0.2860107421875, 0.30277252197265625, 0.3195343017578125, 0.33629608154296875, 0.353057861328125, 0.36981964111328125, 0.3865814208984375, 0.40334320068359375, 0.42010498046875, 0.43686676025390625, 0.4536285400390625, 0.47039031982421875, 0.487152099609375, 0.5039138793945312, 0.5206756591796875, 0.5374374389648438, 0.55419921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 10.0, 14.0, 17.0, 43.0, 55.0, 98.0, 195.0, 330.0, 808.0, 2241.0, 9113.0, 65845.0, 767635.0, 179653.0, 16793.0, 3499.0, 1171.0, 471.0, 231.0, 131.0, 85.0, 40.0, 17.0, 23.0, 10.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345458984375, -0.3348884582519531, -0.32431793212890625, -0.3137474060058594, -0.3031768798828125, -0.2926063537597656, -0.28203582763671875, -0.2714653015136719, -0.260894775390625, -0.2503242492675781, -0.23975372314453125, -0.22918319702148438, -0.2186126708984375, -0.20804214477539062, -0.19747161865234375, -0.18690109252929688, -0.17633056640625, -0.16576004028320312, -0.15518951416015625, -0.14461898803710938, -0.1340484619140625, -0.12347793579101562, -0.11290740966796875, -0.10233688354492188, -0.091766357421875, -0.08119583129882812, -0.07062530517578125, -0.060054779052734375, -0.0494842529296875, -0.038913726806640625, -0.02834320068359375, -0.017772674560546875, -0.0072021484375, 0.003368377685546875, 0.01393890380859375, 0.024509429931640625, 0.0350799560546875, 0.045650482177734375, 0.05622100830078125, 0.06679153442382812, 0.077362060546875, 0.08793258666992188, 0.09850311279296875, 0.10907363891601562, 0.1196441650390625, 0.13021469116210938, 0.14078521728515625, 0.15135574340820312, 0.16192626953125, 0.17249679565429688, 0.18306732177734375, 0.19363784790039062, 0.2042083740234375, 0.21477890014648438, 0.22534942626953125, 0.23591995239257812, 0.246490478515625, 0.2570610046386719, 0.26763153076171875, 0.2782020568847656, 0.2887725830078125, 0.2993431091308594, 0.30991363525390625, 0.3204841613769531, 0.3310546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 6.0, 6.0, 12.0, 9.0, 13.0, 28.0, 34.0, 40.0, 77.0, 66.0, 98.0, 92.0, 84.0, 100.0, 62.0, 66.0, 46.0, 39.0, 30.0, 11.0, 11.0, 18.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.327615559101105e-05, -3.192201256752014e-05, -3.0567869544029236e-05, -2.921372652053833e-05, -2.7859583497047424e-05, -2.650544047355652e-05, -2.5151297450065613e-05, -2.3797154426574707e-05, -2.24430114030838e-05, -2.1088868379592896e-05, -1.973472535610199e-05, -1.8380582332611084e-05, -1.7026439309120178e-05, -1.5672296285629272e-05, -1.4318153262138367e-05, -1.2964010238647461e-05, -1.1609867215156555e-05, -1.025572419166565e-05, -8.901581168174744e-06, -7.547438144683838e-06, -6.193295121192932e-06, -4.839152097702026e-06, -3.4850090742111206e-06, -2.130866050720215e-06, -7.767230272293091e-07, 5.774199962615967e-07, 1.9315630197525024e-06, 3.285706043243408e-06, 4.639849066734314e-06, 5.99399209022522e-06, 7.3481351137161255e-06, 8.702278137207031e-06, 1.0056421160697937e-05, 1.1410564184188843e-05, 1.2764707207679749e-05, 1.4118850231170654e-05, 1.547299325466156e-05, 1.6827136278152466e-05, 1.818127930164337e-05, 1.9535422325134277e-05, 2.0889565348625183e-05, 2.224370837211609e-05, 2.3597851395606995e-05, 2.49519944190979e-05, 2.6306137442588806e-05, 2.7660280466079712e-05, 2.9014423489570618e-05, 3.0368566513061523e-05, 3.172270953655243e-05, 3.3076852560043335e-05, 3.443099558353424e-05, 3.5785138607025146e-05, 3.713928163051605e-05, 3.849342465400696e-05, 3.9847567677497864e-05, 4.120171070098877e-05, 4.2555853724479675e-05, 4.390999674797058e-05, 4.526413977146149e-05, 4.661828279495239e-05, 4.79724258184433e-05, 4.9326568841934204e-05, 5.068071186542511e-05, 5.2034854888916016e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 0.0, 6.0, 10.0, 7.0, 15.0, 22.0, 29.0, 60.0, 102.0, 176.0, 336.0, 736.0, 1810.0, 5548.0, 25670.0, 274539.0, 664772.0, 60126.0, 9707.0, 2792.0, 1018.0, 483.0, 230.0, 127.0, 74.0, 50.0, 36.0, 28.0, 10.0, 12.0, 9.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23136329650878906, -0.22139358520507812, -0.2114238739013672, -0.20145416259765625, -0.1914844512939453, -0.18151473999023438, -0.17154502868652344, -0.1615753173828125, -0.15160560607910156, -0.14163589477539062, -0.1316661834716797, -0.12169647216796875, -0.11172676086425781, -0.10175704956054688, -0.09178733825683594, -0.081817626953125, -0.07184791564941406, -0.061878204345703125, -0.05190849304199219, -0.04193878173828125, -0.03196907043457031, -0.021999359130859375, -0.012029647827148438, -0.0020599365234375, 0.007909774780273438, 0.017879486083984375, 0.027849197387695312, 0.03781890869140625, 0.04778861999511719, 0.057758331298828125, 0.06772804260253906, 0.07769775390625, 0.08766746520996094, 0.09763717651367188, 0.10760688781738281, 0.11757659912109375, 0.1275463104248047, 0.13751602172851562, 0.14748573303222656, 0.1574554443359375, 0.16742515563964844, 0.17739486694335938, 0.1873645782470703, 0.19733428955078125, 0.2073040008544922, 0.21727371215820312, 0.22724342346191406, 0.237213134765625, 0.24718284606933594, 0.2571525573730469, 0.2671222686767578, 0.27709197998046875, 0.2870616912841797, 0.2970314025878906, 0.30700111389160156, 0.3169708251953125, 0.32694053649902344, 0.3369102478027344, 0.3468799591064453, 0.35684967041015625, 0.3668193817138672, 0.3767890930175781, 0.38675880432128906, 0.396728515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 14.0, 22.0, 33.0, 42.0, 65.0, 83.0, 113.0, 112.0, 97.0, 94.0, 91.0, 63.0, 32.0, 28.0, 26.0, 17.0, 14.0, 11.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22362518310546875, -0.2153167724609375, -0.20700836181640625, -0.198699951171875, -0.19039154052734375, -0.1820831298828125, -0.17377471923828125, -0.16546630859375, -0.15715789794921875, -0.1488494873046875, -0.14054107666015625, -0.132232666015625, -0.12392425537109375, -0.1156158447265625, -0.10730743408203125, -0.0989990234375, -0.09069061279296875, -0.0823822021484375, -0.07407379150390625, -0.065765380859375, -0.05745697021484375, -0.0491485595703125, -0.04084014892578125, -0.03253173828125, -0.02422332763671875, -0.0159149169921875, -0.00760650634765625, 0.000701904296875, 0.00901031494140625, 0.0173187255859375, 0.02562713623046875, 0.033935546875, 0.04224395751953125, 0.0505523681640625, 0.05886077880859375, 0.067169189453125, 0.07547760009765625, 0.0837860107421875, 0.09209442138671875, 0.10040283203125, 0.10871124267578125, 0.1170196533203125, 0.12532806396484375, 0.133636474609375, 0.14194488525390625, 0.1502532958984375, 0.15856170654296875, 0.1668701171875, 0.17517852783203125, 0.1834869384765625, 0.19179534912109375, 0.200103759765625, 0.20841217041015625, 0.2167205810546875, 0.22502899169921875, 0.23333740234375, 0.24164581298828125, 0.2499542236328125, 0.25826263427734375, 0.266571044921875, 0.27487945556640625, 0.2831878662109375, 0.29149627685546875, 0.2998046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 18.0, 25.0, 70.0, 96.0, 146.0, 183.0, 171.0, 124.0, 81.0, 38.0, 18.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.785530090332031, -4.6339921951293945, -4.482454776763916, -4.330916881561279, -4.179378986358643, -4.027841567993164, -3.8763036727905273, -3.7247657775878906, -3.573228120803833, -3.4216904640197754, -3.2701525688171387, -3.118614912033081, -2.9670772552490234, -2.8155393600463867, -2.664001703262329, -2.5124640464782715, -2.3609261512756348, -2.209388494491577, -2.0578505992889404, -1.9063129425048828, -1.7547751665115356, -1.6032373905181885, -1.4516997337341309, -1.3001619577407837, -1.1486241817474365, -0.9970864057540894, -0.845548689365387, -0.6940109729766846, -0.5424731969833374, -0.39093542098999023, -0.23939770460128784, -0.08785998821258545, 0.06367778778076172, 0.2152155339717865, 0.3667532801628113, 0.5182909965515137, 0.6698287725448608, 0.821366548538208, 0.9729042649269104, 1.1244419813156128, 1.27597975730896, 1.4275175333023071, 1.5790553092956543, 1.730592966079712, 1.882130742073059, 2.0336685180664062, 2.185206174850464, 2.3367438316345215, 2.488281726837158, 2.639819383621216, 2.7913572788238525, 2.94289493560791, 3.094432830810547, 3.2459704875946045, 3.397508144378662, 3.549046039581299, 3.7005836963653564, 3.852121353149414, 4.003659248352051, 4.1551971435546875, 4.306734561920166, 4.458272457122803, 4.6098103523254395, 4.761347770690918, 4.912885665893555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 9.0, 8.0, 13.0, 13.0, 13.0, 18.0, 15.0, 20.0, 23.0, 25.0, 21.0, 35.0, 53.0, 44.0, 53.0, 54.0, 51.0, 51.0, 51.0, 43.0, 42.0, 42.0, 33.0, 36.0, 37.0, 24.0, 18.0, 23.0, 15.0, 17.0, 11.0, 16.0, 9.0, 11.0, 8.0, 6.0, 4.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.340937376022339, -2.2659387588500977, -2.1909403800964355, -2.1159417629241943, -2.0409433841705322, -1.965944766998291, -1.8909462690353394, -1.8159477710723877, -1.740949273109436, -1.6659507751464844, -1.5909522771835327, -1.515953779220581, -1.4409551620483398, -1.3659567832946777, -1.2909581661224365, -1.2159596681594849, -1.1409611701965332, -1.0659626722335815, -0.9909641742706299, -0.9159656167030334, -0.8409671187400818, -0.7659686207771301, -0.6909700632095337, -0.615971565246582, -0.5409730672836304, -0.4659745693206787, -0.39097604155540466, -0.3159775137901306, -0.24097901582717896, -0.1659805178642273, -0.09098199009895325, -0.0159834623336792, 0.05901527404785156, 0.13401378691196442, 0.20901229977607727, 0.2840108275413513, 0.359009325504303, 0.43400782346725464, 0.5090063810348511, 0.5840048789978027, 0.6590033769607544, 0.734001874923706, 0.8090003728866577, 0.8839989304542542, 0.9589974284172058, 1.0339958667755127, 1.108994483947754, 1.1839929819107056, 1.2589914798736572, 1.3339899778366089, 1.4089884757995605, 1.4839869737625122, 1.5589854717254639, 1.633984088897705, 1.7089825868606567, 1.7839810848236084, 1.85897958278656, 1.9339780807495117, 2.008976697921753, 2.083975076675415, 2.1589736938476562, 2.2339720726013184, 2.3089706897735596, 2.383969306945801, 2.458967685699463]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 20.0, 25.0, 34.0, 30.0, 57.0, 63.0, 89.0, 142.0, 222.0, 280.0, 407.0, 707.0, 1224.0, 2449.0, 6496.0, 33467.0, 4114581.0, 23304.0, 5353.0, 2220.0, 1155.0, 606.0, 419.0, 256.0, 168.0, 132.0, 85.0, 81.0, 58.0, 44.0, 23.0, 26.0, 19.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5263671875, -0.5101318359375, -0.493896484375, -0.4776611328125, -0.46142578125, -0.4451904296875, -0.428955078125, -0.4127197265625, -0.396484375, -0.3802490234375, -0.364013671875, -0.3477783203125, -0.33154296875, -0.3153076171875, -0.299072265625, -0.2828369140625, -0.2666015625, -0.2503662109375, -0.234130859375, -0.2178955078125, -0.20166015625, -0.1854248046875, -0.169189453125, -0.1529541015625, -0.13671875, -0.1204833984375, -0.104248046875, -0.0880126953125, -0.07177734375, -0.0555419921875, -0.039306640625, -0.0230712890625, -0.0068359375, 0.0093994140625, 0.025634765625, 0.0418701171875, 0.05810546875, 0.0743408203125, 0.090576171875, 0.1068115234375, 0.123046875, 0.1392822265625, 0.155517578125, 0.1717529296875, 0.18798828125, 0.2042236328125, 0.220458984375, 0.2366943359375, 0.2529296875, 0.2691650390625, 0.285400390625, 0.3016357421875, 0.31787109375, 0.3341064453125, 0.350341796875, 0.3665771484375, 0.3828125, 0.3990478515625, 0.415283203125, 0.4315185546875, 0.44775390625, 0.4639892578125, 0.480224609375, 0.4964599609375, 0.5126953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 12.0, 13.0, 15.0, 14.0, 29.0, 21.0, 28.0, 31.0, 29.0, 43.0, 69.0, 59.0, 68.0, 64.0, 70.0, 62.0, 61.0, 52.0, 42.0, 44.0, 43.0, 30.0, 35.0, 7.0, 16.0, 4.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.1479644775390625, -0.143707275390625, -0.1394500732421875, -0.13519287109375, -0.1309356689453125, -0.126678466796875, -0.1224212646484375, -0.1181640625, -0.1139068603515625, -0.109649658203125, -0.1053924560546875, -0.10113525390625, -0.0968780517578125, -0.092620849609375, -0.0883636474609375, -0.0841064453125, -0.0798492431640625, -0.075592041015625, -0.0713348388671875, -0.06707763671875, -0.0628204345703125, -0.058563232421875, -0.0543060302734375, -0.050048828125, -0.0457916259765625, -0.041534423828125, -0.0372772216796875, -0.03302001953125, -0.0287628173828125, -0.024505615234375, -0.0202484130859375, -0.0159912109375, -0.0117340087890625, -0.007476806640625, -0.0032196044921875, 0.00103759765625, 0.0052947998046875, 0.009552001953125, 0.0138092041015625, 0.01806640625, 0.0223236083984375, 0.026580810546875, 0.0308380126953125, 0.03509521484375, 0.0393524169921875, 0.043609619140625, 0.0478668212890625, 0.0521240234375, 0.0563812255859375, 0.060638427734375, 0.0648956298828125, 0.06915283203125, 0.0734100341796875, 0.077667236328125, 0.0819244384765625, 0.086181640625, 0.0904388427734375, 0.094696044921875, 0.0989532470703125, 0.10321044921875, 0.1074676513671875, 0.111724853515625, 0.1159820556640625, 0.1202392578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 7.0, 12.0, 10.0, 29.0, 34.0, 49.0, 64.0, 67.0, 98.0, 158.0, 244.0, 376.0, 667.0, 1408.0, 3572.0, 12472.0, 289997.0, 3864122.0, 13750.0, 3830.0, 1461.0, 695.0, 389.0, 220.0, 161.0, 102.0, 78.0, 59.0, 37.0, 23.0, 28.0, 17.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8232421875, -0.7975387573242188, -0.7718353271484375, -0.7461318969726562, -0.720428466796875, -0.6947250366210938, -0.6690216064453125, -0.6433181762695312, -0.61761474609375, -0.5919113159179688, -0.5662078857421875, -0.5405044555664062, -0.514801025390625, -0.48909759521484375, -0.4633941650390625, -0.43769073486328125, -0.4119873046875, -0.38628387451171875, -0.3605804443359375, -0.33487701416015625, -0.309173583984375, -0.28347015380859375, -0.2577667236328125, -0.23206329345703125, -0.20635986328125, -0.18065643310546875, -0.1549530029296875, -0.12924957275390625, -0.103546142578125, -0.07784271240234375, -0.0521392822265625, -0.02643585205078125, -0.000732421875, 0.02497100830078125, 0.0506744384765625, 0.07637786865234375, 0.102081298828125, 0.12778472900390625, 0.1534881591796875, 0.17919158935546875, 0.20489501953125, 0.23059844970703125, 0.2563018798828125, 0.28200531005859375, 0.307708740234375, 0.33341217041015625, 0.3591156005859375, 0.38481903076171875, 0.4105224609375, 0.43622589111328125, 0.4619293212890625, 0.48763275146484375, 0.513336181640625, 0.5390396118164062, 0.5647430419921875, 0.5904464721679688, 0.61614990234375, 0.6418533325195312, 0.6675567626953125, 0.6932601928710938, 0.718963623046875, 0.7446670532226562, 0.7703704833984375, 0.7960739135742188, 0.82177734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 4.0, 6.0, 3.0, 8.0, 23.0, 41.0, 423.0, 3468.0, 49.0, 22.0, 13.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23950576782226562, -0.23303985595703125, -0.22657394409179688, -0.2201080322265625, -0.21364212036132812, -0.20717620849609375, -0.20071029663085938, -0.194244384765625, -0.18777847290039062, -0.18131256103515625, -0.17484664916992188, -0.1683807373046875, -0.16191482543945312, -0.15544891357421875, -0.14898300170898438, -0.14251708984375, -0.13605117797851562, -0.12958526611328125, -0.12311935424804688, -0.1166534423828125, -0.11018753051757812, -0.10372161865234375, -0.09725570678710938, -0.090789794921875, -0.08432388305664062, -0.07785797119140625, -0.07139205932617188, -0.0649261474609375, -0.058460235595703125, -0.05199432373046875, -0.045528411865234375, -0.0390625, -0.032596588134765625, -0.02613067626953125, -0.019664764404296875, -0.0131988525390625, -0.006732940673828125, -0.00026702880859375, 0.006198883056640625, 0.012664794921875, 0.019130706787109375, 0.02559661865234375, 0.032062530517578125, 0.0385284423828125, 0.044994354248046875, 0.05146026611328125, 0.057926177978515625, 0.06439208984375, 0.07085800170898438, 0.07732391357421875, 0.08378982543945312, 0.0902557373046875, 0.09672164916992188, 0.10318756103515625, 0.10965347290039062, 0.116119384765625, 0.12258529663085938, 0.12905120849609375, 0.13551712036132812, 0.1419830322265625, 0.14844894409179688, 0.15491485595703125, 0.16138076782226562, 0.1678466796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 5.0, 9.0, 16.0, 27.0, 40.0, 55.0, 96.0, 109.0, 114.0, 131.0, 121.0, 92.0, 63.0, 28.0, 26.0, 20.0, 16.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5904878377914429, -0.574653148651123, -0.5588184595108032, -0.5429837107658386, -0.5271490216255188, -0.511314332485199, -0.49547961354255676, -0.47964489459991455, -0.4638102054595947, -0.4479755163192749, -0.4321407973766327, -0.4163060784339905, -0.40047138929367065, -0.38463670015335083, -0.3688019812107086, -0.3529672622680664, -0.3371325731277466, -0.32129788398742676, -0.30546316504478455, -0.28962844610214233, -0.2737937569618225, -0.2579590678215027, -0.24212434887886047, -0.22628964483737946, -0.21045494079589844, -0.19462023675441742, -0.1787855327129364, -0.16295082867145538, -0.14711612462997437, -0.13128142058849335, -0.11544671654701233, -0.09961201250553131, -0.08377724885940552, -0.0679425448179245, -0.05210784077644348, -0.03627313673496246, -0.020438432693481445, -0.004603728652000427, 0.01123097538948059, 0.02706567943096161, 0.04290038347244263, 0.058735087513923645, 0.07456979155540466, 0.09040449559688568, 0.1062391996383667, 0.12207390367984772, 0.13790860772132874, 0.15374331176280975, 0.16957801580429077, 0.1854127198457718, 0.2012474238872528, 0.21708212792873383, 0.23291683197021484, 0.24875153601169586, 0.2645862400531769, 0.2804209589958191, 0.2962556481361389, 0.31209033727645874, 0.32792505621910095, 0.34375977516174316, 0.359594464302063, 0.3754291534423828, 0.391263872385025, 0.40709859132766724, 0.42293328046798706]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 13.0, 19.0, 19.0, 16.0, 23.0, 22.0, 32.0, 20.0, 33.0, 33.0, 40.0, 33.0, 48.0, 29.0, 44.0, 41.0, 43.0, 36.0, 28.0, 37.0, 31.0, 45.0, 36.0, 33.0, 15.0, 20.0, 22.0, 17.0, 18.0, 18.0, 13.0, 18.0, 18.0, 8.0, 8.0, 12.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22275447845458984, -0.21590979397296906, -0.20906510949134827, -0.20222041010856628, -0.1953757256269455, -0.1885310411453247, -0.18168634176254272, -0.17484165728092194, -0.16799697279930115, -0.16115228831768036, -0.15430760383605957, -0.1474629044532776, -0.1406182199716568, -0.133773535490036, -0.12692883610725403, -0.12008415162563324, -0.11323946714401245, -0.10639478266239166, -0.09955009073019028, -0.09270539879798889, -0.0858607143163681, -0.07901602983474731, -0.07217133790254593, -0.06532664597034454, -0.058481961488723755, -0.05163727328181267, -0.04479258507490158, -0.037947896867990494, -0.031103208661079407, -0.02425852045416832, -0.017413832247257233, -0.010569144040346146, -0.0037244558334350586, 0.0031202323734760284, 0.009964920580387115, 0.016809608787298203, 0.02365429699420929, 0.030498985201120377, 0.037343673408031464, 0.04418836161494255, 0.05103304982185364, 0.057877738028764725, 0.06472242623567581, 0.0715671181678772, 0.07841180264949799, 0.08525648713111877, 0.09210117906332016, 0.09894587099552155, 0.10579055547714233, 0.11263523995876312, 0.11947993189096451, 0.1263246238231659, 0.13316930830478668, 0.14001399278640747, 0.14685869216918945, 0.15370337665081024, 0.16054806113243103, 0.16739274561405182, 0.1742374300956726, 0.1810821294784546, 0.18792681396007538, 0.19477149844169617, 0.20161619782447815, 0.20846088230609894, 0.21530556678771973]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 14.0, 37.0, 38.0, 61.0, 129.0, 171.0, 272.0, 444.0, 669.0, 1182.0, 1931.0, 3572.0, 6511.0, 12468.0, 24290.0, 49406.0, 100855.0, 199051.0, 279832.0, 183705.0, 91317.0, 44958.0, 22230.0, 11420.0, 5958.0, 3249.0, 1872.0, 1094.0, 639.0, 401.0, 240.0, 172.0, 96.0, 73.0, 53.0, 31.0, 26.0, 20.0, 14.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15048599243164062, -0.14569854736328125, -0.14091110229492188, -0.1361236572265625, -0.13133621215820312, -0.12654876708984375, -0.12176132202148438, -0.116973876953125, -0.11218643188476562, -0.10739898681640625, -0.10261154174804688, -0.0978240966796875, -0.09303665161132812, -0.08824920654296875, -0.08346176147460938, -0.07867431640625, -0.07388687133789062, -0.06909942626953125, -0.06431198120117188, -0.0595245361328125, -0.054737091064453125, -0.04994964599609375, -0.045162200927734375, -0.040374755859375, -0.035587310791015625, -0.03079986572265625, -0.026012420654296875, -0.0212249755859375, -0.016437530517578125, -0.01165008544921875, -0.006862640380859375, -0.0020751953125, 0.002712249755859375, 0.00749969482421875, 0.012287139892578125, 0.0170745849609375, 0.021862030029296875, 0.02664947509765625, 0.031436920166015625, 0.036224365234375, 0.041011810302734375, 0.04579925537109375, 0.050586700439453125, 0.0553741455078125, 0.060161590576171875, 0.06494903564453125, 0.06973648071289062, 0.07452392578125, 0.07931137084960938, 0.08409881591796875, 0.08888626098632812, 0.0936737060546875, 0.09846115112304688, 0.10324859619140625, 0.10803604125976562, 0.112823486328125, 0.11761093139648438, 0.12239837646484375, 0.12718582153320312, 0.1319732666015625, 0.13676071166992188, 0.14154815673828125, 0.14633560180664062, 0.151123046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 13.0, 10.0, 18.0, 16.0, 24.0, 26.0, 35.0, 42.0, 41.0, 38.0, 63.0, 73.0, 72.0, 63.0, 60.0, 67.0, 67.0, 47.0, 48.0, 39.0, 31.0, 22.0, 22.0, 17.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15725326538085938, -0.15251922607421875, -0.14778518676757812, -0.1430511474609375, -0.13831710815429688, -0.13358306884765625, -0.12884902954101562, -0.124114990234375, -0.11938095092773438, -0.11464691162109375, -0.10991287231445312, -0.1051788330078125, -0.10044479370117188, -0.09571075439453125, -0.09097671508789062, -0.08624267578125, -0.08150863647460938, -0.07677459716796875, -0.07204055786132812, -0.0673065185546875, -0.06257247924804688, -0.05783843994140625, -0.053104400634765625, -0.048370361328125, -0.043636322021484375, -0.03890228271484375, -0.034168243408203125, -0.0294342041015625, -0.024700164794921875, -0.01996612548828125, -0.015232086181640625, -0.010498046875, -0.005764007568359375, -0.00102996826171875, 0.003704071044921875, 0.0084381103515625, 0.013172149658203125, 0.01790618896484375, 0.022640228271484375, 0.027374267578125, 0.032108306884765625, 0.03684234619140625, 0.041576385498046875, 0.0463104248046875, 0.051044464111328125, 0.05577850341796875, 0.060512542724609375, 0.06524658203125, 0.06998062133789062, 0.07471466064453125, 0.07944869995117188, 0.0841827392578125, 0.08891677856445312, 0.09365081787109375, 0.09838485717773438, 0.103118896484375, 0.10785293579101562, 0.11258697509765625, 0.11732101440429688, 0.1220550537109375, 0.12678909301757812, 0.13152313232421875, 0.13625717163085938, 0.1409912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 21.0, 9.0, 31.0, 30.0, 43.0, 60.0, 81.0, 75.0, 124.0, 175.0, 249.0, 333.0, 472.0, 740.0, 1428.0, 3172.0, 9614.0, 40706.0, 249322.0, 597281.0, 112280.0, 21213.0, 5680.0, 2170.0, 1099.0, 630.0, 419.0, 255.0, 179.0, 141.0, 114.0, 92.0, 66.0, 55.0, 33.0, 31.0, 20.0, 16.0, 6.0, 11.0, 13.0, 9.0, 2.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.283203125, -0.2738533020019531, -0.26450347900390625, -0.2551536560058594, -0.2458038330078125, -0.23645401000976562, -0.22710418701171875, -0.21775436401367188, -0.208404541015625, -0.19905471801757812, -0.18970489501953125, -0.18035507202148438, -0.1710052490234375, -0.16165542602539062, -0.15230560302734375, -0.14295578002929688, -0.13360595703125, -0.12425613403320312, -0.11490631103515625, -0.10555648803710938, -0.0962066650390625, -0.08685684204101562, -0.07750701904296875, -0.06815719604492188, -0.058807373046875, -0.049457550048828125, -0.04010772705078125, -0.030757904052734375, -0.0214080810546875, -0.012058258056640625, -0.00270843505859375, 0.006641387939453125, 0.0159912109375, 0.025341033935546875, 0.03469085693359375, 0.044040679931640625, 0.0533905029296875, 0.06274032592773438, 0.07209014892578125, 0.08143997192382812, 0.090789794921875, 0.10013961791992188, 0.10948944091796875, 0.11883926391601562, 0.1281890869140625, 0.13753890991210938, 0.14688873291015625, 0.15623855590820312, 0.16558837890625, 0.17493820190429688, 0.18428802490234375, 0.19363784790039062, 0.2029876708984375, 0.21233749389648438, 0.22168731689453125, 0.23103713989257812, 0.240386962890625, 0.24973678588867188, 0.25908660888671875, 0.2684364318847656, 0.2777862548828125, 0.2871360778808594, 0.29648590087890625, 0.3058357238769531, 0.315185546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 15.0, 10.0, 5.0, 9.0, 17.0, 21.0, 24.0, 24.0, 28.0, 23.0, 30.0, 24.0, 34.0, 39.0, 41.0, 54.0, 39.0, 60.0, 39.0, 39.0, 38.0, 38.0, 28.0, 29.0, 30.0, 38.0, 36.0, 24.0, 10.0, 24.0, 32.0, 15.0, 15.0, 12.0, 11.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3796272277832031, -0.36545562744140625, -0.3512840270996094, -0.3371124267578125, -0.3229408264160156, -0.30876922607421875, -0.2945976257324219, -0.280426025390625, -0.2662544250488281, -0.25208282470703125, -0.23791122436523438, -0.2237396240234375, -0.20956802368164062, -0.19539642333984375, -0.18122482299804688, -0.16705322265625, -0.15288162231445312, -0.13871002197265625, -0.12453842163085938, -0.1103668212890625, -0.09619522094726562, -0.08202362060546875, -0.06785202026367188, -0.053680419921875, -0.039508819580078125, -0.02533721923828125, -0.011165618896484375, 0.0030059814453125, 0.017177581787109375, 0.03134918212890625, 0.045520782470703125, 0.0596923828125, 0.07386398315429688, 0.08803558349609375, 0.10220718383789062, 0.1163787841796875, 0.13055038452148438, 0.14472198486328125, 0.15889358520507812, 0.173065185546875, 0.18723678588867188, 0.20140838623046875, 0.21557998657226562, 0.2297515869140625, 0.24392318725585938, 0.25809478759765625, 0.2722663879394531, 0.28643798828125, 0.3006095886230469, 0.31478118896484375, 0.3289527893066406, 0.3431243896484375, 0.3572959899902344, 0.37146759033203125, 0.3856391906738281, 0.399810791015625, 0.4139823913574219, 0.42815399169921875, 0.4423255920410156, 0.4564971923828125, 0.4706687927246094, 0.48484039306640625, 0.4990119934082031, 0.51318359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 16.0, 22.0, 13.0, 37.0, 38.0, 91.0, 144.0, 261.0, 592.0, 1465.0, 4899.0, 28057.0, 422791.0, 548192.0, 33543.0, 5479.0, 1610.0, 626.0, 281.0, 134.0, 87.0, 44.0, 38.0, 19.0, 19.0, 6.0, 9.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.288330078125, -0.2803306579589844, -0.27233123779296875, -0.2643318176269531, -0.2563323974609375, -0.24833297729492188, -0.24033355712890625, -0.23233413696289062, -0.224334716796875, -0.21633529663085938, -0.20833587646484375, -0.20033645629882812, -0.1923370361328125, -0.18433761596679688, -0.17633819580078125, -0.16833877563476562, -0.16033935546875, -0.15233993530273438, -0.14434051513671875, -0.13634109497070312, -0.1283416748046875, -0.12034225463867188, -0.11234283447265625, -0.10434341430664062, -0.096343994140625, -0.08834457397460938, -0.08034515380859375, -0.07234573364257812, -0.0643463134765625, -0.056346893310546875, -0.04834747314453125, -0.040348052978515625, -0.0323486328125, -0.024349212646484375, -0.01634979248046875, -0.008350372314453125, -0.0003509521484375, 0.007648468017578125, 0.01564788818359375, 0.023647308349609375, 0.031646728515625, 0.039646148681640625, 0.04764556884765625, 0.055644989013671875, 0.0636444091796875, 0.07164382934570312, 0.07964324951171875, 0.08764266967773438, 0.09564208984375, 0.10364151000976562, 0.11164093017578125, 0.11964035034179688, 0.1276397705078125, 0.13563919067382812, 0.14363861083984375, 0.15163803100585938, 0.159637451171875, 0.16763687133789062, 0.17563629150390625, 0.18363571166992188, 0.1916351318359375, 0.19963455200195312, 0.20763397216796875, 0.21563339233398438, 0.2236328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 13.0, 17.0, 34.0, 34.0, 49.0, 75.0, 124.0, 157.0, 133.0, 103.0, 74.0, 57.0, 29.0, 26.0, 15.0, 17.0, 10.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.667043685913086e-05, -4.479195922613144e-05, -4.291348159313202e-05, -4.10350039601326e-05, -3.915652632713318e-05, -3.727804869413376e-05, -3.539957106113434e-05, -3.352109342813492e-05, -3.16426157951355e-05, -2.9764138162136078e-05, -2.7885660529136658e-05, -2.6007182896137238e-05, -2.4128705263137817e-05, -2.2250227630138397e-05, -2.0371749997138977e-05, -1.8493272364139557e-05, -1.6614794731140137e-05, -1.4736317098140717e-05, -1.2857839465141296e-05, -1.0979361832141876e-05, -9.100884199142456e-06, -7.222406566143036e-06, -5.343928933143616e-06, -3.4654513001441956e-06, -1.5869736671447754e-06, 2.915039658546448e-07, 2.169981598854065e-06, 4.048459231853485e-06, 5.926936864852905e-06, 7.805414497852325e-06, 9.683892130851746e-06, 1.1562369763851166e-05, 1.3440847396850586e-05, 1.5319325029850006e-05, 1.7197802662849426e-05, 1.9076280295848846e-05, 2.0954757928848267e-05, 2.2833235561847687e-05, 2.4711713194847107e-05, 2.6590190827846527e-05, 2.8468668460845947e-05, 3.0347146093845367e-05, 3.222562372684479e-05, 3.410410135984421e-05, 3.598257899284363e-05, 3.786105662584305e-05, 3.973953425884247e-05, 4.161801189184189e-05, 4.349648952484131e-05, 4.537496715784073e-05, 4.725344479084015e-05, 4.913192242383957e-05, 5.101040005683899e-05, 5.288887768983841e-05, 5.476735532283783e-05, 5.664583295583725e-05, 5.852431058883667e-05, 6.040278822183609e-05, 6.228126585483551e-05, 6.415974348783493e-05, 6.603822112083435e-05, 6.791669875383377e-05, 6.979517638683319e-05, 7.167365401983261e-05, 7.355213165283203e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 26.0, 32.0, 61.0, 108.0, 172.0, 332.0, 820.0, 2184.0, 10323.0, 106401.0, 816587.0, 97932.0, 9754.0, 2267.0, 800.0, 326.0, 168.0, 86.0, 52.0, 31.0, 22.0, 13.0, 7.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3324413299560547, -0.3233299255371094, -0.31421852111816406, -0.30510711669921875, -0.29599571228027344, -0.2868843078613281, -0.2777729034423828, -0.2686614990234375, -0.2595500946044922, -0.2504386901855469, -0.24132728576660156, -0.23221588134765625, -0.22310447692871094, -0.21399307250976562, -0.2048816680908203, -0.195770263671875, -0.1866588592529297, -0.17754745483398438, -0.16843605041503906, -0.15932464599609375, -0.15021324157714844, -0.14110183715820312, -0.1319904327392578, -0.1228790283203125, -0.11376762390136719, -0.10465621948242188, -0.09554481506347656, -0.08643341064453125, -0.07732200622558594, -0.06821060180664062, -0.05909919738769531, -0.04998779296875, -0.04087638854980469, -0.031764984130859375, -0.022653579711914062, -0.01354217529296875, -0.0044307708740234375, 0.004680633544921875, 0.013792037963867188, 0.0229034423828125, 0.03201484680175781, 0.041126251220703125, 0.05023765563964844, 0.05934906005859375, 0.06846046447753906, 0.07757186889648438, 0.08668327331542969, 0.095794677734375, 0.10490608215332031, 0.11401748657226562, 0.12312889099121094, 0.13224029541015625, 0.14135169982910156, 0.15046310424804688, 0.1595745086669922, 0.1686859130859375, 0.1777973175048828, 0.18690872192382812, 0.19602012634277344, 0.20513153076171875, 0.21424293518066406, 0.22335433959960938, 0.2324657440185547, 0.2415771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 15.0, 23.0, 33.0, 48.0, 73.0, 70.0, 119.0, 97.0, 136.0, 91.0, 94.0, 63.0, 41.0, 23.0, 18.0, 14.0, 9.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2871742248535156, -0.28015899658203125, -0.2731437683105469, -0.2661285400390625, -0.2591133117675781, -0.25209808349609375, -0.24508285522460938, -0.238067626953125, -0.23105239868164062, -0.22403717041015625, -0.21702194213867188, -0.2100067138671875, -0.20299148559570312, -0.19597625732421875, -0.18896102905273438, -0.18194580078125, -0.17493057250976562, -0.16791534423828125, -0.16090011596679688, -0.1538848876953125, -0.14686965942382812, -0.13985443115234375, -0.13283920288085938, -0.125823974609375, -0.11880874633789062, -0.11179351806640625, -0.10477828979492188, -0.0977630615234375, -0.09074783325195312, -0.08373260498046875, -0.07671737670898438, -0.0697021484375, -0.06268692016601562, -0.05567169189453125, -0.048656463623046875, -0.0416412353515625, -0.034626007080078125, -0.02761077880859375, -0.020595550537109375, -0.013580322265625, -0.006565093994140625, 0.00045013427734375, 0.007465362548828125, 0.0144805908203125, 0.021495819091796875, 0.02851104736328125, 0.035526275634765625, 0.04254150390625, 0.049556732177734375, 0.05657196044921875, 0.06358718872070312, 0.0706024169921875, 0.07761764526367188, 0.08463287353515625, 0.09164810180664062, 0.098663330078125, 0.10567855834960938, 0.11269378662109375, 0.11970901489257812, 0.1267242431640625, 0.13373947143554688, 0.14075469970703125, 0.14776992797851562, 0.15478515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 15.0, 37.0, 75.0, 106.0, 142.0, 178.0, 167.0, 114.0, 66.0, 43.0, 20.0, 8.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.119657516479492, -4.010087490081787, -3.900517702102661, -3.790947914123535, -3.681378126144409, -3.571808338165283, -3.462238311767578, -3.352668523788452, -3.243098735809326, -3.1335289478302, -3.023958921432495, -2.914389133453369, -2.804819345474243, -2.695249557495117, -2.585679531097412, -2.476109743118286, -2.366539716720581, -2.256969928741455, -2.14739990234375, -2.037830114364624, -1.928260326385498, -1.8186904191970825, -1.709120512008667, -1.599550724029541, -1.4899808168411255, -1.38041090965271, -1.270841121673584, -1.1612712144851685, -1.051701307296753, -0.942131519317627, -0.8325616121292114, -0.7229917645454407, -0.6134216785430908, -0.5038518309593201, -0.39428195357322693, -0.2847120761871338, -0.17514222860336304, -0.06557238101959229, 0.04399752616882324, 0.153567373752594, 0.26313722133636475, 0.3727070689201355, 0.48227694630622864, 0.5918468236923218, 0.7014166712760925, 0.8109865188598633, 0.9205564260482788, 1.0301263332366943, 1.1396961212158203, 1.2492660284042358, 1.3588358163833618, 1.4684057235717773, 1.5779755115509033, 1.6875454187393188, 1.7971153259277344, 1.9066851139068604, 2.0162549018859863, 2.1258246898651123, 2.2353947162628174, 2.3449645042419434, 2.4545342922210693, 2.5641040802001953, 2.6736741065979004, 2.7832438945770264, 2.8928139209747314]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 9.0, 9.0, 7.0, 5.0, 16.0, 15.0, 20.0, 22.0, 26.0, 32.0, 40.0, 33.0, 54.0, 43.0, 52.0, 69.0, 74.0, 61.0, 60.0, 46.0, 52.0, 43.0, 31.0, 33.0, 26.0, 21.0, 19.0, 19.0, 13.0, 13.0, 10.0, 3.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-3.3458478450775146, -3.259589195251465, -3.173330307006836, -3.087071657180786, -3.0008130073547363, -2.9145543575286865, -2.8282957077026367, -2.742036819458008, -2.655778169631958, -2.569519519805908, -2.4832606315612793, -2.3970019817352295, -2.3107433319091797, -2.22448468208313, -2.13822603225708, -2.051967144012451, -1.9657084941864014, -1.8794498443603516, -1.7931910753250122, -1.7069323062896729, -1.620673656463623, -1.5344150066375732, -1.4481562376022339, -1.3618974685668945, -1.2756388187408447, -1.189380168914795, -1.1031213998794556, -1.0168626308441162, -0.9306039810180664, -0.8443452715873718, -0.7580865621566772, -0.6718278527259827, -0.5855693817138672, -0.4993106722831726, -0.413051962852478, -0.32679325342178345, -0.24053454399108887, -0.1542758345603943, -0.06801712512969971, 0.018241584300994873, 0.10450029373168945, 0.19075900316238403, 0.2770177125930786, 0.3632764220237732, 0.4495351314544678, 0.5357938408851624, 0.6220525503158569, 0.7083112597465515, 0.7945699691772461, 0.8808286786079407, 0.9670873880386353, 1.0533461570739746, 1.1396048069000244, 1.2258634567260742, 1.3121222257614136, 1.398380994796753, 1.4846396446228027, 1.5708982944488525, 1.657157063484192, 1.7434158325195312, 1.829674482345581, 1.9159331321716309, 2.0021920204162598, 2.0884506702423096, 2.1747093200683594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 3.0, 8.0, 6.0, 15.0, 19.0, 35.0, 53.0, 59.0, 100.0, 130.0, 188.0, 325.0, 424.0, 655.0, 1057.0, 1864.0, 3379.0, 7028.0, 18008.0, 94084.0, 3977468.0, 61372.0, 14475.0, 6002.0, 2989.0, 1683.0, 1003.0, 597.0, 406.0, 258.0, 179.0, 119.0, 76.0, 51.0, 46.0, 27.0, 23.0, 15.0, 15.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2844200134277344, -0.27440643310546875, -0.2643928527832031, -0.2543792724609375, -0.24436569213867188, -0.23435211181640625, -0.22433853149414062, -0.214324951171875, -0.20431137084960938, -0.19429779052734375, -0.18428421020507812, -0.1742706298828125, -0.16425704956054688, -0.15424346923828125, -0.14422988891601562, -0.13421630859375, -0.12420272827148438, -0.11418914794921875, -0.10417556762695312, -0.0941619873046875, -0.08414840698242188, -0.07413482666015625, -0.06412124633789062, -0.054107666015625, -0.044094085693359375, -0.03408050537109375, -0.024066925048828125, -0.0140533447265625, -0.004039764404296875, 0.00597381591796875, 0.015987396240234375, 0.0260009765625, 0.036014556884765625, 0.04602813720703125, 0.056041717529296875, 0.0660552978515625, 0.07606887817382812, 0.08608245849609375, 0.09609603881835938, 0.106109619140625, 0.11612319946289062, 0.12613677978515625, 0.13615036010742188, 0.1461639404296875, 0.15617752075195312, 0.16619110107421875, 0.17620468139648438, 0.18621826171875, 0.19623184204101562, 0.20624542236328125, 0.21625900268554688, 0.2262725830078125, 0.23628616333007812, 0.24629974365234375, 0.2563133239746094, 0.266326904296875, 0.2763404846191406, 0.28635406494140625, 0.2963676452636719, 0.3063812255859375, 0.3163948059082031, 0.32640838623046875, 0.3364219665527344, 0.346435546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 28.0, 29.0, 34.0, 38.0, 46.0, 50.0, 60.0, 61.0, 65.0, 70.0, 58.0, 57.0, 62.0, 44.0, 38.0, 28.0, 35.0, 23.0, 20.0, 19.0, 15.0, 9.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1629638671875, -0.1585378646850586, -0.1541118621826172, -0.14968585968017578, -0.14525985717773438, -0.14083385467529297, -0.13640785217285156, -0.13198184967041016, -0.12755584716796875, -0.12312984466552734, -0.11870384216308594, -0.11427783966064453, -0.10985183715820312, -0.10542583465576172, -0.10099983215332031, -0.0965738296508789, -0.0921478271484375, -0.0877218246459961, -0.08329582214355469, -0.07886981964111328, -0.07444381713867188, -0.07001781463623047, -0.06559181213378906, -0.061165809631347656, -0.05673980712890625, -0.052313804626464844, -0.04788780212402344, -0.04346179962158203, -0.039035797119140625, -0.03460979461669922, -0.030183792114257812, -0.025757789611816406, -0.021331787109375, -0.016905784606933594, -0.012479782104492188, -0.008053779602050781, -0.003627777099609375, 0.0007982254028320312, 0.0052242279052734375, 0.009650230407714844, 0.01407623291015625, 0.018502235412597656, 0.022928237915039062, 0.02735424041748047, 0.031780242919921875, 0.03620624542236328, 0.04063224792480469, 0.045058250427246094, 0.0494842529296875, 0.053910255432128906, 0.05833625793457031, 0.06276226043701172, 0.06718826293945312, 0.07161426544189453, 0.07604026794433594, 0.08046627044677734, 0.08489227294921875, 0.08931827545166016, 0.09374427795410156, 0.09817028045654297, 0.10259628295898438, 0.10702228546142578, 0.11144828796386719, 0.1158742904663086, 0.12030029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 9.0, 10.0, 10.0, 21.0, 20.0, 32.0, 51.0, 78.0, 128.0, 229.0, 444.0, 970.0, 2551.0, 9695.0, 81384.0, 4053118.0, 35802.0, 6255.0, 1817.0, 736.0, 367.0, 198.0, 109.0, 80.0, 32.0, 25.0, 25.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8662109375, -0.840240478515625, -0.81427001953125, -0.788299560546875, -0.7623291015625, -0.736358642578125, -0.71038818359375, -0.684417724609375, -0.658447265625, -0.632476806640625, -0.60650634765625, -0.580535888671875, -0.5545654296875, -0.528594970703125, -0.50262451171875, -0.476654052734375, -0.45068359375, -0.424713134765625, -0.39874267578125, -0.372772216796875, -0.3468017578125, -0.320831298828125, -0.29486083984375, -0.268890380859375, -0.242919921875, -0.216949462890625, -0.19097900390625, -0.165008544921875, -0.1390380859375, -0.113067626953125, -0.08709716796875, -0.061126708984375, -0.03515625, -0.009185791015625, 0.01678466796875, 0.042755126953125, 0.0687255859375, 0.094696044921875, 0.12066650390625, 0.146636962890625, 0.172607421875, 0.198577880859375, 0.22454833984375, 0.250518798828125, 0.2764892578125, 0.302459716796875, 0.32843017578125, 0.354400634765625, 0.38037109375, 0.406341552734375, 0.43231201171875, 0.458282470703125, 0.4842529296875, 0.510223388671875, 0.53619384765625, 0.562164306640625, 0.588134765625, 0.614105224609375, 0.64007568359375, 0.666046142578125, 0.6920166015625, 0.717987060546875, 0.74395751953125, 0.769927978515625, 0.7958984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 15.0, 24.0, 39.0, 73.0, 235.0, 3345.0, 188.0, 61.0, 22.0, 17.0, 10.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18571853637695312, -0.17661285400390625, -0.16750717163085938, -0.1584014892578125, -0.14929580688476562, -0.14019012451171875, -0.13108444213867188, -0.121978759765625, -0.11287307739257812, -0.10376739501953125, -0.09466171264648438, -0.0855560302734375, -0.07645034790039062, -0.06734466552734375, -0.058238983154296875, -0.04913330078125, -0.040027618408203125, -0.03092193603515625, -0.021816253662109375, -0.0127105712890625, -0.003604888916015625, 0.00550079345703125, 0.014606475830078125, 0.023712158203125, 0.032817840576171875, 0.04192352294921875, 0.051029205322265625, 0.0601348876953125, 0.06924057006835938, 0.07834625244140625, 0.08745193481445312, 0.0965576171875, 0.10566329956054688, 0.11476898193359375, 0.12387466430664062, 0.1329803466796875, 0.14208602905273438, 0.15119171142578125, 0.16029739379882812, 0.169403076171875, 0.17850875854492188, 0.18761444091796875, 0.19672012329101562, 0.2058258056640625, 0.21493148803710938, 0.22403717041015625, 0.23314285278320312, 0.24224853515625, 0.2513542175292969, 0.26045989990234375, 0.2695655822753906, 0.2786712646484375, 0.2877769470214844, 0.29688262939453125, 0.3059883117675781, 0.315093994140625, 0.3241996765136719, 0.33330535888671875, 0.3424110412597656, 0.3515167236328125, 0.3606224060058594, 0.36972808837890625, 0.3788337707519531, 0.387939453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 4.0, 9.0, 15.0, 16.0, 19.0, 27.0, 39.0, 38.0, 48.0, 59.0, 65.0, 79.0, 82.0, 70.0, 68.0, 62.0, 59.0, 43.0, 27.0, 36.0, 33.0, 19.0, 9.0, 5.0, 9.0, 12.0, 3.0, 8.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.7346688508987427, -0.7159498929977417, -0.6972309947013855, -0.6785120368003845, -0.6597931385040283, -0.6410741806030273, -0.6223552823066711, -0.6036363244056702, -0.584917426109314, -0.566198468208313, -0.5474795699119568, -0.5287606120109558, -0.5100417137145996, -0.49132275581359863, -0.47260382771492004, -0.45388489961624146, -0.4351659417152405, -0.4164470136165619, -0.3977280855178833, -0.3790091574192047, -0.3602902293205261, -0.34157127141952515, -0.32285234332084656, -0.30413341522216797, -0.2854144871234894, -0.2666955590248108, -0.2479766309261322, -0.22925768792629242, -0.21053875982761383, -0.19181983172893524, -0.17310088872909546, -0.15438196063041687, -0.13566303253173828, -0.11694410443305969, -0.0982251688838005, -0.07950623333454132, -0.06078730523586273, -0.04206837713718414, -0.023349441587924957, -0.0046305060386657715, 0.014088422060012817, 0.032807353883981705, 0.05152628570795059, 0.07024522125720978, 0.08896414935588837, 0.10768307745456696, 0.12640202045440674, 0.14512094855308533, 0.16383987665176392, 0.1825588047504425, 0.2012777328491211, 0.21999667584896088, 0.23871560394763947, 0.25743454694747925, 0.27615347504615784, 0.2948724031448364, 0.313591331243515, 0.3323102593421936, 0.3510291874408722, 0.3697481155395508, 0.38846707344055176, 0.40718597173690796, 0.42590492963790894, 0.4446238577365875, 0.4633427858352661]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 8.0, 14.0, 14.0, 15.0, 18.0, 23.0, 19.0, 21.0, 23.0, 21.0, 25.0, 43.0, 36.0, 30.0, 42.0, 41.0, 56.0, 32.0, 39.0, 51.0, 42.0, 37.0, 37.0, 35.0, 29.0, 39.0, 14.0, 30.0, 27.0, 17.0, 13.0, 10.0, 16.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.5365151166915894, -0.5212335586547852, -0.505952000617981, -0.49067047238349915, -0.47538894414901733, -0.46010738611221313, -0.44482582807540894, -0.4295442998409271, -0.4142627716064453, -0.3989812135696411, -0.3836996853351593, -0.3684181272983551, -0.3531365990638733, -0.3378550410270691, -0.3225734829902649, -0.3072919547557831, -0.2920103967189789, -0.2767288386821747, -0.26144731044769287, -0.24616575241088867, -0.23088422417640686, -0.21560266613960266, -0.20032112300395966, -0.18503957986831665, -0.16975803673267365, -0.15447649359703064, -0.13919495046138763, -0.12391339987516403, -0.10863185673952103, -0.09335031360387802, -0.07806876301765442, -0.06278721988201141, -0.04750567674636841, -0.0322241336107254, -0.0169425867497921, -0.0016610398888587952, 0.01362050324678421, 0.028902046382427216, 0.04418359696865082, 0.05946514010429382, 0.07474668323993683, 0.09002822637557983, 0.10530976951122284, 0.12059132009744644, 0.13587287068367004, 0.15115439891815186, 0.16643595695495605, 0.18171750009059906, 0.19699904322624207, 0.21228058636188507, 0.22756212949752808, 0.24284368753433228, 0.2581252157688141, 0.2734067738056183, 0.2886883020401001, 0.3039698600769043, 0.3192514181137085, 0.3345329761505127, 0.3498145043849945, 0.3650960624217987, 0.3803775906562805, 0.3956591486930847, 0.4109407067298889, 0.4262222349643707, 0.44150376319885254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 27.0, 25.0, 47.0, 72.0, 136.0, 201.0, 322.0, 528.0, 950.0, 1597.0, 2941.0, 5454.0, 10732.0, 21836.0, 47791.0, 114419.0, 296047.0, 321363.0, 124025.0, 51936.0, 23394.0, 11521.0, 5825.0, 3258.0, 1681.0, 985.0, 562.0, 322.0, 227.0, 115.0, 63.0, 39.0, 41.0, 22.0, 7.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.231964111328125, -0.22369384765625, -0.215423583984375, -0.2071533203125, -0.198883056640625, -0.19061279296875, -0.182342529296875, -0.174072265625, -0.165802001953125, -0.15753173828125, -0.149261474609375, -0.1409912109375, -0.132720947265625, -0.12445068359375, -0.116180419921875, -0.10791015625, -0.099639892578125, -0.09136962890625, -0.083099365234375, -0.0748291015625, -0.066558837890625, -0.05828857421875, -0.050018310546875, -0.041748046875, -0.033477783203125, -0.02520751953125, -0.016937255859375, -0.0086669921875, -0.000396728515625, 0.00787353515625, 0.016143798828125, 0.0244140625, 0.032684326171875, 0.04095458984375, 0.049224853515625, 0.0574951171875, 0.065765380859375, 0.07403564453125, 0.082305908203125, 0.090576171875, 0.098846435546875, 0.10711669921875, 0.115386962890625, 0.1236572265625, 0.131927490234375, 0.14019775390625, 0.148468017578125, 0.15673828125, 0.165008544921875, 0.17327880859375, 0.181549072265625, 0.1898193359375, 0.198089599609375, 0.20635986328125, 0.214630126953125, 0.222900390625, 0.231170654296875, 0.23944091796875, 0.247711181640625, 0.2559814453125, 0.264251708984375, 0.27252197265625, 0.280792236328125, 0.2890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 4.0, 12.0, 9.0, 12.0, 24.0, 13.0, 21.0, 29.0, 37.0, 36.0, 38.0, 44.0, 59.0, 57.0, 58.0, 55.0, 54.0, 60.0, 43.0, 45.0, 41.0, 38.0, 43.0, 27.0, 27.0, 26.0, 13.0, 16.0, 12.0, 6.0, 8.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.149688720703125, -0.14532470703125, -0.140960693359375, -0.1365966796875, -0.132232666015625, -0.12786865234375, -0.123504638671875, -0.119140625, -0.114776611328125, -0.11041259765625, -0.106048583984375, -0.1016845703125, -0.097320556640625, -0.09295654296875, -0.088592529296875, -0.084228515625, -0.079864501953125, -0.07550048828125, -0.071136474609375, -0.0667724609375, -0.062408447265625, -0.05804443359375, -0.053680419921875, -0.04931640625, -0.044952392578125, -0.04058837890625, -0.036224365234375, -0.0318603515625, -0.027496337890625, -0.02313232421875, -0.018768310546875, -0.014404296875, -0.010040283203125, -0.00567626953125, -0.001312255859375, 0.0030517578125, 0.007415771484375, 0.01177978515625, 0.016143798828125, 0.0205078125, 0.024871826171875, 0.02923583984375, 0.033599853515625, 0.0379638671875, 0.042327880859375, 0.04669189453125, 0.051055908203125, 0.055419921875, 0.059783935546875, 0.06414794921875, 0.068511962890625, 0.0728759765625, 0.077239990234375, 0.08160400390625, 0.085968017578125, 0.09033203125, 0.094696044921875, 0.09906005859375, 0.103424072265625, 0.1077880859375, 0.112152099609375, 0.11651611328125, 0.120880126953125, 0.125244140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 14.0, 10.0, 17.0, 21.0, 24.0, 30.0, 41.0, 57.0, 78.0, 134.0, 186.0, 302.0, 445.0, 756.0, 1371.0, 2877.0, 7832.0, 29229.0, 185809.0, 679882.0, 108158.0, 19914.0, 5833.0, 2406.0, 1228.0, 654.0, 430.0, 245.0, 153.0, 120.0, 70.0, 54.0, 54.0, 28.0, 27.0, 13.0, 11.0, 12.0, 2.0, 7.0, 0.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.494964599609375, -0.47967529296875, -0.464385986328125, -0.4490966796875, -0.433807373046875, -0.41851806640625, -0.403228759765625, -0.387939453125, -0.372650146484375, -0.35736083984375, -0.342071533203125, -0.3267822265625, -0.311492919921875, -0.29620361328125, -0.280914306640625, -0.265625, -0.250335693359375, -0.23504638671875, -0.219757080078125, -0.2044677734375, -0.189178466796875, -0.17388916015625, -0.158599853515625, -0.143310546875, -0.128021240234375, -0.11273193359375, -0.097442626953125, -0.0821533203125, -0.066864013671875, -0.05157470703125, -0.036285400390625, -0.02099609375, -0.005706787109375, 0.00958251953125, 0.024871826171875, 0.0401611328125, 0.055450439453125, 0.07073974609375, 0.086029052734375, 0.101318359375, 0.116607666015625, 0.13189697265625, 0.147186279296875, 0.1624755859375, 0.177764892578125, 0.19305419921875, 0.208343505859375, 0.2236328125, 0.238922119140625, 0.25421142578125, 0.269500732421875, 0.2847900390625, 0.300079345703125, 0.31536865234375, 0.330657958984375, 0.345947265625, 0.361236572265625, 0.37652587890625, 0.391815185546875, 0.4071044921875, 0.422393798828125, 0.43768310546875, 0.452972412109375, 0.46826171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 18.0, 17.0, 32.0, 24.0, 36.0, 45.0, 45.0, 40.0, 65.0, 51.0, 43.0, 51.0, 51.0, 50.0, 41.0, 48.0, 38.0, 35.0, 37.0, 26.0, 22.0, 18.0, 20.0, 9.0, 13.0, 8.0, 10.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.591796875, -0.5741729736328125, -0.556549072265625, -0.5389251708984375, -0.52130126953125, -0.5036773681640625, -0.486053466796875, -0.4684295654296875, -0.4508056640625, -0.4331817626953125, -0.415557861328125, -0.3979339599609375, -0.38031005859375, -0.3626861572265625, -0.345062255859375, -0.3274383544921875, -0.309814453125, -0.2921905517578125, -0.274566650390625, -0.2569427490234375, -0.23931884765625, -0.2216949462890625, -0.204071044921875, -0.1864471435546875, -0.1688232421875, -0.1511993408203125, -0.133575439453125, -0.1159515380859375, -0.09832763671875, -0.0807037353515625, -0.063079833984375, -0.0454559326171875, -0.02783203125, -0.0102081298828125, 0.007415771484375, 0.0250396728515625, 0.04266357421875, 0.0602874755859375, 0.077911376953125, 0.0955352783203125, 0.1131591796875, 0.1307830810546875, 0.148406982421875, 0.1660308837890625, 0.18365478515625, 0.2012786865234375, 0.218902587890625, 0.2365264892578125, 0.254150390625, 0.2717742919921875, 0.289398193359375, 0.3070220947265625, 0.32464599609375, 0.3422698974609375, 0.359893798828125, 0.3775177001953125, 0.3951416015625, 0.4127655029296875, 0.430389404296875, 0.4480133056640625, 0.46563720703125, 0.4832611083984375, 0.500885009765625, 0.5185089111328125, 0.5361328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 6.0, 11.0, 7.0, 20.0, 32.0, 43.0, 54.0, 79.0, 141.0, 238.0, 419.0, 834.0, 1719.0, 4111.0, 11908.0, 44429.0, 252635.0, 587011.0, 108910.0, 23366.0, 7146.0, 2745.0, 1243.0, 557.0, 326.0, 200.0, 122.0, 62.0, 44.0, 27.0, 27.0, 16.0, 8.0, 13.0, 6.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16725921630859375, -0.1619110107421875, -0.15656280517578125, -0.151214599609375, -0.14586639404296875, -0.1405181884765625, -0.13516998291015625, -0.12982177734375, -0.12447357177734375, -0.1191253662109375, -0.11377716064453125, -0.108428955078125, -0.10308074951171875, -0.0977325439453125, -0.09238433837890625, -0.0870361328125, -0.08168792724609375, -0.0763397216796875, -0.07099151611328125, -0.065643310546875, -0.06029510498046875, -0.0549468994140625, -0.04959869384765625, -0.04425048828125, -0.03890228271484375, -0.0335540771484375, -0.02820587158203125, -0.022857666015625, -0.01750946044921875, -0.0121612548828125, -0.00681304931640625, -0.00146484375, 0.00388336181640625, 0.0092315673828125, 0.01457977294921875, 0.019927978515625, 0.02527618408203125, 0.0306243896484375, 0.03597259521484375, 0.04132080078125, 0.04666900634765625, 0.0520172119140625, 0.05736541748046875, 0.062713623046875, 0.06806182861328125, 0.0734100341796875, 0.07875823974609375, 0.0841064453125, 0.08945465087890625, 0.0948028564453125, 0.10015106201171875, 0.105499267578125, 0.11084747314453125, 0.1161956787109375, 0.12154388427734375, 0.12689208984375, 0.13224029541015625, 0.1375885009765625, 0.14293670654296875, 0.148284912109375, 0.15363311767578125, 0.1589813232421875, 0.16432952880859375, 0.169677734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 10.0, 6.0, 9.0, 16.0, 26.0, 25.0, 21.0, 37.0, 38.0, 47.0, 58.0, 82.0, 111.0, 104.0, 82.0, 70.0, 51.0, 34.0, 34.0, 30.0, 29.0, 14.0, 5.0, 7.0, 10.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.805492401123047e-05, -5.653873085975647e-05, -5.502253770828247e-05, -5.350634455680847e-05, -5.199015140533447e-05, -5.0473958253860474e-05, -4.8957765102386475e-05, -4.7441571950912476e-05, -4.5925378799438477e-05, -4.440918564796448e-05, -4.289299249649048e-05, -4.137679934501648e-05, -3.986060619354248e-05, -3.834441304206848e-05, -3.682821989059448e-05, -3.5312026739120483e-05, -3.3795833587646484e-05, -3.2279640436172485e-05, -3.0763447284698486e-05, -2.9247254133224487e-05, -2.7731060981750488e-05, -2.621486783027649e-05, -2.469867467880249e-05, -2.318248152732849e-05, -2.1666288375854492e-05, -2.0150095224380493e-05, -1.8633902072906494e-05, -1.7117708921432495e-05, -1.5601515769958496e-05, -1.4085322618484497e-05, -1.2569129467010498e-05, -1.1052936315536499e-05, -9.5367431640625e-06, -8.020550012588501e-06, -6.504356861114502e-06, -4.988163709640503e-06, -3.471970558166504e-06, -1.955777406692505e-06, -4.3958425521850586e-07, 1.0766088962554932e-06, 2.592802047729492e-06, 4.108995199203491e-06, 5.62518835067749e-06, 7.141381502151489e-06, 8.657574653625488e-06, 1.0173767805099487e-05, 1.1689960956573486e-05, 1.3206154108047485e-05, 1.4722347259521484e-05, 1.6238540410995483e-05, 1.7754733562469482e-05, 1.927092671394348e-05, 2.078711986541748e-05, 2.230331301689148e-05, 2.381950616836548e-05, 2.5335699319839478e-05, 2.6851892471313477e-05, 2.8368085622787476e-05, 2.9884278774261475e-05, 3.1400471925735474e-05, 3.291666507720947e-05, 3.443285822868347e-05, 3.594905138015747e-05, 3.746524453163147e-05, 3.898143768310547e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 8.0, 7.0, 18.0, 24.0, 26.0, 40.0, 46.0, 83.0, 104.0, 202.0, 290.0, 493.0, 786.0, 1526.0, 3183.0, 7713.0, 24348.0, 112016.0, 566195.0, 261816.0, 47189.0, 12823.0, 4747.0, 2206.0, 1027.0, 587.0, 372.0, 189.0, 137.0, 94.0, 66.0, 51.0, 37.0, 24.0, 22.0, 17.0, 12.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1770038604736328, -0.17175674438476562, -0.16650962829589844, -0.16126251220703125, -0.15601539611816406, -0.15076828002929688, -0.1455211639404297, -0.1402740478515625, -0.1350269317626953, -0.12977981567382812, -0.12453269958496094, -0.11928558349609375, -0.11403846740722656, -0.10879135131835938, -0.10354423522949219, -0.098297119140625, -0.09305000305175781, -0.08780288696289062, -0.08255577087402344, -0.07730865478515625, -0.07206153869628906, -0.06681442260742188, -0.06156730651855469, -0.0563201904296875, -0.05107307434082031, -0.045825958251953125, -0.04057884216308594, -0.03533172607421875, -0.030084609985351562, -0.024837493896484375, -0.019590377807617188, -0.01434326171875, -0.009096145629882812, -0.003849029541015625, 0.0013980865478515625, 0.00664520263671875, 0.011892318725585938, 0.017139434814453125, 0.022386550903320312, 0.0276336669921875, 0.03288078308105469, 0.038127899169921875, 0.04337501525878906, 0.04862213134765625, 0.05386924743652344, 0.059116363525390625, 0.06436347961425781, 0.069610595703125, 0.07485771179199219, 0.08010482788085938, 0.08535194396972656, 0.09059906005859375, 0.09584617614746094, 0.10109329223632812, 0.10634040832519531, 0.1115875244140625, 0.11683464050292969, 0.12208175659179688, 0.12732887268066406, 0.13257598876953125, 0.13782310485839844, 0.14307022094726562, 0.1483173370361328, 0.153564453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 17.0, 40.0, 35.0, 54.0, 52.0, 70.0, 73.0, 68.0, 76.0, 78.0, 80.0, 51.0, 50.0, 39.0, 30.0, 20.0, 16.0, 18.0, 13.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.14231300354003906, -0.13740921020507812, -0.1325054168701172, -0.12760162353515625, -0.12269783020019531, -0.11779403686523438, -0.11289024353027344, -0.1079864501953125, -0.10308265686035156, -0.09817886352539062, -0.09327507019042969, -0.08837127685546875, -0.08346748352050781, -0.07856369018554688, -0.07365989685058594, -0.068756103515625, -0.06385231018066406, -0.058948516845703125, -0.05404472351074219, -0.04914093017578125, -0.04423713684082031, -0.039333343505859375, -0.03442955017089844, -0.0295257568359375, -0.024621963500976562, -0.019718170166015625, -0.014814376831054688, -0.00991058349609375, -0.0050067901611328125, -0.000102996826171875, 0.0048007965087890625, 0.00970458984375, 0.014608383178710938, 0.019512176513671875, 0.024415969848632812, 0.02931976318359375, 0.03422355651855469, 0.039127349853515625, 0.04403114318847656, 0.0489349365234375, 0.05383872985839844, 0.058742523193359375, 0.06364631652832031, 0.06855010986328125, 0.07345390319824219, 0.07835769653320312, 0.08326148986816406, 0.088165283203125, 0.09306907653808594, 0.09797286987304688, 0.10287666320800781, 0.10778045654296875, 0.11268424987792969, 0.11758804321289062, 0.12249183654785156, 0.1273956298828125, 0.13229942321777344, 0.13720321655273438, 0.1421070098876953, 0.14701080322265625, 0.1519145965576172, 0.15681838989257812, 0.16172218322753906, 0.1666259765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 9.0, 8.0, 26.0, 66.0, 94.0, 134.0, 169.0, 170.0, 119.0, 90.0, 51.0, 23.0, 16.0, 12.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.531129837036133, -4.384349346160889, -4.2375688552856445, -4.0907883644104, -3.9440078735351562, -3.797227382659912, -3.650447130203247, -3.503666639328003, -3.356886148452759, -3.2101056575775146, -3.0633251667022705, -2.9165446758270264, -2.7697644233703613, -2.622983932495117, -2.476203441619873, -2.329422950744629, -2.1826424598693848, -2.0358619689941406, -1.8890814781188965, -1.742301106452942, -1.5955206155776978, -1.4487401247024536, -1.301959753036499, -1.1551792621612549, -1.0083987712860107, -0.8616182804107666, -0.7148378491401672, -0.5680574178695679, -0.42127692699432373, -0.2744964361190796, -0.12771600484848022, 0.01906442642211914, 0.16584539413452148, 0.31262585520744324, 0.459406316280365, 0.6061867475509644, 0.7529672384262085, 0.8997477293014526, 1.0465281009674072, 1.1933085918426514, 1.3400890827178955, 1.4868695735931396, 1.6336500644683838, 1.7804304361343384, 1.9272109270095825, 2.073991298675537, 2.2207717895507812, 2.3675522804260254, 2.5143327713012695, 2.6611132621765137, 2.807893753051758, 2.954674243927002, 3.101454734802246, 3.2482352256774902, 3.3950154781341553, 3.5417959690093994, 3.6885764598846436, 3.8353569507598877, 3.982137441635132, 4.128917694091797, 4.275698184967041, 4.422478675842285, 4.569259166717529, 4.716039657592773, 4.862820148468018]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 10.0, 6.0, 6.0, 13.0, 8.0, 6.0, 16.0, 17.0, 27.0, 20.0, 17.0, 21.0, 33.0, 31.0, 40.0, 37.0, 41.0, 48.0, 33.0, 38.0, 37.0, 40.0, 43.0, 49.0, 39.0, 27.0, 40.0, 29.0, 20.0, 35.0, 17.0, 37.0, 20.0, 20.0, 12.0, 10.0, 12.0, 4.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8938207626342773, -1.8231133222579956, -1.7524058818817139, -1.6816984415054321, -1.6109910011291504, -1.540283441543579, -1.4695760011672974, -1.3988685607910156, -1.3281611204147339, -1.2574536800384521, -1.1867462396621704, -1.1160387992858887, -1.0453312397003174, -0.9746238589286804, -0.9039163589477539, -0.8332089185714722, -0.7625014781951904, -0.6917940378189087, -0.621086597442627, -0.5503790974617004, -0.4796716570854187, -0.40896421670913696, -0.33825674653053284, -0.2675492763519287, -0.19684183597564697, -0.12613438069820404, -0.05542692542076111, 0.015280529856681824, 0.08598798513412476, 0.1566954255104065, 0.22740289568901062, 0.29811036586761475, 0.3688175678253174, 0.4395250082015991, 0.5102324485778809, 0.5809399485588074, 0.6516473889350891, 0.7223548293113708, 0.7930623292922974, 0.8637697696685791, 0.9344772100448608, 1.0051846504211426, 1.0758920907974243, 1.146599531173706, 1.2173070907592773, 1.2880144119262695, 1.3587219715118408, 1.4294294118881226, 1.5001368522644043, 1.570844292640686, 1.6415517330169678, 1.7122591733932495, 1.7829666137695312, 1.8536741733551025, 1.9243816137313843, 1.995089054107666, 2.065796375274658, 2.1365039348602295, 2.2072112560272217, 2.277918815612793, 2.348626136779785, 2.4193336963653564, 2.4900410175323486, 2.56074857711792, 2.631456136703491]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 9.0, 13.0, 16.0, 27.0, 58.0, 60.0, 111.0, 177.0, 268.0, 454.0, 746.0, 1246.0, 2270.0, 4047.0, 8332.0, 18925.0, 54286.0, 308442.0, 3278883.0, 413486.0, 62373.0, 20707.0, 9113.0, 4375.0, 2339.0, 1378.0, 802.0, 495.0, 313.0, 205.0, 132.0, 65.0, 60.0, 25.0, 15.0, 13.0, 5.0, 9.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.27710723876953125, -0.2683258056640625, -0.25954437255859375, -0.250762939453125, -0.24198150634765625, -0.2332000732421875, -0.22441864013671875, -0.21563720703125, -0.20685577392578125, -0.1980743408203125, -0.18929290771484375, -0.180511474609375, -0.17173004150390625, -0.1629486083984375, -0.15416717529296875, -0.1453857421875, -0.13660430908203125, -0.1278228759765625, -0.11904144287109375, -0.110260009765625, -0.10147857666015625, -0.0926971435546875, -0.08391571044921875, -0.07513427734375, -0.06635284423828125, -0.0575714111328125, -0.04878997802734375, -0.040008544921875, -0.03122711181640625, -0.0224456787109375, -0.01366424560546875, -0.0048828125, 0.00389862060546875, 0.0126800537109375, 0.02146148681640625, 0.030242919921875, 0.03902435302734375, 0.0478057861328125, 0.05658721923828125, 0.06536865234375, 0.07415008544921875, 0.0829315185546875, 0.09171295166015625, 0.100494384765625, 0.10927581787109375, 0.1180572509765625, 0.12683868408203125, 0.1356201171875, 0.14440155029296875, 0.1531829833984375, 0.16196441650390625, 0.170745849609375, 0.17952728271484375, 0.1883087158203125, 0.19709014892578125, 0.20587158203125, 0.21465301513671875, 0.2234344482421875, 0.23221588134765625, 0.240997314453125, 0.24977874755859375, 0.2585601806640625, 0.26734161376953125, 0.276123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 15.0, 11.0, 22.0, 20.0, 37.0, 27.0, 40.0, 50.0, 68.0, 54.0, 58.0, 56.0, 67.0, 67.0, 66.0, 54.0, 63.0, 33.0, 35.0, 38.0, 23.0, 17.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1602783203125, -0.1556987762451172, -0.15111923217773438, -0.14653968811035156, -0.14196014404296875, -0.13738059997558594, -0.13280105590820312, -0.1282215118408203, -0.1236419677734375, -0.11906242370605469, -0.11448287963867188, -0.10990333557128906, -0.10532379150390625, -0.10074424743652344, -0.09616470336914062, -0.09158515930175781, -0.087005615234375, -0.08242607116699219, -0.07784652709960938, -0.07326698303222656, -0.06868743896484375, -0.06410789489746094, -0.059528350830078125, -0.05494880676269531, -0.0503692626953125, -0.04578971862792969, -0.041210174560546875, -0.03663063049316406, -0.03205108642578125, -0.027471542358398438, -0.022891998291015625, -0.018312454223632812, -0.01373291015625, -0.009153366088867188, -0.004573822021484375, 5.7220458984375e-06, 0.00458526611328125, 0.009164810180664062, 0.013744354248046875, 0.018323898315429688, 0.0229034423828125, 0.027482986450195312, 0.032062530517578125, 0.03664207458496094, 0.04122161865234375, 0.04580116271972656, 0.050380706787109375, 0.05496025085449219, 0.059539794921875, 0.06411933898925781, 0.06869888305664062, 0.07327842712402344, 0.07785797119140625, 0.08243751525878906, 0.08701705932617188, 0.09159660339355469, 0.0961761474609375, 0.10075569152832031, 0.10533523559570312, 0.10991477966308594, 0.11449432373046875, 0.11907386779785156, 0.12365341186523438, 0.1282329559326172, 0.1328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 10.0, 24.0, 39.0, 46.0, 82.0, 127.0, 192.0, 320.0, 609.0, 1083.0, 2192.0, 5052.0, 12743.0, 39775.0, 213291.0, 3403205.0, 429413.0, 57347.0, 16661.0, 6311.0, 2729.0, 1345.0, 683.0, 390.0, 210.0, 119.0, 65.0, 63.0, 39.0, 23.0, 14.0, 12.0, 7.0, 13.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3444671630859375, -0.332000732421875, -0.3195343017578125, -0.30706787109375, -0.2946014404296875, -0.282135009765625, -0.2696685791015625, -0.2572021484375, -0.2447357177734375, -0.232269287109375, -0.2198028564453125, -0.20733642578125, -0.1948699951171875, -0.182403564453125, -0.1699371337890625, -0.157470703125, -0.1450042724609375, -0.132537841796875, -0.1200714111328125, -0.10760498046875, -0.0951385498046875, -0.082672119140625, -0.0702056884765625, -0.0577392578125, -0.0452728271484375, -0.032806396484375, -0.0203399658203125, -0.00787353515625, 0.0045928955078125, 0.017059326171875, 0.0295257568359375, 0.0419921875, 0.0544586181640625, 0.066925048828125, 0.0793914794921875, 0.09185791015625, 0.1043243408203125, 0.116790771484375, 0.1292572021484375, 0.1417236328125, 0.1541900634765625, 0.166656494140625, 0.1791229248046875, 0.19158935546875, 0.2040557861328125, 0.216522216796875, 0.2289886474609375, 0.241455078125, 0.2539215087890625, 0.266387939453125, 0.2788543701171875, 0.29132080078125, 0.3037872314453125, 0.316253662109375, 0.3287200927734375, 0.3411865234375, 0.3536529541015625, 0.366119384765625, 0.3785858154296875, 0.39105224609375, 0.4035186767578125, 0.415985107421875, 0.4284515380859375, 0.44091796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 3.0, 8.0, 6.0, 9.0, 10.0, 16.0, 14.0, 21.0, 36.0, 35.0, 55.0, 90.0, 140.0, 269.0, 540.0, 1058.0, 754.0, 384.0, 190.0, 125.0, 75.0, 60.0, 38.0, 28.0, 23.0, 17.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3099479675292969, -0.29836273193359375, -0.2867774963378906, -0.2751922607421875, -0.2636070251464844, -0.25202178955078125, -0.24043655395507812, -0.228851318359375, -0.21726608276367188, -0.20568084716796875, -0.19409561157226562, -0.1825103759765625, -0.17092514038085938, -0.15933990478515625, -0.14775466918945312, -0.13616943359375, -0.12458419799804688, -0.11299896240234375, -0.10141372680664062, -0.0898284912109375, -0.07824325561523438, -0.06665802001953125, -0.055072784423828125, -0.043487548828125, -0.031902313232421875, -0.02031707763671875, -0.008731842041015625, 0.0028533935546875, 0.014438629150390625, 0.02602386474609375, 0.037609100341796875, 0.0491943359375, 0.060779571533203125, 0.07236480712890625, 0.08395004272460938, 0.0955352783203125, 0.10712051391601562, 0.11870574951171875, 0.13029098510742188, 0.141876220703125, 0.15346145629882812, 0.16504669189453125, 0.17663192749023438, 0.1882171630859375, 0.19980239868164062, 0.21138763427734375, 0.22297286987304688, 0.23455810546875, 0.24614334106445312, 0.25772857666015625, 0.2693138122558594, 0.2808990478515625, 0.2924842834472656, 0.30406951904296875, 0.3156547546386719, 0.327239990234375, 0.3388252258300781, 0.35041046142578125, 0.3619956970214844, 0.3735809326171875, 0.3851661682128906, 0.39675140380859375, 0.4083366394042969, 0.419921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 2.0, 11.0, 12.0, 36.0, 93.0, 167.0, 228.0, 204.0, 137.0, 54.0, 21.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.369821548461914, -6.2051591873168945, -6.040497303009033, -5.875834941864014, -5.711172580718994, -5.546510696411133, -5.381848335266113, -5.217185974121094, -5.052523612976074, -4.887861251831055, -4.723199367523193, -4.558537006378174, -4.393874645233154, -4.229212760925293, -4.064550399780273, -3.899888038635254, -3.7352261543273926, -3.570564031600952, -3.4059016704559326, -3.241239547729492, -3.0765771865844727, -2.9119150638580322, -2.747252941131592, -2.5825905799865723, -2.417928457260132, -2.2532663345336914, -2.088603973388672, -1.9239418506622314, -1.7592796087265015, -1.5946173667907715, -1.429955244064331, -1.265293002128601, -1.100630760192871, -0.9359685182571411, -0.7713063359260559, -0.6066441535949707, -0.4419819116592407, -0.27731966972351074, -0.11265748739242554, 0.05200469493865967, 0.21666693687438965, 0.38132914900779724, 0.5459913611412048, 0.71065354347229, 0.87531578540802, 1.03997802734375, 1.2046401500701904, 1.3693023920059204, 1.5339646339416504, 1.6986268758773804, 1.8632891178131104, 2.027951240539551, 2.1926136016845703, 2.3572757244110107, 2.521937847137451, 2.6866002082824707, 2.851262331008911, 3.0159244537353516, 3.180586814880371, 3.3452489376068115, 3.509911060333252, 3.6745734214782715, 3.839235544204712, 4.003897666931152, 4.168560028076172]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 9.0, 7.0, 12.0, 14.0, 16.0, 21.0, 31.0, 29.0, 31.0, 30.0, 59.0, 43.0, 55.0, 66.0, 65.0, 68.0, 53.0, 45.0, 60.0, 63.0, 37.0, 32.0, 32.0, 32.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9480023384094238, -1.8851134777069092, -1.822224497795105, -1.7593356370925903, -1.6964466571807861, -1.6335577964782715, -1.5706689357757568, -1.5077800750732422, -1.444891095161438, -1.3820022344589233, -1.3191132545471191, -1.2562243938446045, -1.1933355331420898, -1.1304465532302856, -1.067557692527771, -1.0046687126159668, -0.9417798519134521, -0.8788909316062927, -0.8160020112991333, -0.7531131505966187, -0.6902242302894592, -0.6273353099822998, -0.5644464492797852, -0.5015575289726257, -0.4386686086654663, -0.3757796883583069, -0.31289079785346985, -0.2500019073486328, -0.1871129870414734, -0.12422406673431396, -0.06133517622947693, 0.0015537142753601074, 0.06444239616394043, 0.12733130156993866, 0.1902202069759369, 0.2531090974807739, 0.31599801778793335, 0.3788869380950928, 0.4417758285999298, 0.5046647191047668, 0.5675536394119263, 0.6304425597190857, 0.6933314800262451, 0.7562203407287598, 0.8191092610359192, 0.8819981813430786, 0.9448870420455933, 1.0077760219573975, 1.070664882659912, 1.1335537433624268, 1.196442723274231, 1.2593315839767456, 1.3222205638885498, 1.3851094245910645, 1.447998285293579, 1.5108871459960938, 1.573776125907898, 1.6366649866104126, 1.6995539665222168, 1.7624428272247314, 1.825331687927246, 1.8882206678390503, 1.951109528541565, 2.013998508453369, 2.076887369155884]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 13.0, 15.0, 20.0, 28.0, 34.0, 67.0, 89.0, 120.0, 174.0, 222.0, 377.0, 589.0, 883.0, 1521.0, 2230.0, 4061.0, 7310.0, 13714.0, 27852.0, 61135.0, 158589.0, 369731.0, 235416.0, 87143.0, 37386.0, 17786.0, 9177.0, 5140.0, 2820.0, 1737.0, 1030.0, 712.0, 432.0, 284.0, 214.0, 125.0, 101.0, 82.0, 54.0, 32.0, 34.0, 20.0, 14.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22624588012695312, -0.21836090087890625, -0.21047592163085938, -0.2025909423828125, -0.19470596313476562, -0.18682098388671875, -0.17893600463867188, -0.171051025390625, -0.16316604614257812, -0.15528106689453125, -0.14739608764648438, -0.1395111083984375, -0.13162612915039062, -0.12374114990234375, -0.11585617065429688, -0.10797119140625, -0.10008621215820312, -0.09220123291015625, -0.08431625366210938, -0.0764312744140625, -0.06854629516601562, -0.06066131591796875, -0.052776336669921875, -0.044891357421875, -0.037006378173828125, -0.02912139892578125, -0.021236419677734375, -0.0133514404296875, -0.005466461181640625, 0.00241851806640625, 0.010303497314453125, 0.0181884765625, 0.026073455810546875, 0.03395843505859375, 0.041843414306640625, 0.0497283935546875, 0.057613372802734375, 0.06549835205078125, 0.07338333129882812, 0.081268310546875, 0.08915328979492188, 0.09703826904296875, 0.10492324829101562, 0.1128082275390625, 0.12069320678710938, 0.12857818603515625, 0.13646316528320312, 0.14434814453125, 0.15223312377929688, 0.16011810302734375, 0.16800308227539062, 0.1758880615234375, 0.18377304077148438, 0.19165802001953125, 0.19954299926757812, 0.207427978515625, 0.21531295776367188, 0.22319793701171875, 0.23108291625976562, 0.2389678955078125, 0.24685287475585938, 0.25473785400390625, 0.2626228332519531, 0.2705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 15.0, 10.0, 15.0, 20.0, 26.0, 34.0, 44.0, 40.0, 40.0, 35.0, 42.0, 40.0, 53.0, 48.0, 50.0, 60.0, 59.0, 42.0, 47.0, 36.0, 38.0, 44.0, 19.0, 23.0, 20.0, 11.0, 15.0, 8.0, 4.0, 5.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.118408203125, -0.11462688446044922, -0.11084556579589844, -0.10706424713134766, -0.10328292846679688, -0.0995016098022461, -0.09572029113769531, -0.09193897247314453, -0.08815765380859375, -0.08437633514404297, -0.08059501647949219, -0.0768136978149414, -0.07303237915039062, -0.06925106048583984, -0.06546974182128906, -0.06168842315673828, -0.0579071044921875, -0.05412578582763672, -0.05034446716308594, -0.046563148498535156, -0.042781829833984375, -0.039000511169433594, -0.03521919250488281, -0.03143787384033203, -0.02765655517578125, -0.02387523651123047, -0.020093917846679688, -0.016312599182128906, -0.012531280517578125, -0.008749961853027344, -0.0049686431884765625, -0.0011873245239257812, 0.002593994140625, 0.006375312805175781, 0.010156631469726562, 0.013937950134277344, 0.017719268798828125, 0.021500587463378906, 0.025281906127929688, 0.02906322479248047, 0.03284454345703125, 0.03662586212158203, 0.04040718078613281, 0.044188499450683594, 0.047969818115234375, 0.051751136779785156, 0.05553245544433594, 0.05931377410888672, 0.0630950927734375, 0.06687641143798828, 0.07065773010253906, 0.07443904876708984, 0.07822036743164062, 0.0820016860961914, 0.08578300476074219, 0.08956432342529297, 0.09334564208984375, 0.09712696075439453, 0.10090827941894531, 0.1046895980834961, 0.10847091674804688, 0.11225223541259766, 0.11603355407714844, 0.11981487274169922, 0.12359619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 7.0, 20.0, 26.0, 25.0, 40.0, 50.0, 68.0, 115.0, 176.0, 296.0, 440.0, 781.0, 1585.0, 3636.0, 9932.0, 41545.0, 408950.0, 517094.0, 45615.0, 10598.0, 3777.0, 1592.0, 867.0, 470.0, 262.0, 191.0, 110.0, 70.0, 61.0, 37.0, 23.0, 18.0, 12.0, 19.0, 6.0, 2.0, 4.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48876953125, -0.47193145751953125, -0.4550933837890625, -0.43825531005859375, -0.421417236328125, -0.40457916259765625, -0.3877410888671875, -0.37090301513671875, -0.35406494140625, -0.33722686767578125, -0.3203887939453125, -0.30355072021484375, -0.286712646484375, -0.26987457275390625, -0.2530364990234375, -0.23619842529296875, -0.2193603515625, -0.20252227783203125, -0.1856842041015625, -0.16884613037109375, -0.152008056640625, -0.13516998291015625, -0.1183319091796875, -0.10149383544921875, -0.08465576171875, -0.06781768798828125, -0.0509796142578125, -0.03414154052734375, -0.017303466796875, -0.00046539306640625, 0.0163726806640625, 0.03321075439453125, 0.050048828125, 0.06688690185546875, 0.0837249755859375, 0.10056304931640625, 0.117401123046875, 0.13423919677734375, 0.1510772705078125, 0.16791534423828125, 0.18475341796875, 0.20159149169921875, 0.2184295654296875, 0.23526763916015625, 0.252105712890625, 0.26894378662109375, 0.2857818603515625, 0.30261993408203125, 0.3194580078125, 0.33629608154296875, 0.3531341552734375, 0.36997222900390625, 0.386810302734375, 0.40364837646484375, 0.4204864501953125, 0.43732452392578125, 0.45416259765625, 0.47100067138671875, 0.4878387451171875, 0.5046768188476562, 0.521514892578125, 0.5383529663085938, 0.5551910400390625, 0.5720291137695312, 0.5888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 10.0, 3.0, 7.0, 9.0, 13.0, 11.0, 20.0, 26.0, 33.0, 38.0, 41.0, 39.0, 55.0, 50.0, 57.0, 63.0, 58.0, 59.0, 54.0, 59.0, 53.0, 37.0, 41.0, 33.0, 28.0, 30.0, 23.0, 14.0, 8.0, 11.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6480941772460938, -0.6282196044921875, -0.6083450317382812, -0.588470458984375, -0.5685958862304688, -0.5487213134765625, -0.5288467407226562, -0.50897216796875, -0.48909759521484375, -0.4692230224609375, -0.44934844970703125, -0.429473876953125, -0.40959930419921875, -0.3897247314453125, -0.36985015869140625, -0.3499755859375, -0.33010101318359375, -0.3102264404296875, -0.29035186767578125, -0.270477294921875, -0.25060272216796875, -0.2307281494140625, -0.21085357666015625, -0.19097900390625, -0.17110443115234375, -0.1512298583984375, -0.13135528564453125, -0.111480712890625, -0.09160614013671875, -0.0717315673828125, -0.05185699462890625, -0.031982421875, -0.01210784912109375, 0.0077667236328125, 0.02764129638671875, 0.047515869140625, 0.06739044189453125, 0.0872650146484375, 0.10713958740234375, 0.12701416015625, 0.14688873291015625, 0.1667633056640625, 0.18663787841796875, 0.206512451171875, 0.22638702392578125, 0.2462615966796875, 0.26613616943359375, 0.2860107421875, 0.30588531494140625, 0.3257598876953125, 0.34563446044921875, 0.365509033203125, 0.38538360595703125, 0.4052581787109375, 0.42513275146484375, 0.44500732421875, 0.46488189697265625, 0.4847564697265625, 0.5046310424804688, 0.524505615234375, 0.5443801879882812, 0.5642547607421875, 0.5841293334960938, 0.60400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 12.0, 14.0, 16.0, 18.0, 34.0, 45.0, 57.0, 116.0, 205.0, 316.0, 643.0, 1180.0, 2778.0, 7044.0, 22480.0, 113065.0, 716136.0, 144543.0, 25970.0, 7936.0, 3055.0, 1351.0, 650.0, 358.0, 195.0, 121.0, 65.0, 41.0, 33.0, 20.0, 20.0, 6.0, 10.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.2412242889404297, -0.23403549194335938, -0.22684669494628906, -0.21965789794921875, -0.21246910095214844, -0.20528030395507812, -0.1980915069580078, -0.1909027099609375, -0.1837139129638672, -0.17652511596679688, -0.16933631896972656, -0.16214752197265625, -0.15495872497558594, -0.14776992797851562, -0.1405811309814453, -0.133392333984375, -0.1262035369873047, -0.11901473999023438, -0.11182594299316406, -0.10463714599609375, -0.09744834899902344, -0.09025955200195312, -0.08307075500488281, -0.0758819580078125, -0.06869316101074219, -0.061504364013671875, -0.05431556701660156, -0.04712677001953125, -0.03993797302246094, -0.032749176025390625, -0.025560379028320312, -0.01837158203125, -0.011182785034179688, -0.003993988037109375, 0.0031948089599609375, 0.01038360595703125, 0.017572402954101562, 0.024761199951171875, 0.03194999694824219, 0.0391387939453125, 0.04632759094238281, 0.053516387939453125, 0.06070518493652344, 0.06789398193359375, 0.07508277893066406, 0.08227157592773438, 0.08946037292480469, 0.096649169921875, 0.10383796691894531, 0.11102676391601562, 0.11821556091308594, 0.12540435791015625, 0.13259315490722656, 0.13978195190429688, 0.1469707489013672, 0.1541595458984375, 0.1613483428955078, 0.16853713989257812, 0.17572593688964844, 0.18291473388671875, 0.19010353088378906, 0.19729232788085938, 0.2044811248779297, 0.211669921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 9.0, 11.0, 13.0, 15.0, 23.0, 32.0, 33.0, 57.0, 114.0, 149.0, 131.0, 125.0, 72.0, 59.0, 37.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.957220077514648e-05, -7.724948227405548e-05, -7.492676377296448e-05, -7.260404527187347e-05, -7.028132677078247e-05, -6.795860826969147e-05, -6.563588976860046e-05, -6.331317126750946e-05, -6.099045276641846e-05, -5.8667734265327454e-05, -5.634501576423645e-05, -5.402229726314545e-05, -5.169957876205444e-05, -4.937686026096344e-05, -4.7054141759872437e-05, -4.473142325878143e-05, -4.240870475769043e-05, -4.0085986256599426e-05, -3.776326775550842e-05, -3.544054925441742e-05, -3.3117830753326416e-05, -3.079511225223541e-05, -2.847239375114441e-05, -2.6149675250053406e-05, -2.3826956748962402e-05, -2.15042382478714e-05, -1.9181519746780396e-05, -1.6858801245689392e-05, -1.4536082744598389e-05, -1.2213364243507385e-05, -9.890645742416382e-06, -7.567927241325378e-06, -5.245208740234375e-06, -2.9224902391433716e-06, -5.997717380523682e-07, 1.7229467630386353e-06, 4.045665264129639e-06, 6.368383765220642e-06, 8.691102266311646e-06, 1.1013820767402649e-05, 1.3336539268493652e-05, 1.5659257769584656e-05, 1.798197627067566e-05, 2.0304694771766663e-05, 2.2627413272857666e-05, 2.495013177394867e-05, 2.7272850275039673e-05, 2.9595568776130676e-05, 3.191828727722168e-05, 3.424100577831268e-05, 3.6563724279403687e-05, 3.888644278049469e-05, 4.120916128158569e-05, 4.35318797826767e-05, 4.58545982837677e-05, 4.8177316784858704e-05, 5.050003528594971e-05, 5.282275378704071e-05, 5.5145472288131714e-05, 5.746819078922272e-05, 5.979090929031372e-05, 6.211362779140472e-05, 6.443634629249573e-05, 6.675906479358673e-05, 6.908178329467773e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 16.0, 19.0, 31.0, 46.0, 66.0, 118.0, 181.0, 333.0, 621.0, 1247.0, 3229.0, 10143.0, 51304.0, 628873.0, 309141.0, 31158.0, 7334.0, 2414.0, 1030.0, 494.0, 236.0, 160.0, 106.0, 60.0, 42.0, 32.0, 20.0, 19.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2553977966308594, -0.24712371826171875, -0.23884963989257812, -0.2305755615234375, -0.22230148315429688, -0.21402740478515625, -0.20575332641601562, -0.197479248046875, -0.18920516967773438, -0.18093109130859375, -0.17265701293945312, -0.1643829345703125, -0.15610885620117188, -0.14783477783203125, -0.13956069946289062, -0.13128662109375, -0.12301254272460938, -0.11473846435546875, -0.10646438598632812, -0.0981903076171875, -0.08991622924804688, -0.08164215087890625, -0.07336807250976562, -0.065093994140625, -0.056819915771484375, -0.04854583740234375, -0.040271759033203125, -0.0319976806640625, -0.023723602294921875, -0.01544952392578125, -0.007175445556640625, 0.0010986328125, 0.009372711181640625, 0.01764678955078125, 0.025920867919921875, 0.0341949462890625, 0.042469024658203125, 0.05074310302734375, 0.059017181396484375, 0.067291259765625, 0.07556533813476562, 0.08383941650390625, 0.09211349487304688, 0.1003875732421875, 0.10866165161132812, 0.11693572998046875, 0.12520980834960938, 0.13348388671875, 0.14175796508789062, 0.15003204345703125, 0.15830612182617188, 0.1665802001953125, 0.17485427856445312, 0.18312835693359375, 0.19140243530273438, 0.199676513671875, 0.20795059204101562, 0.21622467041015625, 0.22449874877929688, 0.2327728271484375, 0.24104690551757812, 0.24932098388671875, 0.2575950622558594, 0.265869140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 2.0, 8.0, 11.0, 24.0, 27.0, 25.0, 51.0, 40.0, 69.0, 91.0, 85.0, 111.0, 92.0, 72.0, 66.0, 49.0, 34.0, 33.0, 15.0, 18.0, 9.0, 6.0, 10.0, 3.0, 9.0, 8.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2310791015625, -0.22455596923828125, -0.2180328369140625, -0.21150970458984375, -0.204986572265625, -0.19846343994140625, -0.1919403076171875, -0.18541717529296875, -0.17889404296875, -0.17237091064453125, -0.1658477783203125, -0.15932464599609375, -0.152801513671875, -0.14627838134765625, -0.1397552490234375, -0.13323211669921875, -0.126708984375, -0.12018585205078125, -0.1136627197265625, -0.10713958740234375, -0.100616455078125, -0.09409332275390625, -0.0875701904296875, -0.08104705810546875, -0.07452392578125, -0.06800079345703125, -0.0614776611328125, -0.05495452880859375, -0.048431396484375, -0.04190826416015625, -0.0353851318359375, -0.02886199951171875, -0.0223388671875, -0.01581573486328125, -0.0092926025390625, -0.00276947021484375, 0.003753662109375, 0.01027679443359375, 0.0167999267578125, 0.02332305908203125, 0.02984619140625, 0.03636932373046875, 0.0428924560546875, 0.04941558837890625, 0.055938720703125, 0.06246185302734375, 0.0689849853515625, 0.07550811767578125, 0.08203125, 0.08855438232421875, 0.0950775146484375, 0.10160064697265625, 0.108123779296875, 0.11464691162109375, 0.1211700439453125, 0.12769317626953125, 0.13421630859375, 0.14073944091796875, 0.1472625732421875, 0.15378570556640625, 0.160308837890625, 0.16683197021484375, 0.1733551025390625, 0.17987823486328125, 0.1864013671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 6.0, 11.0, 17.0, 42.0, 75.0, 130.0, 217.0, 185.0, 119.0, 94.0, 41.0, 21.0, 17.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6024069786071777, -2.4645769596099854, -2.326746940612793, -2.1889171600341797, -2.0510871410369873, -1.913257122039795, -1.775427222251892, -1.6375973224639893, -1.4997673034667969, -1.3619372844696045, -1.2241073846817017, -1.0862774848937988, -0.9484474658966064, -0.8106175065040588, -0.6727875471115112, -0.5349575877189636, -0.397127628326416, -0.2592976689338684, -0.1214677095413208, 0.016362249851226807, 0.15419220924377441, 0.292022168636322, 0.42985212802886963, 0.5676820874214172, 0.7055120468139648, 0.8433420062065125, 0.9811719655990601, 1.119001865386963, 1.2568318843841553, 1.3946619033813477, 1.5324918031692505, 1.6703217029571533, 1.808152198791504, 1.9459822177886963, 2.0838122367858887, 2.221642017364502, 2.3594720363616943, 2.4973020553588867, 2.6351318359375, 2.7729618549346924, 2.9107918739318848, 3.048621892929077, 3.1864519119262695, 3.324281692504883, 3.462111711502075, 3.5999417304992676, 3.737771511077881, 3.8756015300750732, 4.013431549072266, 4.151261329650879, 4.28909158706665, 4.426921367645264, 4.564751625061035, 4.702581405639648, 4.840411186218262, 4.978241443634033, 5.1160712242126465, 5.25390100479126, 5.391731262207031, 5.5295610427856445, 5.667390823364258, 5.805221080780029, 5.943050861358643, 6.080881118774414, 6.218710899353027]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 16.0, 14.0, 30.0, 27.0, 27.0, 35.0, 38.0, 44.0, 44.0, 54.0, 54.0, 78.0, 61.0, 64.0, 48.0, 47.0, 41.0, 35.0, 39.0, 28.0, 24.0, 18.0, 20.0, 17.0, 16.0, 12.0, 16.0, 7.0, 5.0, 0.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.039203643798828, -2.964172840118408, -2.8891422748565674, -2.8141114711761475, -2.7390806674957275, -2.6640501022338867, -2.589019298553467, -2.513988494873047, -2.438957691192627, -2.363926887512207, -2.288896322250366, -2.2138655185699463, -2.1388347148895264, -2.0638041496276855, -1.9887733459472656, -1.9137425422668457, -1.8387119770050049, -1.7636812925338745, -1.6886504888534546, -1.6136198043823242, -1.5385890007019043, -1.463558316230774, -1.3885276317596436, -1.3134968280792236, -1.2384661436080933, -1.163435459136963, -1.088404655456543, -1.0133739709854126, -0.9383432269096375, -0.8633124828338623, -0.7882817983627319, -0.7132510542869568, -0.6382205486297607, -0.5631898045539856, -0.48815909028053284, -0.4131283760070801, -0.33809763193130493, -0.2630668878555298, -0.18803617358207703, -0.11300545930862427, -0.03797471523284912, 0.03705601394176483, 0.11208674311637878, 0.18711747229099274, 0.2621482014656067, 0.33717894554138184, 0.4122096598148346, 0.48724037408828735, 0.5622711181640625, 0.6373018622398376, 0.7123326063156128, 0.7873632907867432, 0.8623940348625183, 0.9374247789382935, 1.0124554634094238, 1.0874862670898438, 1.1625169515609741, 1.2375476360321045, 1.3125784397125244, 1.3876091241836548, 1.4626398086547852, 1.537670612335205, 1.6127012968063354, 1.6877319812774658, 1.7627627849578857]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 12.0, 17.0, 24.0, 31.0, 69.0, 100.0, 186.0, 509.0, 1667.0, 8631.0, 130687.0, 4003160.0, 42550.0, 4765.0, 1106.0, 329.0, 143.0, 76.0, 46.0, 32.0, 34.0, 12.0, 14.0, 5.0, 10.0, 12.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.0673828125, -1.040252685546875, -1.01312255859375, -0.985992431640625, -0.9588623046875, -0.931732177734375, -0.90460205078125, -0.877471923828125, -0.850341796875, -0.823211669921875, -0.79608154296875, -0.768951416015625, -0.7418212890625, -0.714691162109375, -0.68756103515625, -0.660430908203125, -0.63330078125, -0.606170654296875, -0.57904052734375, -0.551910400390625, -0.5247802734375, -0.497650146484375, -0.47052001953125, -0.443389892578125, -0.416259765625, -0.389129638671875, -0.36199951171875, -0.334869384765625, -0.3077392578125, -0.280609130859375, -0.25347900390625, -0.226348876953125, -0.19921875, -0.172088623046875, -0.14495849609375, -0.117828369140625, -0.0906982421875, -0.063568115234375, -0.03643798828125, -0.009307861328125, 0.017822265625, 0.044952392578125, 0.07208251953125, 0.099212646484375, 0.1263427734375, 0.153472900390625, 0.18060302734375, 0.207733154296875, 0.23486328125, 0.261993408203125, 0.28912353515625, 0.316253662109375, 0.3433837890625, 0.370513916015625, 0.39764404296875, 0.424774169921875, 0.451904296875, 0.479034423828125, 0.50616455078125, 0.533294677734375, 0.5604248046875, 0.587554931640625, 0.61468505859375, 0.641815185546875, 0.6689453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 6.0, 9.0, 18.0, 21.0, 28.0, 50.0, 45.0, 52.0, 68.0, 67.0, 78.0, 68.0, 76.0, 64.0, 83.0, 53.0, 49.0, 42.0, 39.0, 28.0, 11.0, 13.0, 11.0, 12.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2256460189819336, -0.2200908660888672, -0.21453571319580078, -0.20898056030273438, -0.20342540740966797, -0.19787025451660156, -0.19231510162353516, -0.18675994873046875, -0.18120479583740234, -0.17564964294433594, -0.17009449005126953, -0.16453933715820312, -0.15898418426513672, -0.1534290313720703, -0.1478738784790039, -0.1423187255859375, -0.1367635726928711, -0.1312084197998047, -0.12565326690673828, -0.12009811401367188, -0.11454296112060547, -0.10898780822753906, -0.10343265533447266, -0.09787750244140625, -0.09232234954833984, -0.08676719665527344, -0.08121204376220703, -0.07565689086914062, -0.07010173797607422, -0.06454658508300781, -0.058991432189941406, -0.053436279296875, -0.047881126403808594, -0.04232597351074219, -0.03677082061767578, -0.031215667724609375, -0.02566051483154297, -0.020105361938476562, -0.014550209045410156, -0.00899505615234375, -0.0034399032592773438, 0.0021152496337890625, 0.007670402526855469, 0.013225555419921875, 0.01878070831298828, 0.024335861206054688, 0.029891014099121094, 0.0354461669921875, 0.041001319885253906, 0.04655647277832031, 0.05211162567138672, 0.057666778564453125, 0.06322193145751953, 0.06877708435058594, 0.07433223724365234, 0.07988739013671875, 0.08544254302978516, 0.09099769592285156, 0.09655284881591797, 0.10210800170898438, 0.10766315460205078, 0.11321830749511719, 0.1187734603881836, 0.12432861328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 12.0, 9.0, 19.0, 37.0, 61.0, 112.0, 219.0, 399.0, 955.0, 2148.0, 5832.0, 17944.0, 71740.0, 786245.0, 3109867.0, 152278.0, 30674.0, 9494.0, 3439.0, 1447.0, 635.0, 305.0, 161.0, 90.0, 55.0, 32.0, 15.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.3169097900390625, -0.303253173828125, -0.2895965576171875, -0.27593994140625, -0.2622833251953125, -0.248626708984375, -0.2349700927734375, -0.2213134765625, -0.2076568603515625, -0.194000244140625, -0.1803436279296875, -0.16668701171875, -0.1530303955078125, -0.139373779296875, -0.1257171630859375, -0.112060546875, -0.0984039306640625, -0.084747314453125, -0.0710906982421875, -0.05743408203125, -0.0437774658203125, -0.030120849609375, -0.0164642333984375, -0.0028076171875, 0.0108489990234375, 0.024505615234375, 0.0381622314453125, 0.05181884765625, 0.0654754638671875, 0.079132080078125, 0.0927886962890625, 0.1064453125, 0.1201019287109375, 0.133758544921875, 0.1474151611328125, 0.16107177734375, 0.1747283935546875, 0.188385009765625, 0.2020416259765625, 0.2156982421875, 0.2293548583984375, 0.243011474609375, 0.2566680908203125, 0.27032470703125, 0.2839813232421875, 0.297637939453125, 0.3112945556640625, 0.324951171875, 0.3386077880859375, 0.352264404296875, 0.3659210205078125, 0.37957763671875, 0.3932342529296875, 0.406890869140625, 0.4205474853515625, 0.4342041015625, 0.4478607177734375, 0.461517333984375, 0.4751739501953125, 0.48883056640625, 0.5024871826171875, 0.516143798828125, 0.5298004150390625, 0.54345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 8.0, 21.0, 14.0, 25.0, 29.0, 53.0, 89.0, 124.0, 183.0, 381.0, 734.0, 1073.0, 515.0, 289.0, 155.0, 93.0, 74.0, 51.0, 33.0, 20.0, 18.0, 11.0, 16.0, 9.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2823333740234375, -0.270233154296875, -0.2581329345703125, -0.24603271484375, -0.2339324951171875, -0.221832275390625, -0.2097320556640625, -0.1976318359375, -0.1855316162109375, -0.173431396484375, -0.1613311767578125, -0.14923095703125, -0.1371307373046875, -0.125030517578125, -0.1129302978515625, -0.100830078125, -0.0887298583984375, -0.076629638671875, -0.0645294189453125, -0.05242919921875, -0.0403289794921875, -0.028228759765625, -0.0161285400390625, -0.0040283203125, 0.0080718994140625, 0.020172119140625, 0.0322723388671875, 0.04437255859375, 0.0564727783203125, 0.068572998046875, 0.0806732177734375, 0.0927734375, 0.1048736572265625, 0.116973876953125, 0.1290740966796875, 0.14117431640625, 0.1532745361328125, 0.165374755859375, 0.1774749755859375, 0.1895751953125, 0.2016754150390625, 0.213775634765625, 0.2258758544921875, 0.23797607421875, 0.2500762939453125, 0.262176513671875, 0.2742767333984375, 0.286376953125, 0.2984771728515625, 0.310577392578125, 0.3226776123046875, 0.33477783203125, 0.3468780517578125, 0.358978271484375, 0.3710784912109375, 0.3831787109375, 0.3952789306640625, 0.407379150390625, 0.4194793701171875, 0.43157958984375, 0.4436798095703125, 0.455780029296875, 0.4678802490234375, 0.47998046875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 21.0, 31.0, 39.0, 70.0, 97.0, 133.0, 117.0, 124.0, 98.0, 73.0, 60.0, 38.0, 23.0, 5.0, 9.0, 5.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.598886013031006, -2.520750045776367, -2.4426143169403076, -2.364478349685669, -2.2863426208496094, -2.2082066535949707, -2.130070924758911, -2.0519349575042725, -1.973799228668213, -1.8956633806228638, -1.8175275325775146, -1.7393916845321655, -1.6612558364868164, -1.5831199884414673, -1.5049841403961182, -1.4268481731414795, -1.3487123250961304, -1.2705764770507812, -1.1924406290054321, -1.114304780960083, -1.0361689329147339, -0.9580330848693848, -0.8798971772193909, -0.8017613291740417, -0.7236254811286926, -0.6454896330833435, -0.5673537850379944, -0.4892179071903229, -0.41108205914497375, -0.33294621109962463, -0.2548103332519531, -0.176674485206604, -0.09853863716125488, -0.020402781665325165, 0.05773307383060455, 0.13586893677711487, 0.214004784822464, 0.2921406328678131, 0.3702765107154846, 0.44841235876083374, 0.5265482068061829, 0.604684054851532, 0.6828199028968811, 0.760955810546875, 0.8390916585922241, 0.9172275066375732, 0.9953633546829224, 1.0734992027282715, 1.1516350507736206, 1.2297708988189697, 1.3079067468643188, 1.386042594909668, 1.464178442955017, 1.5423142910003662, 1.6204502582550049, 1.6985859870910645, 1.7767219543457031, 1.8548578023910522, 1.9329936504364014, 2.01112961769104, 2.0892653465270996, 2.1674013137817383, 2.245537042617798, 2.3236730098724365, 2.401808738708496]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 7.0, 13.0, 13.0, 10.0, 20.0, 28.0, 15.0, 18.0, 25.0, 35.0, 45.0, 42.0, 50.0, 48.0, 44.0, 49.0, 40.0, 51.0, 51.0, 49.0, 31.0, 26.0, 37.0, 38.0, 34.0, 25.0, 17.0, 21.0, 19.0, 14.0, 17.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.406076192855835, -1.3600701093673706, -1.3140639066696167, -1.2680578231811523, -1.222051739692688, -1.176045536994934, -1.1300394535064697, -1.0840332508087158, -1.0380271673202515, -0.9920210242271423, -0.946014940738678, -0.9000087976455688, -0.8540026545524597, -0.8079965114593506, -0.7619904279708862, -0.7159842848777771, -0.6699782013893127, -0.6239720582962036, -0.5779659748077393, -0.5319598317146301, -0.485953688621521, -0.43994757533073425, -0.3939414620399475, -0.3479353189468384, -0.30192920565605164, -0.2559230923652649, -0.20991694927215576, -0.16391083598136902, -0.11790470778942108, -0.07189857959747314, -0.0258924663066864, 0.02011367678642273, 0.06611979007720947, 0.11212591826915741, 0.15813204646110535, 0.2041381597518921, 0.2501443028450012, 0.29615041613578796, 0.3421565294265747, 0.38816267251968384, 0.4341687858104706, 0.4801748991012573, 0.5261810421943665, 0.5721871852874756, 0.6181932687759399, 0.6641994118690491, 0.7102055549621582, 0.7562116384506226, 0.8022177815437317, 0.8482239246368408, 0.8942300081253052, 0.9402361512184143, 0.9862422943115234, 1.0322483777999878, 1.0782544612884521, 1.124260663986206, 1.1702667474746704, 1.2162728309631348, 1.2622790336608887, 1.308285117149353, 1.3542912006378174, 1.4002974033355713, 1.4463034868240356, 1.4923095703125, 1.538315773010254]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 14.0, 24.0, 32.0, 29.0, 60.0, 85.0, 98.0, 151.0, 213.0, 335.0, 455.0, 757.0, 1058.0, 1775.0, 2787.0, 4700.0, 8160.0, 14775.0, 29853.0, 68487.0, 190056.0, 403697.0, 187652.0, 67843.0, 29967.0, 14956.0, 8102.0, 4692.0, 2755.0, 1687.0, 1082.0, 738.0, 447.0, 309.0, 205.0, 169.0, 97.0, 60.0, 56.0, 36.0, 25.0, 23.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.2395801544189453, -0.23172378540039062, -0.22386741638183594, -0.21601104736328125, -0.20815467834472656, -0.20029830932617188, -0.1924419403076172, -0.1845855712890625, -0.1767292022705078, -0.16887283325195312, -0.16101646423339844, -0.15316009521484375, -0.14530372619628906, -0.13744735717773438, -0.1295909881591797, -0.121734619140625, -0.11387825012207031, -0.10602188110351562, -0.09816551208496094, -0.09030914306640625, -0.08245277404785156, -0.07459640502929688, -0.06674003601074219, -0.0588836669921875, -0.05102729797363281, -0.043170928955078125, -0.03531455993652344, -0.02745819091796875, -0.019601821899414062, -0.011745452880859375, -0.0038890838623046875, 0.00396728515625, 0.011823654174804688, 0.019680023193359375, 0.027536392211914062, 0.03539276123046875, 0.04324913024902344, 0.051105499267578125, 0.05896186828613281, 0.0668182373046875, 0.07467460632324219, 0.08253097534179688, 0.09038734436035156, 0.09824371337890625, 0.10610008239746094, 0.11395645141601562, 0.12181282043457031, 0.129669189453125, 0.1375255584716797, 0.14538192749023438, 0.15323829650878906, 0.16109466552734375, 0.16895103454589844, 0.17680740356445312, 0.1846637725830078, 0.1925201416015625, 0.2003765106201172, 0.20823287963867188, 0.21608924865722656, 0.22394561767578125, 0.23180198669433594, 0.23965835571289062, 0.2475147247314453, 0.25537109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 18.0, 18.0, 18.0, 40.0, 43.0, 50.0, 58.0, 61.0, 65.0, 65.0, 63.0, 74.0, 70.0, 55.0, 59.0, 36.0, 42.0, 37.0, 21.0, 22.0, 20.0, 8.0, 6.0, 9.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.22412109375, -0.21869850158691406, -0.21327590942382812, -0.2078533172607422, -0.20243072509765625, -0.1970081329345703, -0.19158554077148438, -0.18616294860839844, -0.1807403564453125, -0.17531776428222656, -0.16989517211914062, -0.1644725799560547, -0.15904998779296875, -0.1536273956298828, -0.14820480346679688, -0.14278221130371094, -0.137359619140625, -0.13193702697753906, -0.12651443481445312, -0.12109184265136719, -0.11566925048828125, -0.11024665832519531, -0.10482406616210938, -0.09940147399902344, -0.0939788818359375, -0.08855628967285156, -0.08313369750976562, -0.07771110534667969, -0.07228851318359375, -0.06686592102050781, -0.061443328857421875, -0.05602073669433594, -0.05059814453125, -0.04517555236816406, -0.039752960205078125, -0.03433036804199219, -0.02890777587890625, -0.023485183715820312, -0.018062591552734375, -0.012639999389648438, -0.0072174072265625, -0.0017948150634765625, 0.003627777099609375, 0.009050369262695312, 0.01447296142578125, 0.019895553588867188, 0.025318145751953125, 0.030740737915039062, 0.036163330078125, 0.04158592224121094, 0.047008514404296875, 0.05243110656738281, 0.05785369873046875, 0.06327629089355469, 0.06869888305664062, 0.07412147521972656, 0.0795440673828125, 0.08496665954589844, 0.09038925170898438, 0.09581184387207031, 0.10123443603515625, 0.10665702819824219, 0.11207962036132812, 0.11750221252441406, 0.1229248046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 14.0, 19.0, 31.0, 35.0, 44.0, 71.0, 92.0, 146.0, 188.0, 331.0, 499.0, 869.0, 1621.0, 3403.0, 8548.0, 24844.0, 98805.0, 656414.0, 192052.0, 38542.0, 12223.0, 4744.0, 2105.0, 1111.0, 612.0, 339.0, 252.0, 165.0, 94.0, 79.0, 51.0, 51.0, 38.0, 18.0, 17.0, 14.0, 11.0, 5.0, 2.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.431640625, -0.4180145263671875, -0.404388427734375, -0.3907623291015625, -0.37713623046875, -0.3635101318359375, -0.349884033203125, -0.3362579345703125, -0.3226318359375, -0.3090057373046875, -0.295379638671875, -0.2817535400390625, -0.26812744140625, -0.2545013427734375, -0.240875244140625, -0.2272491455078125, -0.213623046875, -0.1999969482421875, -0.186370849609375, -0.1727447509765625, -0.15911865234375, -0.1454925537109375, -0.131866455078125, -0.1182403564453125, -0.1046142578125, -0.0909881591796875, -0.077362060546875, -0.0637359619140625, -0.05010986328125, -0.0364837646484375, -0.022857666015625, -0.0092315673828125, 0.00439453125, 0.0180206298828125, 0.031646728515625, 0.0452728271484375, 0.05889892578125, 0.0725250244140625, 0.086151123046875, 0.0997772216796875, 0.1134033203125, 0.1270294189453125, 0.140655517578125, 0.1542816162109375, 0.16790771484375, 0.1815338134765625, 0.195159912109375, 0.2087860107421875, 0.222412109375, 0.2360382080078125, 0.249664306640625, 0.2632904052734375, 0.27691650390625, 0.2905426025390625, 0.304168701171875, 0.3177947998046875, 0.3314208984375, 0.3450469970703125, 0.358673095703125, 0.3722991943359375, 0.38592529296875, 0.3995513916015625, 0.413177490234375, 0.4268035888671875, 0.4404296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 21.0, 13.0, 15.0, 19.0, 24.0, 30.0, 28.0, 29.0, 38.0, 50.0, 51.0, 58.0, 62.0, 50.0, 47.0, 46.0, 58.0, 61.0, 49.0, 40.0, 41.0, 29.0, 29.0, 16.0, 12.0, 9.0, 8.0, 6.0, 7.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5829925537109375, -0.564910888671875, -0.5468292236328125, -0.52874755859375, -0.5106658935546875, -0.492584228515625, -0.4745025634765625, -0.4564208984375, -0.4383392333984375, -0.420257568359375, -0.4021759033203125, -0.38409423828125, -0.3660125732421875, -0.347930908203125, -0.3298492431640625, -0.311767578125, -0.2936859130859375, -0.275604248046875, -0.2575225830078125, -0.23944091796875, -0.2213592529296875, -0.203277587890625, -0.1851959228515625, -0.1671142578125, -0.1490325927734375, -0.130950927734375, -0.1128692626953125, -0.09478759765625, -0.0767059326171875, -0.058624267578125, -0.0405426025390625, -0.0224609375, -0.0043792724609375, 0.013702392578125, 0.0317840576171875, 0.04986572265625, 0.0679473876953125, 0.086029052734375, 0.1041107177734375, 0.1221923828125, 0.1402740478515625, 0.158355712890625, 0.1764373779296875, 0.19451904296875, 0.2126007080078125, 0.230682373046875, 0.2487640380859375, 0.266845703125, 0.2849273681640625, 0.303009033203125, 0.3210906982421875, 0.33917236328125, 0.3572540283203125, 0.375335693359375, 0.3934173583984375, 0.4114990234375, 0.4295806884765625, 0.447662353515625, 0.4657440185546875, 0.48382568359375, 0.5019073486328125, 0.519989013671875, 0.5380706787109375, 0.55615234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 7.0, 13.0, 17.0, 18.0, 42.0, 105.0, 227.0, 552.0, 1737.0, 7587.0, 75188.0, 864464.0, 87383.0, 8246.0, 1856.0, 617.0, 245.0, 101.0, 54.0, 24.0, 21.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.3939056396484375, -0.380096435546875, -0.3662872314453125, -0.35247802734375, -0.3386688232421875, -0.324859619140625, -0.3110504150390625, -0.2972412109375, -0.2834320068359375, -0.269622802734375, -0.2558135986328125, -0.24200439453125, -0.2281951904296875, -0.214385986328125, -0.2005767822265625, -0.186767578125, -0.1729583740234375, -0.159149169921875, -0.1453399658203125, -0.13153076171875, -0.1177215576171875, -0.103912353515625, -0.0901031494140625, -0.0762939453125, -0.0624847412109375, -0.048675537109375, -0.0348663330078125, -0.02105712890625, -0.0072479248046875, 0.006561279296875, 0.0203704833984375, 0.0341796875, 0.0479888916015625, 0.061798095703125, 0.0756072998046875, 0.08941650390625, 0.1032257080078125, 0.117034912109375, 0.1308441162109375, 0.1446533203125, 0.1584625244140625, 0.172271728515625, 0.1860809326171875, 0.19989013671875, 0.2136993408203125, 0.227508544921875, 0.2413177490234375, 0.255126953125, 0.2689361572265625, 0.282745361328125, 0.2965545654296875, 0.31036376953125, 0.3241729736328125, 0.337982177734375, 0.3517913818359375, 0.3656005859375, 0.3794097900390625, 0.393218994140625, 0.4070281982421875, 0.42083740234375, 0.4346466064453125, 0.448455810546875, 0.4622650146484375, 0.47607421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 7.0, 10.0, 8.0, 9.0, 23.0, 25.0, 41.0, 60.0, 69.0, 93.0, 117.0, 123.0, 102.0, 71.0, 63.0, 43.0, 30.0, 31.0, 19.0, 13.0, 6.0, 4.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.900859832763672e-05, -5.699321627616882e-05, -5.497783422470093e-05, -5.296245217323303e-05, -5.094707012176514e-05, -4.893168807029724e-05, -4.6916306018829346e-05, -4.490092396736145e-05, -4.2885541915893555e-05, -4.087015986442566e-05, -3.8854777812957764e-05, -3.683939576148987e-05, -3.482401371002197e-05, -3.280863165855408e-05, -3.079324960708618e-05, -2.8777867555618286e-05, -2.676248550415039e-05, -2.4747103452682495e-05, -2.27317214012146e-05, -2.0716339349746704e-05, -1.870095729827881e-05, -1.6685575246810913e-05, -1.4670193195343018e-05, -1.2654811143875122e-05, -1.0639429092407227e-05, -8.624047040939331e-06, -6.6086649894714355e-06, -4.59328293800354e-06, -2.5779008865356445e-06, -5.62518835067749e-07, 1.4528632164001465e-06, 3.468245267868042e-06, 5.4836273193359375e-06, 7.499009370803833e-06, 9.514391422271729e-06, 1.1529773473739624e-05, 1.354515552520752e-05, 1.5560537576675415e-05, 1.757591962814331e-05, 1.9591301679611206e-05, 2.16066837310791e-05, 2.3622065782546997e-05, 2.5637447834014893e-05, 2.7652829885482788e-05, 2.9668211936950684e-05, 3.168359398841858e-05, 3.3698976039886475e-05, 3.571435809135437e-05, 3.7729740142822266e-05, 3.974512219429016e-05, 4.176050424575806e-05, 4.377588629722595e-05, 4.579126834869385e-05, 4.780665040016174e-05, 4.982203245162964e-05, 5.1837414503097534e-05, 5.385279655456543e-05, 5.5868178606033325e-05, 5.788356065750122e-05, 5.9898942708969116e-05, 6.191432476043701e-05, 6.392970681190491e-05, 6.59450888633728e-05, 6.79604709148407e-05, 6.99758529663086e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 24.0, 45.0, 68.0, 124.0, 180.0, 271.0, 490.0, 1007.0, 2215.0, 6206.0, 22785.0, 143713.0, 706437.0, 133068.0, 21515.0, 6052.0, 2073.0, 952.0, 486.0, 258.0, 165.0, 100.0, 87.0, 33.0, 35.0, 16.0, 22.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2754402160644531, -0.26767730712890625, -0.2599143981933594, -0.2521514892578125, -0.24438858032226562, -0.23662567138671875, -0.22886276245117188, -0.221099853515625, -0.21333694458007812, -0.20557403564453125, -0.19781112670898438, -0.1900482177734375, -0.18228530883789062, -0.17452239990234375, -0.16675949096679688, -0.15899658203125, -0.15123367309570312, -0.14347076416015625, -0.13570785522460938, -0.1279449462890625, -0.12018203735351562, -0.11241912841796875, -0.10465621948242188, -0.096893310546875, -0.08913040161132812, -0.08136749267578125, -0.07360458374023438, -0.0658416748046875, -0.058078765869140625, -0.05031585693359375, -0.042552947998046875, -0.0347900390625, -0.027027130126953125, -0.01926422119140625, -0.011501312255859375, -0.0037384033203125, 0.004024505615234375, 0.01178741455078125, 0.019550323486328125, 0.027313232421875, 0.035076141357421875, 0.04283905029296875, 0.050601959228515625, 0.0583648681640625, 0.06612777709960938, 0.07389068603515625, 0.08165359497070312, 0.08941650390625, 0.09717941284179688, 0.10494232177734375, 0.11270523071289062, 0.1204681396484375, 0.12823104858398438, 0.13599395751953125, 0.14375686645507812, 0.151519775390625, 0.15928268432617188, 0.16704559326171875, 0.17480850219726562, 0.1825714111328125, 0.19033432006835938, 0.19809722900390625, 0.20586013793945312, 0.213623046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 3.0, 8.0, 10.0, 18.0, 20.0, 24.0, 40.0, 39.0, 57.0, 47.0, 68.0, 96.0, 88.0, 79.0, 81.0, 59.0, 49.0, 47.0, 34.0, 24.0, 18.0, 12.0, 12.0, 7.0, 9.0, 7.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2423095703125, -0.2360210418701172, -0.22973251342773438, -0.22344398498535156, -0.21715545654296875, -0.21086692810058594, -0.20457839965820312, -0.1982898712158203, -0.1920013427734375, -0.1857128143310547, -0.17942428588867188, -0.17313575744628906, -0.16684722900390625, -0.16055870056152344, -0.15427017211914062, -0.1479816436767578, -0.141693115234375, -0.1354045867919922, -0.12911605834960938, -0.12282752990722656, -0.11653900146484375, -0.11025047302246094, -0.10396194458007812, -0.09767341613769531, -0.0913848876953125, -0.08509635925292969, -0.07880783081054688, -0.07251930236816406, -0.06623077392578125, -0.05994224548339844, -0.053653717041015625, -0.04736518859863281, -0.04107666015625, -0.03478813171386719, -0.028499603271484375, -0.022211074829101562, -0.01592254638671875, -0.009634017944335938, -0.003345489501953125, 0.0029430389404296875, 0.0092315673828125, 0.015520095825195312, 0.021808624267578125, 0.028097152709960938, 0.03438568115234375, 0.04067420959472656, 0.046962738037109375, 0.05325126647949219, 0.059539794921875, 0.06582832336425781, 0.07211685180664062, 0.07840538024902344, 0.08469390869140625, 0.09098243713378906, 0.09727096557617188, 0.10355949401855469, 0.1098480224609375, 0.11613655090332031, 0.12242507934570312, 0.12871360778808594, 0.13500213623046875, 0.14129066467285156, 0.14757919311523438, 0.1538677215576172, 0.16015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 10.0, 13.0, 20.0, 48.0, 60.0, 96.0, 118.0, 157.0, 140.0, 115.0, 70.0, 55.0, 31.0, 19.0, 15.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.539969444274902, -4.439096927642822, -4.338224411010742, -4.237351894378662, -4.136479377746582, -4.035606861114502, -3.934734582901001, -3.833862066268921, -3.732989549636841, -3.6321170330047607, -3.5312445163726807, -3.4303722381591797, -3.3294997215270996, -3.2286272048950195, -3.1277546882629395, -3.0268821716308594, -2.9260096549987793, -2.825137138366699, -2.724264621734619, -2.623392105102539, -2.522519826889038, -2.421647310256958, -2.320774793624878, -2.219902276992798, -2.119029998779297, -2.018157482147217, -1.9172850847244263, -1.8164125680923462, -1.7155400514602661, -1.6146676540374756, -1.5137951374053955, -1.4129226207733154, -1.3120501041412354, -1.2111775875091553, -1.1103051900863647, -1.0094326734542847, -0.9085601568222046, -0.8076876997947693, -0.706815242767334, -0.6059427261352539, -0.5050702691078186, -0.4041977822780609, -0.3033252954483032, -0.20245283842086792, -0.10158035159111023, -0.0007078647613525391, 0.10016459226608276, 0.20103710889816284, 0.30190956592559814, 0.40278205275535583, 0.5036545395851135, 0.6045269966125488, 0.7053995132446289, 0.8062719702720642, 0.9071444272994995, 1.0080169439315796, 1.1088893413543701, 1.2097618579864502, 1.3106342554092407, 1.4115067720413208, 1.5123792886734009, 1.6132516860961914, 1.7141242027282715, 1.8149967193603516, 1.9158692359924316]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 9.0, 13.0, 20.0, 19.0, 18.0, 16.0, 22.0, 21.0, 28.0, 26.0, 33.0, 30.0, 38.0, 47.0, 42.0, 49.0, 46.0, 43.0, 41.0, 44.0, 44.0, 31.0, 33.0, 36.0, 26.0, 18.0, 26.0, 31.0, 15.0, 21.0, 17.0, 11.0, 11.0, 12.0, 4.0, 11.0, 3.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.971482753753662, -1.9116636514663696, -1.8518446683883667, -1.7920255661010742, -1.7322065830230713, -1.6723874807357788, -1.6125683784484863, -1.5527493953704834, -1.4929304122924805, -1.433111310005188, -1.373292326927185, -1.3134732246398926, -1.2536542415618896, -1.1938351392745972, -1.1340160369873047, -1.0741970539093018, -1.0143779516220093, -0.9545589089393616, -0.8947398662567139, -0.8349207639694214, -0.7751017808914185, -0.715282678604126, -0.6554636359214783, -0.5956445932388306, -0.5358255505561829, -0.47600650787353516, -0.41618746519088745, -0.35636839270591736, -0.29654935002326965, -0.23673030734062195, -0.17691123485565186, -0.11709219217300415, -0.057273030281066895, 0.0025460198521614075, 0.06236506998538971, 0.12218412756919861, 0.1820031702518463, 0.24182221293449402, 0.3016412854194641, 0.3614603281021118, 0.4212793707847595, 0.4810984134674072, 0.5409174561500549, 0.6007364988327026, 0.6605556011199951, 0.720374584197998, 0.7801936864852905, 0.8400127291679382, 0.8998317718505859, 0.9596508145332336, 1.0194698572158813, 1.0792889595031738, 1.1391079425811768, 1.1989270448684692, 1.2587461471557617, 1.3185651302337646, 1.3783841133117676, 1.43820321559906, 1.498022198677063, 1.5578413009643555, 1.6176602840423584, 1.6774793863296509, 1.7372984886169434, 1.7971174716949463, 1.8569365739822388]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 15.0, 22.0, 32.0, 42.0, 76.0, 117.0, 171.0, 319.0, 417.0, 704.0, 1192.0, 1962.0, 3469.0, 6523.0, 12811.0, 29526.0, 84100.0, 374297.0, 2225782.0, 1167311.0, 189165.0, 53749.0, 20990.0, 9645.0, 5053.0, 2709.0, 1534.0, 954.0, 561.0, 374.0, 232.0, 164.0, 91.0, 55.0, 42.0, 27.0, 12.0, 14.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.26953125, -0.2629241943359375, -0.256317138671875, -0.2497100830078125, -0.24310302734375, -0.2364959716796875, -0.229888916015625, -0.2232818603515625, -0.2166748046875, -0.2100677490234375, -0.203460693359375, -0.1968536376953125, -0.19024658203125, -0.1836395263671875, -0.177032470703125, -0.1704254150390625, -0.163818359375, -0.1572113037109375, -0.150604248046875, -0.1439971923828125, -0.13739013671875, -0.1307830810546875, -0.124176025390625, -0.1175689697265625, -0.1109619140625, -0.1043548583984375, -0.097747802734375, -0.0911407470703125, -0.08453369140625, -0.0779266357421875, -0.071319580078125, -0.0647125244140625, -0.05810546875, -0.0514984130859375, -0.044891357421875, -0.0382843017578125, -0.03167724609375, -0.0250701904296875, -0.018463134765625, -0.0118560791015625, -0.0052490234375, 0.0013580322265625, 0.007965087890625, 0.0145721435546875, 0.02117919921875, 0.0277862548828125, 0.034393310546875, 0.0410003662109375, 0.047607421875, 0.0542144775390625, 0.060821533203125, 0.0674285888671875, 0.07403564453125, 0.0806427001953125, 0.087249755859375, 0.0938568115234375, 0.1004638671875, 0.1070709228515625, 0.113677978515625, 0.1202850341796875, 0.12689208984375, 0.1334991455078125, 0.140106201171875, 0.1467132568359375, 0.1533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 10.0, 11.0, 13.0, 24.0, 33.0, 22.0, 39.0, 44.0, 51.0, 41.0, 55.0, 60.0, 55.0, 60.0, 53.0, 58.0, 48.0, 39.0, 47.0, 45.0, 32.0, 25.0, 29.0, 15.0, 21.0, 18.0, 12.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14482784271240234, -0.1406078338623047, -0.13638782501220703, -0.13216781616210938, -0.12794780731201172, -0.12372779846191406, -0.1195077896118164, -0.11528778076171875, -0.1110677719116211, -0.10684776306152344, -0.10262775421142578, -0.09840774536132812, -0.09418773651123047, -0.08996772766113281, -0.08574771881103516, -0.0815277099609375, -0.07730770111083984, -0.07308769226074219, -0.06886768341064453, -0.06464767456054688, -0.06042766571044922, -0.05620765686035156, -0.051987648010253906, -0.04776763916015625, -0.043547630310058594, -0.03932762145996094, -0.03510761260986328, -0.030887603759765625, -0.02666759490966797, -0.022447586059570312, -0.018227577209472656, -0.014007568359375, -0.009787559509277344, -0.0055675506591796875, -0.0013475418090820312, 0.002872467041015625, 0.007092475891113281, 0.011312484741210938, 0.015532493591308594, 0.01975250244140625, 0.023972511291503906, 0.028192520141601562, 0.03241252899169922, 0.036632537841796875, 0.04085254669189453, 0.04507255554199219, 0.049292564392089844, 0.0535125732421875, 0.057732582092285156, 0.06195259094238281, 0.06617259979248047, 0.07039260864257812, 0.07461261749267578, 0.07883262634277344, 0.0830526351928711, 0.08727264404296875, 0.0914926528930664, 0.09571266174316406, 0.09993267059326172, 0.10415267944335938, 0.10837268829345703, 0.11259269714355469, 0.11681270599365234, 0.12103271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 6.0, 8.0, 20.0, 21.0, 40.0, 75.0, 117.0, 226.0, 417.0, 980.0, 2549.0, 7829.0, 31170.0, 184446.0, 2961484.0, 898544.0, 81404.0, 16999.0, 4849.0, 1732.0, 665.0, 287.0, 143.0, 96.0, 54.0, 34.0, 22.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.515625, -0.5016098022460938, -0.4875946044921875, -0.47357940673828125, -0.459564208984375, -0.44554901123046875, -0.4315338134765625, -0.41751861572265625, -0.40350341796875, -0.38948822021484375, -0.3754730224609375, -0.36145782470703125, -0.347442626953125, -0.33342742919921875, -0.3194122314453125, -0.30539703369140625, -0.2913818359375, -0.27736663818359375, -0.2633514404296875, -0.24933624267578125, -0.235321044921875, -0.22130584716796875, -0.2072906494140625, -0.19327545166015625, -0.17926025390625, -0.16524505615234375, -0.1512298583984375, -0.13721466064453125, -0.123199462890625, -0.10918426513671875, -0.0951690673828125, -0.08115386962890625, -0.067138671875, -0.05312347412109375, -0.0391082763671875, -0.02509307861328125, -0.011077880859375, 0.00293731689453125, 0.0169525146484375, 0.03096771240234375, 0.04498291015625, 0.05899810791015625, 0.0730133056640625, 0.08702850341796875, 0.101043701171875, 0.11505889892578125, 0.1290740966796875, 0.14308929443359375, 0.1571044921875, 0.17111968994140625, 0.1851348876953125, 0.19915008544921875, 0.213165283203125, 0.22718048095703125, 0.2411956787109375, 0.25521087646484375, 0.26922607421875, 0.28324127197265625, 0.2972564697265625, 0.31127166748046875, 0.325286865234375, 0.33930206298828125, 0.3533172607421875, 0.36733245849609375, 0.38134765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 10.0, 10.0, 20.0, 27.0, 30.0, 34.0, 44.0, 60.0, 83.0, 124.0, 182.0, 277.0, 476.0, 666.0, 668.0, 453.0, 271.0, 187.0, 114.0, 83.0, 61.0, 42.0, 31.0, 27.0, 11.0, 16.0, 8.0, 12.0, 7.0, 5.0, 7.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36522674560546875, -0.3530120849609375, -0.34079742431640625, -0.328582763671875, -0.31636810302734375, -0.3041534423828125, -0.29193878173828125, -0.27972412109375, -0.26750946044921875, -0.2552947998046875, -0.24308013916015625, -0.230865478515625, -0.21865081787109375, -0.2064361572265625, -0.19422149658203125, -0.1820068359375, -0.16979217529296875, -0.1575775146484375, -0.14536285400390625, -0.133148193359375, -0.12093353271484375, -0.1087188720703125, -0.09650421142578125, -0.08428955078125, -0.07207489013671875, -0.0598602294921875, -0.04764556884765625, -0.035430908203125, -0.02321624755859375, -0.0110015869140625, 0.00121307373046875, 0.013427734375, 0.02564239501953125, 0.0378570556640625, 0.05007171630859375, 0.062286376953125, 0.07450103759765625, 0.0867156982421875, 0.09893035888671875, 0.11114501953125, 0.12335968017578125, 0.1355743408203125, 0.14778900146484375, 0.160003662109375, 0.17221832275390625, 0.1844329833984375, 0.19664764404296875, 0.2088623046875, 0.22107696533203125, 0.2332916259765625, 0.24550628662109375, 0.257720947265625, 0.26993560791015625, 0.2821502685546875, 0.29436492919921875, 0.30657958984375, 0.31879425048828125, 0.3310089111328125, 0.34322357177734375, 0.355438232421875, 0.36765289306640625, 0.3798675537109375, 0.39208221435546875, 0.404296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 10.0, 16.0, 12.0, 64.0, 123.0, 236.0, 244.0, 151.0, 66.0, 41.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.866659164428711, -7.679159164428711, -7.491659641265869, -7.304160118103027, -7.116660118103027, -6.929160118103027, -6.7416605949401855, -6.554161071777344, -6.366661071777344, -6.179161071777344, -5.991661548614502, -5.80416202545166, -5.61666202545166, -5.42916202545166, -5.241662502288818, -5.054162979125977, -4.866662979125977, -4.679162979125977, -4.491663455963135, -4.304163932800293, -4.116663932800293, -3.929164171218872, -3.741664409637451, -3.5541646480560303, -3.3666648864746094, -3.1791651248931885, -2.9916653633117676, -2.8041656017303467, -2.616665840148926, -2.429166078567505, -2.241666316986084, -2.054166555404663, -1.8666667938232422, -1.6791670322418213, -1.4916672706604004, -1.3041675090789795, -1.1166677474975586, -0.9291679859161377, -0.7416682243347168, -0.5541684627532959, -0.366668701171875, -0.1791689395904541, 0.008330821990966797, 0.1958305835723877, 0.3833303451538086, 0.5708301067352295, 0.7583298683166504, 0.9458296298980713, 1.1333293914794922, 1.320829153060913, 1.508328914642334, 1.6958286762237549, 1.8833284378051758, 2.0708281993865967, 2.2583279609680176, 2.4458277225494385, 2.6333274841308594, 2.8208272457122803, 3.008327007293701, 3.195826768875122, 3.383326530456543, 3.570826292037964, 3.7583260536193848, 3.9458258152008057, 4.133325576782227]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 15.0, 16.0, 22.0, 23.0, 26.0, 26.0, 33.0, 32.0, 40.0, 45.0, 42.0, 42.0, 52.0, 49.0, 45.0, 49.0, 50.0, 53.0, 52.0, 37.0, 31.0, 28.0, 38.0, 24.0, 29.0, 13.0, 16.0, 9.0, 14.0, 9.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.54189133644104, -2.473738670349121, -2.405586004257202, -2.337433338165283, -2.2692806720733643, -2.2011280059814453, -2.1329753398895264, -2.0648226737976074, -1.996670126914978, -1.928517460823059, -1.8603647947311401, -1.7922121286392212, -1.7240595817565918, -1.6559069156646729, -1.587754249572754, -1.519601583480835, -1.451448917388916, -1.383296251296997, -1.3151435852050781, -1.2469909191131592, -1.1788382530212402, -1.1106855869293213, -1.042533040046692, -0.974380373954773, -0.906227707862854, -0.8380750417709351, -0.7699223756790161, -0.7017697691917419, -0.633617103099823, -0.565464437007904, -0.4973118007183075, -0.42915916442871094, -0.3610062599182129, -0.29285359382629395, -0.2247009575366974, -0.15654830634593964, -0.08839565515518188, -0.02024298906326294, 0.04790964722633362, 0.11606228351593018, 0.18421494960784912, 0.25236761569976807, 0.3205202519893646, 0.3886728882789612, 0.4568255543708801, 0.5249782204627991, 0.5931308269500732, 0.6612834930419922, 0.7294361591339111, 0.7975888252258301, 0.865741491317749, 0.9338940978050232, 1.002046823501587, 1.0701994895935059, 1.1383520364761353, 1.2065047025680542, 1.2746573686599731, 1.342810034751892, 1.410962700843811, 1.47911536693573, 1.5472679138183594, 1.6154205799102783, 1.6835732460021973, 1.7517259120941162, 1.8198785781860352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 5.0, 16.0, 20.0, 30.0, 32.0, 62.0, 90.0, 136.0, 193.0, 252.0, 409.0, 681.0, 966.0, 1451.0, 2437.0, 3995.0, 6966.0, 11797.0, 21835.0, 41057.0, 80007.0, 167887.0, 312523.0, 197987.0, 92835.0, 46604.0, 25000.0, 13607.0, 7663.0, 4436.0, 2740.0, 1681.0, 1066.0, 714.0, 451.0, 301.0, 212.0, 143.0, 68.0, 54.0, 42.0, 29.0, 27.0, 15.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.220947265625, -0.2137279510498047, -0.20650863647460938, -0.19928932189941406, -0.19207000732421875, -0.18485069274902344, -0.17763137817382812, -0.1704120635986328, -0.1631927490234375, -0.1559734344482422, -0.14875411987304688, -0.14153480529785156, -0.13431549072265625, -0.12709617614746094, -0.11987686157226562, -0.11265754699707031, -0.105438232421875, -0.09821891784667969, -0.09099960327148438, -0.08378028869628906, -0.07656097412109375, -0.06934165954589844, -0.062122344970703125, -0.05490303039550781, -0.0476837158203125, -0.04046440124511719, -0.033245086669921875, -0.026025772094726562, -0.01880645751953125, -0.011587142944335938, -0.004367828369140625, 0.0028514862060546875, 0.01007080078125, 0.017290115356445312, 0.024509429931640625, 0.03172874450683594, 0.03894805908203125, 0.04616737365722656, 0.053386688232421875, 0.06060600280761719, 0.0678253173828125, 0.07504463195800781, 0.08226394653320312, 0.08948326110839844, 0.09670257568359375, 0.10392189025878906, 0.11114120483398438, 0.11836051940917969, 0.125579833984375, 0.1327991485595703, 0.14001846313476562, 0.14723777770996094, 0.15445709228515625, 0.16167640686035156, 0.16889572143554688, 0.1761150360107422, 0.1833343505859375, 0.1905536651611328, 0.19777297973632812, 0.20499229431152344, 0.21221160888671875, 0.21943092346191406, 0.22665023803710938, 0.2338695526123047, 0.2410888671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 13.0, 12.0, 12.0, 14.0, 18.0, 17.0, 28.0, 32.0, 35.0, 43.0, 41.0, 45.0, 50.0, 58.0, 48.0, 39.0, 65.0, 35.0, 41.0, 48.0, 51.0, 57.0, 43.0, 20.0, 16.0, 22.0, 22.0, 13.0, 15.0, 11.0, 11.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11138916015625, -0.10715198516845703, -0.10291481018066406, -0.0986776351928711, -0.09444046020507812, -0.09020328521728516, -0.08596611022949219, -0.08172893524169922, -0.07749176025390625, -0.07325458526611328, -0.06901741027832031, -0.06478023529052734, -0.060543060302734375, -0.056305885314941406, -0.05206871032714844, -0.04783153533935547, -0.0435943603515625, -0.03935718536376953, -0.03512001037597656, -0.030882835388183594, -0.026645660400390625, -0.022408485412597656, -0.018171310424804688, -0.013934135437011719, -0.00969696044921875, -0.005459785461425781, -0.0012226104736328125, 0.0030145645141601562, 0.007251739501953125, 0.011488914489746094, 0.015726089477539062, 0.01996326446533203, 0.024200439453125, 0.02843761444091797, 0.03267478942871094, 0.036911964416503906, 0.041149139404296875, 0.045386314392089844, 0.04962348937988281, 0.05386066436767578, 0.05809783935546875, 0.06233501434326172, 0.06657218933105469, 0.07080936431884766, 0.07504653930664062, 0.0792837142944336, 0.08352088928222656, 0.08775806427001953, 0.0919952392578125, 0.09623241424560547, 0.10046958923339844, 0.1047067642211914, 0.10894393920898438, 0.11318111419677734, 0.11741828918457031, 0.12165546417236328, 0.12589263916015625, 0.13012981414794922, 0.1343669891357422, 0.13860416412353516, 0.14284133911132812, 0.1470785140991211, 0.15131568908691406, 0.15555286407470703, 0.1597900390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 20.0, 17.0, 22.0, 38.0, 36.0, 39.0, 64.0, 87.0, 130.0, 172.0, 240.0, 320.0, 537.0, 839.0, 1409.0, 2575.0, 5433.0, 15115.0, 58780.0, 491457.0, 389110.0, 55641.0, 14581.0, 5482.0, 2491.0, 1378.0, 766.0, 554.0, 310.0, 258.0, 179.0, 122.0, 89.0, 75.0, 44.0, 31.0, 33.0, 19.0, 8.0, 12.0, 14.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0], "bins": [-0.58349609375, -0.567718505859375, -0.55194091796875, -0.536163330078125, -0.5203857421875, -0.504608154296875, -0.48883056640625, -0.473052978515625, -0.457275390625, -0.441497802734375, -0.42572021484375, -0.409942626953125, -0.3941650390625, -0.378387451171875, -0.36260986328125, -0.346832275390625, -0.3310546875, -0.315277099609375, -0.29949951171875, -0.283721923828125, -0.2679443359375, -0.252166748046875, -0.23638916015625, -0.220611572265625, -0.204833984375, -0.189056396484375, -0.17327880859375, -0.157501220703125, -0.1417236328125, -0.125946044921875, -0.11016845703125, -0.094390869140625, -0.07861328125, -0.062835693359375, -0.04705810546875, -0.031280517578125, -0.0155029296875, 0.000274658203125, 0.01605224609375, 0.031829833984375, 0.047607421875, 0.063385009765625, 0.07916259765625, 0.094940185546875, 0.1107177734375, 0.126495361328125, 0.14227294921875, 0.158050537109375, 0.173828125, 0.189605712890625, 0.20538330078125, 0.221160888671875, 0.2369384765625, 0.252716064453125, 0.26849365234375, 0.284271240234375, 0.300048828125, 0.315826416015625, 0.33160400390625, 0.347381591796875, 0.3631591796875, 0.378936767578125, 0.39471435546875, 0.410491943359375, 0.42626953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 10.0, 7.0, 9.0, 14.0, 7.0, 23.0, 20.0, 21.0, 25.0, 35.0, 37.0, 48.0, 44.0, 31.0, 40.0, 38.0, 55.0, 48.0, 49.0, 40.0, 46.0, 40.0, 48.0, 40.0, 37.0, 28.0, 26.0, 29.0, 19.0, 16.0, 12.0, 9.0, 8.0, 12.0, 4.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5719680786132812, -0.5536041259765625, -0.5352401733398438, -0.516876220703125, -0.49851226806640625, -0.4801483154296875, -0.46178436279296875, -0.44342041015625, -0.42505645751953125, -0.4066925048828125, -0.38832855224609375, -0.369964599609375, -0.35160064697265625, -0.3332366943359375, -0.31487274169921875, -0.2965087890625, -0.27814483642578125, -0.2597808837890625, -0.24141693115234375, -0.223052978515625, -0.20468902587890625, -0.1863250732421875, -0.16796112060546875, -0.14959716796875, -0.13123321533203125, -0.1128692626953125, -0.09450531005859375, -0.076141357421875, -0.05777740478515625, -0.0394134521484375, -0.02104949951171875, -0.002685546875, 0.01567840576171875, 0.0340423583984375, 0.05240631103515625, 0.070770263671875, 0.08913421630859375, 0.1074981689453125, 0.12586212158203125, 0.14422607421875, 0.16259002685546875, 0.1809539794921875, 0.19931793212890625, 0.217681884765625, 0.23604583740234375, 0.2544097900390625, 0.27277374267578125, 0.2911376953125, 0.30950164794921875, 0.3278656005859375, 0.34622955322265625, 0.364593505859375, 0.38295745849609375, 0.4013214111328125, 0.41968536376953125, 0.43804931640625, 0.45641326904296875, 0.4747772216796875, 0.49314117431640625, 0.511505126953125, 0.5298690795898438, 0.5482330322265625, 0.5665969848632812, 0.5849609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 10.0, 7.0, 17.0, 42.0, 51.0, 104.0, 146.0, 329.0, 652.0, 1443.0, 4244.0, 16462.0, 88921.0, 657308.0, 230269.0, 36202.0, 8079.0, 2436.0, 939.0, 392.0, 201.0, 106.0, 57.0, 45.0, 15.0, 18.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21511077880859375, -0.2085418701171875, -0.20197296142578125, -0.195404052734375, -0.18883514404296875, -0.1822662353515625, -0.17569732666015625, -0.16912841796875, -0.16255950927734375, -0.1559906005859375, -0.14942169189453125, -0.142852783203125, -0.13628387451171875, -0.1297149658203125, -0.12314605712890625, -0.1165771484375, -0.11000823974609375, -0.1034393310546875, -0.09687042236328125, -0.090301513671875, -0.08373260498046875, -0.0771636962890625, -0.07059478759765625, -0.06402587890625, -0.05745697021484375, -0.0508880615234375, -0.04431915283203125, -0.037750244140625, -0.03118133544921875, -0.0246124267578125, -0.01804351806640625, -0.011474609375, -0.00490570068359375, 0.0016632080078125, 0.00823211669921875, 0.014801025390625, 0.02136993408203125, 0.0279388427734375, 0.03450775146484375, 0.04107666015625, 0.04764556884765625, 0.0542144775390625, 0.06078338623046875, 0.067352294921875, 0.07392120361328125, 0.0804901123046875, 0.08705902099609375, 0.0936279296875, 0.10019683837890625, 0.1067657470703125, 0.11333465576171875, 0.119903564453125, 0.12647247314453125, 0.1330413818359375, 0.13961029052734375, 0.14617919921875, 0.15274810791015625, 0.1593170166015625, 0.16588592529296875, 0.172454833984375, 0.17902374267578125, 0.1855926513671875, 0.19216156005859375, 0.19873046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 10.0, 7.0, 10.0, 5.0, 15.0, 15.0, 15.0, 28.0, 21.0, 31.0, 39.0, 47.0, 57.0, 68.0, 77.0, 100.0, 70.0, 61.0, 49.0, 46.0, 33.0, 36.0, 32.0, 18.0, 16.0, 15.0, 13.0, 8.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.857778549194336e-05, -4.704948514699936e-05, -4.552118480205536e-05, -4.399288445711136e-05, -4.246458411216736e-05, -4.093628376722336e-05, -3.940798342227936e-05, -3.787968307733536e-05, -3.635138273239136e-05, -3.482308238744736e-05, -3.329478204250336e-05, -3.176648169755936e-05, -3.0238181352615356e-05, -2.8709881007671356e-05, -2.7181580662727356e-05, -2.5653280317783356e-05, -2.4124979972839355e-05, -2.2596679627895355e-05, -2.1068379282951355e-05, -1.9540078938007355e-05, -1.8011778593063354e-05, -1.6483478248119354e-05, -1.4955177903175354e-05, -1.3426877558231354e-05, -1.1898577213287354e-05, -1.0370276868343353e-05, -8.841976523399353e-06, -7.313676178455353e-06, -5.7853758335113525e-06, -4.257075488567352e-06, -2.728775143623352e-06, -1.2004747986793518e-06, 3.2782554626464844e-07, 1.8561258912086487e-06, 3.384426236152649e-06, 4.912726581096649e-06, 6.441026926040649e-06, 7.96932727098465e-06, 9.49762761592865e-06, 1.102592796087265e-05, 1.255422830581665e-05, 1.408252865076065e-05, 1.561082899570465e-05, 1.713912934064865e-05, 1.866742968559265e-05, 2.019573003053665e-05, 2.1724030375480652e-05, 2.3252330720424652e-05, 2.4780631065368652e-05, 2.6308931410312653e-05, 2.7837231755256653e-05, 2.9365532100200653e-05, 3.089383244514465e-05, 3.2422132790088654e-05, 3.3950433135032654e-05, 3.5478733479976654e-05, 3.7007033824920654e-05, 3.8535334169864655e-05, 4.0063634514808655e-05, 4.1591934859752655e-05, 4.3120235204696655e-05, 4.4648535549640656e-05, 4.6176835894584656e-05, 4.7705136239528656e-05, 4.9233436584472656e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 11.0, 18.0, 30.0, 52.0, 95.0, 185.0, 332.0, 769.0, 1861.0, 5715.0, 29937.0, 367690.0, 593314.0, 37961.0, 6715.0, 2160.0, 865.0, 414.0, 224.0, 99.0, 45.0, 35.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184326171875, -0.17633056640625, -0.1683349609375, -0.16033935546875, -0.15234375, -0.14434814453125, -0.1363525390625, -0.12835693359375, -0.120361328125, -0.11236572265625, -0.1043701171875, -0.09637451171875, -0.08837890625, -0.08038330078125, -0.0723876953125, -0.06439208984375, -0.056396484375, -0.04840087890625, -0.0404052734375, -0.03240966796875, -0.0244140625, -0.01641845703125, -0.0084228515625, -0.00042724609375, 0.007568359375, 0.01556396484375, 0.0235595703125, 0.03155517578125, 0.03955078125, 0.04754638671875, 0.0555419921875, 0.06353759765625, 0.071533203125, 0.07952880859375, 0.0875244140625, 0.09552001953125, 0.103515625, 0.11151123046875, 0.1195068359375, 0.12750244140625, 0.135498046875, 0.14349365234375, 0.1514892578125, 0.15948486328125, 0.16748046875, 0.17547607421875, 0.1834716796875, 0.19146728515625, 0.199462890625, 0.20745849609375, 0.2154541015625, 0.22344970703125, 0.2314453125, 0.23944091796875, 0.2474365234375, 0.25543212890625, 0.263427734375, 0.27142333984375, 0.2794189453125, 0.28741455078125, 0.29541015625, 0.30340576171875, 0.3114013671875, 0.31939697265625, 0.327392578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 7.0, 15.0, 13.0, 14.0, 8.0, 16.0, 20.0, 25.0, 33.0, 31.0, 38.0, 39.0, 44.0, 54.0, 65.0, 62.0, 53.0, 57.0, 46.0, 45.0, 46.0, 44.0, 27.0, 30.0, 21.0, 25.0, 17.0, 16.0, 19.0, 14.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1414794921875, -0.13768291473388672, -0.13388633728027344, -0.13008975982666016, -0.12629318237304688, -0.1224966049194336, -0.11870002746582031, -0.11490345001220703, -0.11110687255859375, -0.10731029510498047, -0.10351371765136719, -0.0997171401977539, -0.09592056274414062, -0.09212398529052734, -0.08832740783691406, -0.08453083038330078, -0.0807342529296875, -0.07693767547607422, -0.07314109802246094, -0.06934452056884766, -0.06554794311523438, -0.061751365661621094, -0.05795478820800781, -0.05415821075439453, -0.05036163330078125, -0.04656505584716797, -0.04276847839355469, -0.038971900939941406, -0.035175323486328125, -0.031378746032714844, -0.027582168579101562, -0.02378559112548828, -0.019989013671875, -0.01619243621826172, -0.012395858764648438, -0.008599281311035156, -0.004802703857421875, -0.0010061264038085938, 0.0027904510498046875, 0.006587028503417969, 0.01038360595703125, 0.014180183410644531, 0.017976760864257812, 0.021773338317871094, 0.025569915771484375, 0.029366493225097656, 0.03316307067871094, 0.03695964813232422, 0.0407562255859375, 0.04455280303955078, 0.04834938049316406, 0.052145957946777344, 0.055942535400390625, 0.059739112854003906, 0.06353569030761719, 0.06733226776123047, 0.07112884521484375, 0.07492542266845703, 0.07872200012207031, 0.0825185775756836, 0.08631515502929688, 0.09011173248291016, 0.09390830993652344, 0.09770488739013672, 0.10150146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 12.0, 11.0, 17.0, 43.0, 70.0, 80.0, 142.0, 246.0, 145.0, 97.0, 60.0, 24.0, 16.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6263699531555176, -3.50262713432312, -3.3788843154907227, -3.255141496658325, -3.1313986778259277, -3.0076558589935303, -2.883913040161133, -2.7601704597473145, -2.636427402496338, -2.5126845836639404, -2.388941764831543, -2.2651989459991455, -2.141456127166748, -2.0177133083343506, -1.8939706087112427, -1.7702277898788452, -1.6464850902557373, -1.5227422714233398, -1.3989994525909424, -1.275256633758545, -1.1515138149261475, -1.02777099609375, -0.9040282964706421, -0.7802854776382446, -0.6565426588058472, -0.5327998399734497, -0.40905705094337463, -0.28531426191329956, -0.1615714430809021, -0.03782862424850464, 0.08591413497924805, 0.2096569538116455, 0.33339977264404297, 0.45714259147644043, 0.5808854103088379, 0.7046281695365906, 0.828370988368988, 0.9521138072013855, 1.0758565664291382, 1.1995993852615356, 1.323342204093933, 1.4470850229263306, 1.570827841758728, 1.694570541381836, 1.8183133602142334, 1.9420561790466309, 2.0657989978790283, 2.189541816711426, 2.3132846355438232, 2.4370274543762207, 2.560770273208618, 2.6845130920410156, 2.808255910873413, 2.9319987297058105, 3.055741310119629, 3.1794843673706055, 3.303226947784424, 3.4269697666168213, 3.5507125854492188, 3.674455404281616, 3.7981982231140137, 3.921941041946411, 4.045683860778809, 4.169426441192627, 4.2931694984436035]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 9.0, 13.0, 14.0, 21.0, 10.0, 22.0, 26.0, 30.0, 27.0, 34.0, 36.0, 37.0, 53.0, 54.0, 59.0, 76.0, 73.0, 55.0, 39.0, 41.0, 35.0, 30.0, 31.0, 24.0, 23.0, 18.0, 18.0, 11.0, 11.0, 11.0, 7.0, 12.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5546655654907227, -2.4808285236358643, -2.406991481781006, -2.3331542015075684, -2.25931715965271, -2.1854801177978516, -2.111642837524414, -2.0378057956695557, -1.9639687538146973, -1.8901317119598389, -1.816294550895691, -1.742457389831543, -1.6686203479766846, -1.5947833061218262, -1.5209461450576782, -1.4471089839935303, -1.3732719421386719, -1.2994349002838135, -1.2255977392196655, -1.1517605781555176, -1.0779235363006592, -1.0040864944458008, -0.9302493333816528, -0.8564122319221497, -0.7825751304626465, -0.7087380290031433, -0.6349009275436401, -0.561063826084137, -0.4872267246246338, -0.4133896231651306, -0.33955252170562744, -0.26571542024612427, -0.191878080368042, -0.11804097890853882, -0.044203877449035645, 0.02963322401046753, 0.1034703254699707, 0.17730742692947388, 0.25114452838897705, 0.3249816298484802, 0.3988187313079834, 0.4726558327674866, 0.5464929342269897, 0.6203300356864929, 0.6941671371459961, 0.7680042386054993, 0.8418413400650024, 0.9156784415245056, 0.9895155429840088, 1.0633525848388672, 1.1371897459030151, 1.211026906967163, 1.2848639488220215, 1.3587009906768799, 1.4325381517410278, 1.5063753128051758, 1.5802123546600342, 1.6540493965148926, 1.7278865575790405, 1.8017237186431885, 1.8755607604980469, 1.9493978023529053, 2.0232348442077637, 2.097072124481201, 2.1709091663360596]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 35.0, 48.0, 75.0, 140.0, 226.0, 386.0, 668.0, 1412.0, 2940.0, 7077.0, 18012.0, 55475.0, 245241.0, 1584984.0, 1889823.0, 292761.0, 61198.0, 19378.0, 7568.0, 3226.0, 1510.0, 872.0, 456.0, 264.0, 167.0, 106.0, 77.0, 42.0, 19.0, 24.0, 14.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.2039642333984375, -0.197601318359375, -0.1912384033203125, -0.18487548828125, -0.1785125732421875, -0.172149658203125, -0.1657867431640625, -0.159423828125, -0.1530609130859375, -0.146697998046875, -0.1403350830078125, -0.13397216796875, -0.1276092529296875, -0.121246337890625, -0.1148834228515625, -0.1085205078125, -0.1021575927734375, -0.095794677734375, -0.0894317626953125, -0.08306884765625, -0.0767059326171875, -0.070343017578125, -0.0639801025390625, -0.0576171875, -0.0512542724609375, -0.044891357421875, -0.0385284423828125, -0.03216552734375, -0.0258026123046875, -0.019439697265625, -0.0130767822265625, -0.0067138671875, -0.0003509521484375, 0.006011962890625, 0.0123748779296875, 0.01873779296875, 0.0251007080078125, 0.031463623046875, 0.0378265380859375, 0.044189453125, 0.0505523681640625, 0.056915283203125, 0.0632781982421875, 0.06964111328125, 0.0760040283203125, 0.082366943359375, 0.0887298583984375, 0.0950927734375, 0.1014556884765625, 0.107818603515625, 0.1141815185546875, 0.12054443359375, 0.1269073486328125, 0.133270263671875, 0.1396331787109375, 0.14599609375, 0.1523590087890625, 0.158721923828125, 0.1650848388671875, 0.17144775390625, 0.1778106689453125, 0.184173583984375, 0.1905364990234375, 0.1968994140625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 9.0, 12.0, 10.0, 12.0, 14.0, 21.0, 33.0, 30.0, 33.0, 46.0, 48.0, 54.0, 65.0, 67.0, 77.0, 60.0, 59.0, 59.0, 43.0, 39.0, 30.0, 32.0, 27.0, 21.0, 22.0, 20.0, 16.0, 15.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11224365234375, -0.10732555389404297, -0.10240745544433594, -0.0974893569946289, -0.09257125854492188, -0.08765316009521484, -0.08273506164550781, -0.07781696319580078, -0.07289886474609375, -0.06798076629638672, -0.06306266784667969, -0.058144569396972656, -0.053226470947265625, -0.048308372497558594, -0.04339027404785156, -0.03847217559814453, -0.0335540771484375, -0.02863597869873047, -0.023717880249023438, -0.018799781799316406, -0.013881683349609375, -0.008963584899902344, -0.0040454864501953125, 0.0008726119995117188, 0.00579071044921875, 0.010708808898925781, 0.015626907348632812, 0.020545005798339844, 0.025463104248046875, 0.030381202697753906, 0.03529930114746094, 0.04021739959716797, 0.045135498046875, 0.05005359649658203, 0.05497169494628906, 0.059889793395996094, 0.06480789184570312, 0.06972599029541016, 0.07464408874511719, 0.07956218719482422, 0.08448028564453125, 0.08939838409423828, 0.09431648254394531, 0.09923458099365234, 0.10415267944335938, 0.1090707778930664, 0.11398887634277344, 0.11890697479248047, 0.1238250732421875, 0.12874317169189453, 0.13366127014160156, 0.1385793685913086, 0.14349746704101562, 0.14841556549072266, 0.1533336639404297, 0.15825176239013672, 0.16316986083984375, 0.16808795928955078, 0.1730060577392578, 0.17792415618896484, 0.18284225463867188, 0.1877603530883789, 0.19267845153808594, 0.19759654998779297, 0.2025146484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 31.0, 54.0, 64.0, 112.0, 238.0, 492.0, 1437.0, 4415.0, 16917.0, 88505.0, 1210431.0, 2684663.0, 154346.0, 23710.0, 5707.0, 1808.0, 680.0, 276.0, 114.0, 97.0, 48.0, 30.0, 17.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.400146484375, -0.3876991271972656, -0.37525177001953125, -0.3628044128417969, -0.3503570556640625, -0.3379096984863281, -0.32546234130859375, -0.3130149841308594, -0.300567626953125, -0.2881202697753906, -0.27567291259765625, -0.2632255554199219, -0.2507781982421875, -0.23833084106445312, -0.22588348388671875, -0.21343612670898438, -0.20098876953125, -0.18854141235351562, -0.17609405517578125, -0.16364669799804688, -0.1511993408203125, -0.13875198364257812, -0.12630462646484375, -0.11385726928710938, -0.101409912109375, -0.08896255493164062, -0.07651519775390625, -0.06406784057617188, -0.0516204833984375, -0.039173126220703125, -0.02672576904296875, -0.014278411865234375, -0.0018310546875, 0.010616302490234375, 0.02306365966796875, 0.035511016845703125, 0.0479583740234375, 0.060405731201171875, 0.07285308837890625, 0.08530044555664062, 0.097747802734375, 0.11019515991210938, 0.12264251708984375, 0.13508987426757812, 0.1475372314453125, 0.15998458862304688, 0.17243194580078125, 0.18487930297851562, 0.19732666015625, 0.20977401733398438, 0.22222137451171875, 0.23466873168945312, 0.2471160888671875, 0.2595634460449219, 0.27201080322265625, 0.2844581604003906, 0.296905517578125, 0.3093528747558594, 0.32180023193359375, 0.3342475891113281, 0.3466949462890625, 0.3591423034667969, 0.37158966064453125, 0.3840370178222656, 0.396484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 10.0, 4.0, 12.0, 9.0, 13.0, 16.0, 29.0, 36.0, 41.0, 69.0, 90.0, 126.0, 159.0, 243.0, 336.0, 494.0, 585.0, 537.0, 362.0, 272.0, 192.0, 117.0, 92.0, 55.0, 30.0, 35.0, 18.0, 19.0, 12.0, 12.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2677803039550781, -0.25772857666015625, -0.24767684936523438, -0.2376251220703125, -0.22757339477539062, -0.21752166748046875, -0.20746994018554688, -0.197418212890625, -0.18736648559570312, -0.17731475830078125, -0.16726303100585938, -0.1572113037109375, -0.14715957641601562, -0.13710784912109375, -0.12705612182617188, -0.11700439453125, -0.10695266723632812, -0.09690093994140625, -0.08684921264648438, -0.0767974853515625, -0.06674575805664062, -0.05669403076171875, -0.046642303466796875, -0.036590576171875, -0.026538848876953125, -0.01648712158203125, -0.006435394287109375, 0.0036163330078125, 0.013668060302734375, 0.02371978759765625, 0.033771514892578125, 0.0438232421875, 0.053874969482421875, 0.06392669677734375, 0.07397842407226562, 0.0840301513671875, 0.09408187866210938, 0.10413360595703125, 0.11418533325195312, 0.124237060546875, 0.13428878784179688, 0.14434051513671875, 0.15439224243164062, 0.1644439697265625, 0.17449569702148438, 0.18454742431640625, 0.19459915161132812, 0.20465087890625, 0.21470260620117188, 0.22475433349609375, 0.23480606079101562, 0.2448577880859375, 0.2549095153808594, 0.26496124267578125, 0.2750129699707031, 0.285064697265625, 0.2951164245605469, 0.30516815185546875, 0.3152198791503906, 0.3252716064453125, 0.3353233337402344, 0.34537506103515625, 0.3554267883300781, 0.365478515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 14.0, 23.0, 38.0, 81.0, 147.0, 195.0, 207.0, 138.0, 72.0, 28.0, 15.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.727634906768799, -3.5950684547424316, -3.4625022411346436, -3.3299360275268555, -3.1973695755004883, -3.064803123474121, -2.932236909866333, -2.799670696258545, -2.6671042442321777, -2.5345377922058105, -2.4019715785980225, -2.2694053649902344, -2.136838912963867, -2.0042724609375, -1.871706247329712, -1.7391399145126343, -1.6065735816955566, -1.474007248878479, -1.3414409160614014, -1.2088745832443237, -1.076308250427246, -0.9437419176101685, -0.8111755847930908, -0.6786092519760132, -0.5460429191589355, -0.4134765863418579, -0.2809102535247803, -0.14834392070770264, -0.015777587890625, 0.11678874492645264, 0.24935507774353027, 0.3819214105606079, 0.5144882202148438, 0.6470545530319214, 0.779620885848999, 0.9121872186660767, 1.0447535514831543, 1.177319884300232, 1.3098862171173096, 1.4424525499343872, 1.5750188827514648, 1.7075852155685425, 1.8401515483856201, 1.9727178812026978, 2.1052842140197754, 2.2378506660461426, 2.3704168796539307, 2.5029830932617188, 2.635549545288086, 2.768115997314453, 2.900682210922241, 3.0332484245300293, 3.1658148765563965, 3.2983813285827637, 3.4309475421905518, 3.56351375579834, 3.696080207824707, 3.828646659851074, 3.9612128734588623, 4.09377908706665, 4.226345539093018, 4.358911991119385, 4.491477966308594, 4.624044418334961, 4.756610870361328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 8.0, 11.0, 14.0, 11.0, 11.0, 19.0, 21.0, 24.0, 27.0, 36.0, 39.0, 53.0, 36.0, 60.0, 53.0, 37.0, 42.0, 49.0, 64.0, 50.0, 41.0, 26.0, 43.0, 44.0, 29.0, 29.0, 19.0, 19.0, 10.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666301965713501, -1.609972596168518, -1.5536432266235352, -1.4973138570785522, -1.4409844875335693, -1.384655237197876, -1.328325867652893, -1.2719964981079102, -1.2156671285629272, -1.1593377590179443, -1.1030083894729614, -1.0466790199279785, -0.9903497099876404, -0.9340203404426575, -0.8776910305023193, -0.8213616609573364, -0.7650322914123535, -0.7087029218673706, -0.6523735523223877, -0.5960442423820496, -0.5397148728370667, -0.48338550329208374, -0.4270561635494232, -0.3707268238067627, -0.3143974542617798, -0.2580680847167969, -0.20173874497413635, -0.14540939033031464, -0.08908003568649292, -0.03275066614151001, 0.023578673601150513, 0.07990801334381104, 0.13623738288879395, 0.19256673753261566, 0.24889609217643738, 0.3052254319190979, 0.3615548014640808, 0.4178841710090637, 0.47421351075172424, 0.5305428504943848, 0.5868722200393677, 0.6432015895843506, 0.6995309591293335, 0.7558602690696716, 0.8121896386146545, 0.8685190081596375, 0.9248483180999756, 0.9811776876449585, 1.0375070571899414, 1.0938364267349243, 1.1501657962799072, 1.2064951658248901, 1.262824535369873, 1.3191537857055664, 1.3754831552505493, 1.4318125247955322, 1.4881418943405151, 1.544471263885498, 1.600800633430481, 1.6571300029754639, 1.7134592533111572, 1.7697887420654297, 1.826117992401123, 1.882447361946106, 1.9387767314910889]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 11.0, 15.0, 20.0, 23.0, 50.0, 44.0, 56.0, 128.0, 144.0, 221.0, 353.0, 544.0, 881.0, 1341.0, 2262.0, 3728.0, 7031.0, 14129.0, 30714.0, 76185.0, 224629.0, 417329.0, 159960.0, 58179.0, 24651.0, 11326.0, 5928.0, 3328.0, 1870.0, 1193.0, 703.0, 506.0, 339.0, 226.0, 152.0, 105.0, 78.0, 39.0, 38.0, 23.0, 21.0, 9.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.23987579345703125, -0.2317047119140625, -0.22353363037109375, -0.215362548828125, -0.20719146728515625, -0.1990203857421875, -0.19084930419921875, -0.18267822265625, -0.17450714111328125, -0.1663360595703125, -0.15816497802734375, -0.149993896484375, -0.14182281494140625, -0.1336517333984375, -0.12548065185546875, -0.1173095703125, -0.10913848876953125, -0.1009674072265625, -0.09279632568359375, -0.084625244140625, -0.07645416259765625, -0.0682830810546875, -0.06011199951171875, -0.05194091796875, -0.04376983642578125, -0.0355987548828125, -0.02742767333984375, -0.019256591796875, -0.01108551025390625, -0.0029144287109375, 0.00525665283203125, 0.013427734375, 0.02159881591796875, 0.0297698974609375, 0.03794097900390625, 0.046112060546875, 0.05428314208984375, 0.0624542236328125, 0.07062530517578125, 0.07879638671875, 0.08696746826171875, 0.0951385498046875, 0.10330963134765625, 0.111480712890625, 0.11965179443359375, 0.1278228759765625, 0.13599395751953125, 0.1441650390625, 0.15233612060546875, 0.1605072021484375, 0.16867828369140625, 0.176849365234375, 0.18502044677734375, 0.1931915283203125, 0.20136260986328125, 0.20953369140625, 0.21770477294921875, 0.2258758544921875, 0.23404693603515625, 0.242218017578125, 0.25038909912109375, 0.2585601806640625, 0.26673126220703125, 0.27490234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 16.0, 18.0, 18.0, 24.0, 30.0, 40.0, 38.0, 60.0, 39.0, 57.0, 48.0, 55.0, 60.0, 60.0, 45.0, 48.0, 30.0, 42.0, 43.0, 27.0, 28.0, 25.0, 20.0, 22.0, 15.0, 19.0, 10.0, 5.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12234115600585938, -0.11785125732421875, -0.11336135864257812, -0.1088714599609375, -0.10438156127929688, -0.09989166259765625, -0.09540176391601562, -0.090911865234375, -0.08642196655273438, -0.08193206787109375, -0.07744216918945312, -0.0729522705078125, -0.06846237182617188, -0.06397247314453125, -0.059482574462890625, -0.05499267578125, -0.050502777099609375, -0.04601287841796875, -0.041522979736328125, -0.0370330810546875, -0.032543182373046875, -0.02805328369140625, -0.023563385009765625, -0.019073486328125, -0.014583587646484375, -0.01009368896484375, -0.005603790283203125, -0.0011138916015625, 0.003376007080078125, 0.00786590576171875, 0.012355804443359375, 0.016845703125, 0.021335601806640625, 0.02582550048828125, 0.030315399169921875, 0.0348052978515625, 0.039295196533203125, 0.04378509521484375, 0.048274993896484375, 0.052764892578125, 0.057254791259765625, 0.06174468994140625, 0.06623458862304688, 0.0707244873046875, 0.07521438598632812, 0.07970428466796875, 0.08419418334960938, 0.08868408203125, 0.09317398071289062, 0.09766387939453125, 0.10215377807617188, 0.1066436767578125, 0.11113357543945312, 0.11562347412109375, 0.12011337280273438, 0.124603271484375, 0.12909317016601562, 0.13358306884765625, 0.13807296752929688, 0.1425628662109375, 0.14705276489257812, 0.15154266357421875, 0.15603256225585938, 0.1605224609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 10.0, 12.0, 17.0, 14.0, 22.0, 32.0, 35.0, 61.0, 73.0, 102.0, 129.0, 185.0, 257.0, 361.0, 620.0, 1052.0, 1832.0, 3929.0, 9715.0, 32124.0, 166642.0, 702983.0, 92613.0, 21187.0, 7250.0, 3041.0, 1502.0, 903.0, 565.0, 375.0, 243.0, 167.0, 119.0, 97.0, 60.0, 60.0, 43.0, 26.0, 22.0, 17.0, 14.0, 7.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.4008979797363281, -0.38675689697265625, -0.3726158142089844, -0.3584747314453125, -0.3443336486816406, -0.33019256591796875, -0.3160514831542969, -0.301910400390625, -0.2877693176269531, -0.27362823486328125, -0.2594871520996094, -0.2453460693359375, -0.23120498657226562, -0.21706390380859375, -0.20292282104492188, -0.18878173828125, -0.17464065551757812, -0.16049957275390625, -0.14635848999023438, -0.1322174072265625, -0.11807632446289062, -0.10393524169921875, -0.08979415893554688, -0.075653076171875, -0.061511993408203125, -0.04737091064453125, -0.033229827880859375, -0.0190887451171875, -0.004947662353515625, 0.00919342041015625, 0.023334503173828125, 0.0374755859375, 0.051616668701171875, 0.06575775146484375, 0.07989883422851562, 0.0940399169921875, 0.10818099975585938, 0.12232208251953125, 0.13646316528320312, 0.150604248046875, 0.16474533081054688, 0.17888641357421875, 0.19302749633789062, 0.2071685791015625, 0.22130966186523438, 0.23545074462890625, 0.24959182739257812, 0.26373291015625, 0.2778739929199219, 0.29201507568359375, 0.3061561584472656, 0.3202972412109375, 0.3344383239746094, 0.34857940673828125, 0.3627204895019531, 0.376861572265625, 0.3910026550292969, 0.40514373779296875, 0.4192848205566406, 0.4334259033203125, 0.4475669860839844, 0.46170806884765625, 0.4758491516113281, 0.489990234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 13.0, 17.0, 11.0, 17.0, 21.0, 31.0, 35.0, 28.0, 37.0, 25.0, 39.0, 50.0, 55.0, 49.0, 53.0, 69.0, 46.0, 49.0, 36.0, 39.0, 42.0, 33.0, 31.0, 21.0, 22.0, 16.0, 16.0, 16.0, 15.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.63525390625, -0.61700439453125, -0.5987548828125, -0.58050537109375, -0.562255859375, -0.54400634765625, -0.5257568359375, -0.50750732421875, -0.4892578125, -0.47100830078125, -0.4527587890625, -0.43450927734375, -0.416259765625, -0.39801025390625, -0.3797607421875, -0.36151123046875, -0.34326171875, -0.32501220703125, -0.3067626953125, -0.28851318359375, -0.270263671875, -0.25201416015625, -0.2337646484375, -0.21551513671875, -0.197265625, -0.17901611328125, -0.1607666015625, -0.14251708984375, -0.124267578125, -0.10601806640625, -0.0877685546875, -0.06951904296875, -0.05126953125, -0.03302001953125, -0.0147705078125, 0.00347900390625, 0.021728515625, 0.03997802734375, 0.0582275390625, 0.07647705078125, 0.0947265625, 0.11297607421875, 0.1312255859375, 0.14947509765625, 0.167724609375, 0.18597412109375, 0.2042236328125, 0.22247314453125, 0.24072265625, 0.25897216796875, 0.2772216796875, 0.29547119140625, 0.313720703125, 0.33197021484375, 0.3502197265625, 0.36846923828125, 0.38671875, 0.40496826171875, 0.4232177734375, 0.44146728515625, 0.459716796875, 0.47796630859375, 0.4962158203125, 0.51446533203125, 0.53271484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 6.0, 15.0, 10.0, 22.0, 22.0, 36.0, 42.0, 80.0, 96.0, 138.0, 295.0, 454.0, 878.0, 1852.0, 4548.0, 14288.0, 57714.0, 332995.0, 540610.0, 68509.0, 16520.0, 5128.0, 1996.0, 930.0, 508.0, 322.0, 169.0, 124.0, 64.0, 48.0, 32.0, 22.0, 19.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1895751953125, -0.1838397979736328, -0.17810440063476562, -0.17236900329589844, -0.16663360595703125, -0.16089820861816406, -0.15516281127929688, -0.1494274139404297, -0.1436920166015625, -0.1379566192626953, -0.13222122192382812, -0.12648582458496094, -0.12075042724609375, -0.11501502990722656, -0.10927963256835938, -0.10354423522949219, -0.097808837890625, -0.09207344055175781, -0.08633804321289062, -0.08060264587402344, -0.07486724853515625, -0.06913185119628906, -0.06339645385742188, -0.05766105651855469, -0.0519256591796875, -0.04619026184082031, -0.040454864501953125, -0.03471946716308594, -0.02898406982421875, -0.023248672485351562, -0.017513275146484375, -0.011777877807617188, -0.00604248046875, -0.0003070831298828125, 0.005428314208984375, 0.011163711547851562, 0.01689910888671875, 0.022634506225585938, 0.028369903564453125, 0.03410530090332031, 0.0398406982421875, 0.04557609558105469, 0.051311492919921875, 0.05704689025878906, 0.06278228759765625, 0.06851768493652344, 0.07425308227539062, 0.07998847961425781, 0.085723876953125, 0.09145927429199219, 0.09719467163085938, 0.10293006896972656, 0.10866546630859375, 0.11440086364746094, 0.12013626098632812, 0.1258716583251953, 0.1316070556640625, 0.1373424530029297, 0.14307785034179688, 0.14881324768066406, 0.15454864501953125, 0.16028404235839844, 0.16601943969726562, 0.1717548370361328, 0.177490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 3.0, 13.0, 10.0, 17.0, 20.0, 32.0, 23.0, 22.0, 26.0, 44.0, 51.0, 72.0, 92.0, 81.0, 86.0, 78.0, 59.0, 49.0, 35.0, 30.0, 23.0, 16.0, 17.0, 17.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.792213439941406e-05, -4.640687257051468e-05, -4.4891610741615295e-05, -4.337634891271591e-05, -4.186108708381653e-05, -4.0345825254917145e-05, -3.883056342601776e-05, -3.731530159711838e-05, -3.5800039768218994e-05, -3.428477793931961e-05, -3.276951611042023e-05, -3.1254254281520844e-05, -2.973899245262146e-05, -2.8223730623722076e-05, -2.6708468794822693e-05, -2.519320696592331e-05, -2.3677945137023926e-05, -2.2162683308124542e-05, -2.064742147922516e-05, -1.9132159650325775e-05, -1.761689782142639e-05, -1.6101635992527008e-05, -1.4586374163627625e-05, -1.3071112334728241e-05, -1.1555850505828857e-05, -1.0040588676929474e-05, -8.52532684803009e-06, -7.010065019130707e-06, -5.494803190231323e-06, -3.97954136133194e-06, -2.464279532432556e-06, -9.490177035331726e-07, 5.662441253662109e-07, 2.0815059542655945e-06, 3.596767783164978e-06, 5.1120296120643616e-06, 6.627291440963745e-06, 8.142553269863129e-06, 9.657815098762512e-06, 1.1173076927661896e-05, 1.268833875656128e-05, 1.4203600585460663e-05, 1.5718862414360046e-05, 1.723412424325943e-05, 1.8749386072158813e-05, 2.0264647901058197e-05, 2.177990972995758e-05, 2.3295171558856964e-05, 2.4810433387756348e-05, 2.632569521665573e-05, 2.7840957045555115e-05, 2.9356218874454498e-05, 3.087148070335388e-05, 3.2386742532253265e-05, 3.390200436115265e-05, 3.541726619005203e-05, 3.6932528018951416e-05, 3.84477898478508e-05, 3.996305167675018e-05, 4.147831350564957e-05, 4.299357533454895e-05, 4.4508837163448334e-05, 4.602409899234772e-05, 4.75393608212471e-05, 4.9054622650146484e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 12.0, 7.0, 14.0, 15.0, 34.0, 49.0, 75.0, 148.0, 251.0, 530.0, 1123.0, 2807.0, 9899.0, 67518.0, 765898.0, 174414.0, 18267.0, 4308.0, 1622.0, 728.0, 358.0, 199.0, 106.0, 73.0, 46.0, 14.0, 6.0, 12.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.274658203125, -0.26696205139160156, -0.2592658996582031, -0.2515697479248047, -0.24387359619140625, -0.2361774444580078, -0.22848129272460938, -0.22078514099121094, -0.2130889892578125, -0.20539283752441406, -0.19769668579101562, -0.1900005340576172, -0.18230438232421875, -0.1746082305908203, -0.16691207885742188, -0.15921592712402344, -0.151519775390625, -0.14382362365722656, -0.13612747192382812, -0.1284313201904297, -0.12073516845703125, -0.11303901672363281, -0.10534286499023438, -0.09764671325683594, -0.0899505615234375, -0.08225440979003906, -0.07455825805664062, -0.06686210632324219, -0.05916595458984375, -0.05146980285644531, -0.043773651123046875, -0.03607749938964844, -0.02838134765625, -0.020685195922851562, -0.012989044189453125, -0.0052928924560546875, 0.00240325927734375, 0.010099411010742188, 0.017795562744140625, 0.025491714477539062, 0.0331878662109375, 0.04088401794433594, 0.048580169677734375, 0.05627632141113281, 0.06397247314453125, 0.07166862487792969, 0.07936477661132812, 0.08706092834472656, 0.094757080078125, 0.10245323181152344, 0.11014938354492188, 0.11784553527832031, 0.12554168701171875, 0.1332378387451172, 0.14093399047851562, 0.14863014221191406, 0.1563262939453125, 0.16402244567871094, 0.17171859741210938, 0.1794147491455078, 0.18711090087890625, 0.1948070526123047, 0.20250320434570312, 0.21019935607910156, 0.2178955078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 11.0, 15.0, 13.0, 16.0, 24.0, 37.0, 52.0, 49.0, 94.0, 96.0, 107.0, 92.0, 82.0, 58.0, 48.0, 54.0, 28.0, 34.0, 28.0, 13.0, 15.0, 5.0, 11.0, 7.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24586868286132812, -0.23954010009765625, -0.23321151733398438, -0.2268829345703125, -0.22055435180664062, -0.21422576904296875, -0.20789718627929688, -0.201568603515625, -0.19524002075195312, -0.18891143798828125, -0.18258285522460938, -0.1762542724609375, -0.16992568969726562, -0.16359710693359375, -0.15726852416992188, -0.15093994140625, -0.14461135864257812, -0.13828277587890625, -0.13195419311523438, -0.1256256103515625, -0.11929702758789062, -0.11296844482421875, -0.10663986206054688, -0.100311279296875, -0.09398269653320312, -0.08765411376953125, -0.08132553100585938, -0.0749969482421875, -0.06866836547851562, -0.06233978271484375, -0.056011199951171875, -0.0496826171875, -0.043354034423828125, -0.03702545166015625, -0.030696868896484375, -0.0243682861328125, -0.018039703369140625, -0.01171112060546875, -0.005382537841796875, 0.000946044921875, 0.007274627685546875, 0.01360321044921875, 0.019931793212890625, 0.0262603759765625, 0.032588958740234375, 0.03891754150390625, 0.045246124267578125, 0.05157470703125, 0.057903289794921875, 0.06423187255859375, 0.07056045532226562, 0.0768890380859375, 0.08321762084960938, 0.08954620361328125, 0.09587478637695312, 0.102203369140625, 0.10853195190429688, 0.11486053466796875, 0.12118911743164062, 0.1275177001953125, 0.13384628295898438, 0.14017486572265625, 0.14650344848632812, 0.15283203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 11.0, 54.0, 93.0, 216.0, 302.0, 139.0, 82.0, 34.0, 11.0, 14.0, 5.0, 3.0, 2.0, 1.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9421443939208984, -3.7858171463012695, -3.6294896602630615, -3.4731624126434326, -3.3168351650238037, -3.1605076789855957, -3.004180431365967, -2.847853183746338, -2.691525936126709, -2.53519868850708, -2.378871202468872, -2.222543954849243, -2.0662167072296143, -1.9098893404006958, -1.7535619735717773, -1.5972347259521484, -1.4409072399139404, -1.284579873085022, -1.128252625465393, -0.9719252586364746, -0.8155979514122009, -0.6592706441879272, -0.5029432773590088, -0.3466160297393799, -0.19028866291046143, -0.03396134078502655, 0.12236598134040833, 0.2786933183670044, 0.4350206255912781, 0.5913479328155518, 0.7476752996444702, 0.9040025472640991, 1.0603299140930176, 1.216657280921936, 1.372984528541565, 1.5293118953704834, 1.6856391429901123, 1.8419665098190308, 1.9982938766479492, 2.154621124267578, 2.310948371887207, 2.467275619506836, 2.623603105545044, 2.779930353164673, 2.9362576007843018, 3.0925850868225098, 3.2489123344421387, 3.4052395820617676, 3.5615670680999756, 3.7178943157196045, 3.8742218017578125, 4.030549049377441, 4.18687629699707, 4.343203544616699, 4.499530792236328, 4.655858039855957, 4.812185764312744, 4.968513011932373, 5.124840259552002, 5.281167984008789, 5.437495231628418, 5.593822479248047, 5.750149726867676, 5.906476974487305, 6.062804222106934]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 21.0, 17.0, 19.0, 22.0, 20.0, 21.0, 21.0, 31.0, 21.0, 23.0, 36.0, 42.0, 61.0, 66.0, 72.0, 67.0, 52.0, 38.0, 29.0, 29.0, 28.0, 33.0, 30.0, 22.0, 16.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 7.0, 7.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.110687255859375, -2.04278564453125, -1.9748839139938354, -1.906982183456421, -1.839080572128296, -1.7711788415908813, -1.7032771110534668, -1.6353754997253418, -1.5674738883972168, -1.4995721578598022, -1.4316705465316772, -1.3637688159942627, -1.2958672046661377, -1.2279654741287231, -1.1600637435913086, -1.0921621322631836, -1.024260401725769, -0.9563587307929993, -0.8884570598602295, -0.8205553293228149, -0.7526537179946899, -0.6847519874572754, -0.6168503165245056, -0.5489486455917358, -0.48104697465896606, -0.4131453037261963, -0.3452436327934265, -0.27734193205833435, -0.20944026112556458, -0.1415385901927948, -0.07363688945770264, -0.005735218524932861, 0.062166452407836914, 0.1300681233406067, 0.19796980917453766, 0.26587149500846863, 0.3337731659412384, 0.4016748368740082, 0.46957653760910034, 0.5374782085418701, 0.6053798794746399, 0.6732815504074097, 0.7411832213401794, 0.8090848922729492, 0.8769866228103638, 0.9448882341384888, 1.0127899646759033, 1.0806915760040283, 1.1485933065414429, 1.2164950370788574, 1.2843966484069824, 1.352298378944397, 1.420199990272522, 1.4881017208099365, 1.5560033321380615, 1.623905062675476, 1.6918067932128906, 1.7597085237503052, 1.8276101350784302, 1.8955118656158447, 1.9634134769439697, 2.0313150882720947, 2.099216938018799, 2.167118549346924, 2.235020160675049]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 6.0, 2.0, 6.0, 15.0, 12.0, 18.0, 22.0, 38.0, 50.0, 77.0, 111.0, 155.0, 256.0, 358.0, 487.0, 786.0, 1268.0, 2067.0, 3427.0, 6115.0, 11941.0, 26535.0, 71113.0, 251183.0, 1056670.0, 1943632.0, 586790.0, 145980.0, 45999.0, 18379.0, 8929.0, 4590.0, 2716.0, 1604.0, 966.0, 627.0, 436.0, 286.0, 188.0, 147.0, 87.0, 62.0, 42.0, 33.0, 27.0, 16.0, 7.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0], "bins": [-0.15380859375, -0.14957046508789062, -0.14533233642578125, -0.14109420776367188, -0.1368560791015625, -0.13261795043945312, -0.12837982177734375, -0.12414169311523438, -0.119903564453125, -0.11566543579101562, -0.11142730712890625, -0.10718917846679688, -0.1029510498046875, -0.09871292114257812, -0.09447479248046875, -0.09023666381835938, -0.08599853515625, -0.08176040649414062, -0.07752227783203125, -0.07328414916992188, -0.0690460205078125, -0.06480789184570312, -0.06056976318359375, -0.056331634521484375, -0.052093505859375, -0.047855377197265625, -0.04361724853515625, -0.039379119873046875, -0.0351409912109375, -0.030902862548828125, -0.02666473388671875, -0.022426605224609375, -0.0181884765625, -0.013950347900390625, -0.00971221923828125, -0.005474090576171875, -0.0012359619140625, 0.003002166748046875, 0.00724029541015625, 0.011478424072265625, 0.015716552734375, 0.019954681396484375, 0.02419281005859375, 0.028430938720703125, 0.0326690673828125, 0.036907196044921875, 0.04114532470703125, 0.045383453369140625, 0.04962158203125, 0.053859710693359375, 0.05809783935546875, 0.062335968017578125, 0.0665740966796875, 0.07081222534179688, 0.07505035400390625, 0.07928848266601562, 0.083526611328125, 0.08776473999023438, 0.09200286865234375, 0.09624099731445312, 0.1004791259765625, 0.10471725463867188, 0.10895538330078125, 0.11319351196289062, 0.117431640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 9.0, 3.0, 10.0, 12.0, 16.0, 12.0, 11.0, 22.0, 17.0, 30.0, 36.0, 40.0, 45.0, 46.0, 55.0, 75.0, 56.0, 59.0, 72.0, 47.0, 54.0, 39.0, 36.0, 33.0, 33.0, 24.0, 29.0, 16.0, 13.0, 13.0, 15.0, 13.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11724853515625, -0.11259746551513672, -0.10794639587402344, -0.10329532623291016, -0.09864425659179688, -0.0939931869506836, -0.08934211730957031, -0.08469104766845703, -0.08003997802734375, -0.07538890838623047, -0.07073783874511719, -0.0660867691040039, -0.061435699462890625, -0.056784629821777344, -0.05213356018066406, -0.04748249053955078, -0.0428314208984375, -0.03818035125732422, -0.03352928161621094, -0.028878211975097656, -0.024227142333984375, -0.019576072692871094, -0.014925003051757812, -0.010273933410644531, -0.00562286376953125, -0.0009717941284179688, 0.0036792755126953125, 0.008330345153808594, 0.012981414794921875, 0.017632484436035156, 0.022283554077148438, 0.02693462371826172, 0.031585693359375, 0.03623676300048828, 0.04088783264160156, 0.045538902282714844, 0.050189971923828125, 0.054841041564941406, 0.05949211120605469, 0.06414318084716797, 0.06879425048828125, 0.07344532012939453, 0.07809638977050781, 0.0827474594116211, 0.08739852905273438, 0.09204959869384766, 0.09670066833496094, 0.10135173797607422, 0.1060028076171875, 0.11065387725830078, 0.11530494689941406, 0.11995601654052734, 0.12460708618164062, 0.1292581558227539, 0.1339092254638672, 0.13856029510498047, 0.14321136474609375, 0.14786243438720703, 0.1525135040283203, 0.1571645736694336, 0.16181564331054688, 0.16646671295166016, 0.17111778259277344, 0.17576885223388672, 0.180419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 13.0, 11.0, 26.0, 52.0, 75.0, 153.0, 294.0, 909.0, 3242.0, 16298.0, 193329.0, 3755111.0, 204587.0, 15798.0, 2954.0, 821.0, 307.0, 121.0, 67.0, 44.0, 23.0, 18.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.58984375, -0.57275390625, -0.5556640625, -0.53857421875, -0.521484375, -0.50439453125, -0.4873046875, -0.47021484375, -0.453125, -0.43603515625, -0.4189453125, -0.40185546875, -0.384765625, -0.36767578125, -0.3505859375, -0.33349609375, -0.31640625, -0.29931640625, -0.2822265625, -0.26513671875, -0.248046875, -0.23095703125, -0.2138671875, -0.19677734375, -0.1796875, -0.16259765625, -0.1455078125, -0.12841796875, -0.111328125, -0.09423828125, -0.0771484375, -0.06005859375, -0.04296875, -0.02587890625, -0.0087890625, 0.00830078125, 0.025390625, 0.04248046875, 0.0595703125, 0.07666015625, 0.09375, 0.11083984375, 0.1279296875, 0.14501953125, 0.162109375, 0.17919921875, 0.1962890625, 0.21337890625, 0.23046875, 0.24755859375, 0.2646484375, 0.28173828125, 0.298828125, 0.31591796875, 0.3330078125, 0.35009765625, 0.3671875, 0.38427734375, 0.4013671875, 0.41845703125, 0.435546875, 0.45263671875, 0.4697265625, 0.48681640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 3.0, 11.0, 6.0, 9.0, 9.0, 20.0, 27.0, 29.0, 38.0, 39.0, 70.0, 118.0, 154.0, 224.0, 358.0, 562.0, 682.0, 558.0, 400.0, 236.0, 165.0, 89.0, 80.0, 50.0, 28.0, 30.0, 17.0, 9.0, 15.0, 8.0, 11.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.26811981201171875, -0.2584075927734375, -0.24869537353515625, -0.238983154296875, -0.22927093505859375, -0.2195587158203125, -0.20984649658203125, -0.20013427734375, -0.19042205810546875, -0.1807098388671875, -0.17099761962890625, -0.161285400390625, -0.15157318115234375, -0.1418609619140625, -0.13214874267578125, -0.1224365234375, -0.11272430419921875, -0.1030120849609375, -0.09329986572265625, -0.083587646484375, -0.07387542724609375, -0.0641632080078125, -0.05445098876953125, -0.04473876953125, -0.03502655029296875, -0.0253143310546875, -0.01560211181640625, -0.005889892578125, 0.00382232666015625, 0.0135345458984375, 0.02324676513671875, 0.032958984375, 0.04267120361328125, 0.0523834228515625, 0.06209564208984375, 0.071807861328125, 0.08152008056640625, 0.0912322998046875, 0.10094451904296875, 0.11065673828125, 0.12036895751953125, 0.1300811767578125, 0.13979339599609375, 0.149505615234375, 0.15921783447265625, 0.1689300537109375, 0.17864227294921875, 0.1883544921875, 0.19806671142578125, 0.2077789306640625, 0.21749114990234375, 0.227203369140625, 0.23691558837890625, 0.2466278076171875, 0.25634002685546875, 0.26605224609375, 0.27576446533203125, 0.2854766845703125, 0.29518890380859375, 0.304901123046875, 0.31461334228515625, 0.3243255615234375, 0.33403778076171875, 0.34375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 12.0, 29.0, 51.0, 129.0, 235.0, 273.0, 154.0, 60.0, 22.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.281395435333252, -7.127960205078125, -6.97452449798584, -6.821089267730713, -6.667653560638428, -6.514218330383301, -6.360782623291016, -6.207347393035889, -6.053912162780762, -5.900476932525635, -5.74704122543335, -5.593605995178223, -5.4401702880859375, -5.2867350578308105, -5.133299350738525, -4.979864120483398, -4.826428413391113, -4.672993183135986, -4.519557476043701, -4.366122245788574, -4.212686538696289, -4.059251308441162, -3.905815839767456, -3.75238037109375, -3.598944902420044, -3.445509433746338, -3.292073965072632, -3.138638496398926, -2.985203266143799, -2.8317675590515137, -2.6783323287963867, -2.5248968601226807, -2.371461868286133, -2.2180263996124268, -2.0645909309387207, -1.9111555814743042, -1.7577201128005981, -1.604284644126892, -1.4508492946624756, -1.2974138259887695, -1.1439783573150635, -0.9905428886413574, -0.8371074795722961, -0.6836720705032349, -0.5302366018295288, -0.37680113315582275, -0.22336572408676147, -0.0699303150177002, 0.08350515365600586, 0.23694059252738953, 0.3903760313987732, 0.5438114404678345, 0.6972469091415405, 0.8506823778152466, 1.004117727279663, 1.1575531959533691, 1.3109886646270752, 1.4644241333007812, 1.6178596019744873, 1.7712949514389038, 1.9247304201126099, 2.0781660079956055, 2.2316012382507324, 2.3850367069244385, 2.5384721755981445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 10.0, 16.0, 18.0, 10.0, 18.0, 19.0, 25.0, 30.0, 31.0, 34.0, 39.0, 42.0, 37.0, 39.0, 36.0, 48.0, 45.0, 30.0, 46.0, 35.0, 47.0, 39.0, 32.0, 30.0, 24.0, 20.0, 31.0, 20.0, 26.0, 18.0, 22.0, 12.0, 16.0, 7.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2125723361968994, -1.1690690517425537, -1.1255658864974976, -1.0820626020431519, -1.0385594367980957, -0.99505615234375, -0.9515529274940491, -0.9080497026443481, -0.8645464777946472, -0.8210432529449463, -0.7775400280952454, -0.7340368032455444, -0.6905335187911987, -0.6470303535461426, -0.6035270690917969, -0.560023844242096, -0.516520619392395, -0.4730173945426941, -0.42951416969299316, -0.38601091504096985, -0.3425076901912689, -0.299004465341568, -0.2555012106895447, -0.21199798583984375, -0.16849476099014282, -0.1249915286898613, -0.08148829638957977, -0.03798505663871765, 0.005518168210983276, 0.049021393060684204, 0.09252464771270752, 0.13602787256240845, 0.17953097820281982, 0.22303420305252075, 0.2665374279022217, 0.310040682554245, 0.3535439074039459, 0.39704713225364685, 0.44055038690567017, 0.4840536117553711, 0.527556836605072, 0.571060061454773, 0.6145632863044739, 0.6580665111541748, 0.7015697956085205, 0.7450729608535767, 0.7885762453079224, 0.8320794701576233, 0.8755826950073242, 0.9190859198570251, 0.9625891447067261, 1.0060924291610718, 1.049595594406128, 1.0930988788604736, 1.1366021633148193, 1.1801053285598755, 1.2236084938049316, 1.2671117782592773, 1.3106149435043335, 1.3541182279586792, 1.3976213932037354, 1.441124677658081, 1.4846279621124268, 1.528131127357483, 1.5716344118118286]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 12.0, 7.0, 10.0, 25.0, 39.0, 39.0, 72.0, 100.0, 164.0, 265.0, 371.0, 725.0, 1342.0, 2562.0, 5363.0, 12978.0, 34533.0, 112433.0, 351184.0, 353834.0, 113225.0, 35234.0, 12751.0, 5577.0, 2580.0, 1275.0, 740.0, 418.0, 254.0, 150.0, 95.0, 70.0, 44.0, 17.0, 22.0, 21.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17444801330566406, -0.16798782348632812, -0.1615276336669922, -0.15506744384765625, -0.1486072540283203, -0.14214706420898438, -0.13568687438964844, -0.1292266845703125, -0.12276649475097656, -0.11630630493164062, -0.10984611511230469, -0.10338592529296875, -0.09692573547363281, -0.09046554565429688, -0.08400535583496094, -0.077545166015625, -0.07108497619628906, -0.06462478637695312, -0.05816459655761719, -0.05170440673828125, -0.04524421691894531, -0.038784027099609375, -0.03232383728027344, -0.0258636474609375, -0.019403457641601562, -0.012943267822265625, -0.0064830780029296875, -2.288818359375e-05, 0.0064373016357421875, 0.012897491455078125, 0.019357681274414062, 0.02581787109375, 0.03227806091308594, 0.038738250732421875, 0.04519844055175781, 0.05165863037109375, 0.05811882019042969, 0.06457901000976562, 0.07103919982910156, 0.0774993896484375, 0.08395957946777344, 0.09041976928710938, 0.09687995910644531, 0.10334014892578125, 0.10980033874511719, 0.11626052856445312, 0.12272071838378906, 0.129180908203125, 0.13564109802246094, 0.14210128784179688, 0.1485614776611328, 0.15502166748046875, 0.1614818572998047, 0.16794204711914062, 0.17440223693847656, 0.1808624267578125, 0.18732261657714844, 0.19378280639648438, 0.2002429962158203, 0.20670318603515625, 0.2131633758544922, 0.21962356567382812, 0.22608375549316406, 0.2325439453125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 7.0, 10.0, 17.0, 23.0, 15.0, 29.0, 21.0, 42.0, 48.0, 29.0, 45.0, 52.0, 58.0, 70.0, 52.0, 51.0, 46.0, 44.0, 36.0, 33.0, 50.0, 35.0, 30.0, 29.0, 23.0, 24.0, 17.0, 13.0, 12.0, 8.0, 6.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12353515625, -0.11874961853027344, -0.11396408081054688, -0.10917854309082031, -0.10439300537109375, -0.09960746765136719, -0.09482192993164062, -0.09003639221191406, -0.0852508544921875, -0.08046531677246094, -0.07567977905273438, -0.07089424133300781, -0.06610870361328125, -0.06132316589355469, -0.056537628173828125, -0.05175209045410156, -0.046966552734375, -0.04218101501464844, -0.037395477294921875, -0.03260993957519531, -0.02782440185546875, -0.023038864135742188, -0.018253326416015625, -0.013467788696289062, -0.0086822509765625, -0.0038967132568359375, 0.000888824462890625, 0.0056743621826171875, 0.01045989990234375, 0.015245437622070312, 0.020030975341796875, 0.024816513061523438, 0.02960205078125, 0.03438758850097656, 0.039173126220703125, 0.04395866394042969, 0.04874420166015625, 0.05352973937988281, 0.058315277099609375, 0.06310081481933594, 0.0678863525390625, 0.07267189025878906, 0.07745742797851562, 0.08224296569824219, 0.08702850341796875, 0.09181404113769531, 0.09659957885742188, 0.10138511657714844, 0.106170654296875, 0.11095619201660156, 0.11574172973632812, 0.12052726745605469, 0.12531280517578125, 0.1300983428955078, 0.13488388061523438, 0.13966941833496094, 0.1444549560546875, 0.14924049377441406, 0.15402603149414062, 0.1588115692138672, 0.16359710693359375, 0.1683826446533203, 0.17316818237304688, 0.17795372009277344, 0.1827392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 10.0, 11.0, 7.0, 10.0, 15.0, 19.0, 32.0, 41.0, 52.0, 102.0, 180.0, 232.0, 474.0, 916.0, 2150.0, 6616.0, 27152.0, 191785.0, 701539.0, 93598.0, 15810.0, 4303.0, 1684.0, 796.0, 379.0, 197.0, 139.0, 81.0, 44.0, 42.0, 25.0, 25.0, 17.0, 18.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3359565734863281, -0.32523345947265625, -0.3145103454589844, -0.3037872314453125, -0.2930641174316406, -0.28234100341796875, -0.2716178894042969, -0.260894775390625, -0.2501716613769531, -0.23944854736328125, -0.22872543334960938, -0.2180023193359375, -0.20727920532226562, -0.19655609130859375, -0.18583297729492188, -0.17510986328125, -0.16438674926757812, -0.15366363525390625, -0.14294052124023438, -0.1322174072265625, -0.12149429321289062, -0.11077117919921875, -0.10004806518554688, -0.089324951171875, -0.07860183715820312, -0.06787872314453125, -0.057155609130859375, -0.0464324951171875, -0.035709381103515625, -0.02498626708984375, -0.014263153076171875, -0.0035400390625, 0.007183074951171875, 0.01790618896484375, 0.028629302978515625, 0.0393524169921875, 0.050075531005859375, 0.06079864501953125, 0.07152175903320312, 0.082244873046875, 0.09296798706054688, 0.10369110107421875, 0.11441421508789062, 0.1251373291015625, 0.13586044311523438, 0.14658355712890625, 0.15730667114257812, 0.16802978515625, 0.17875289916992188, 0.18947601318359375, 0.20019912719726562, 0.2109222412109375, 0.22164535522460938, 0.23236846923828125, 0.24309158325195312, 0.253814697265625, 0.2645378112792969, 0.27526092529296875, 0.2859840393066406, 0.2967071533203125, 0.3074302673339844, 0.31815338134765625, 0.3288764953613281, 0.339599609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 5.0, 12.0, 17.0, 23.0, 32.0, 36.0, 55.0, 66.0, 53.0, 64.0, 71.0, 71.0, 56.0, 65.0, 56.0, 48.0, 57.0, 40.0, 39.0, 25.0, 31.0, 16.0, 11.0, 8.0, 13.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6650238037109375, -0.642059326171875, -0.6190948486328125, -0.59613037109375, -0.5731658935546875, -0.550201416015625, -0.5272369384765625, -0.5042724609375, -0.4813079833984375, -0.458343505859375, -0.4353790283203125, -0.41241455078125, -0.3894500732421875, -0.366485595703125, -0.3435211181640625, -0.320556640625, -0.2975921630859375, -0.274627685546875, -0.2516632080078125, -0.22869873046875, -0.2057342529296875, -0.182769775390625, -0.1598052978515625, -0.1368408203125, -0.1138763427734375, -0.090911865234375, -0.0679473876953125, -0.04498291015625, -0.0220184326171875, 0.000946044921875, 0.0239105224609375, 0.046875, 0.0698394775390625, 0.092803955078125, 0.1157684326171875, 0.13873291015625, 0.1616973876953125, 0.184661865234375, 0.2076263427734375, 0.2305908203125, 0.2535552978515625, 0.276519775390625, 0.2994842529296875, 0.32244873046875, 0.3454132080078125, 0.368377685546875, 0.3913421630859375, 0.414306640625, 0.4372711181640625, 0.460235595703125, 0.4832000732421875, 0.50616455078125, 0.5291290283203125, 0.552093505859375, 0.5750579833984375, 0.5980224609375, 0.6209869384765625, 0.643951416015625, 0.6669158935546875, 0.68988037109375, 0.7128448486328125, 0.735809326171875, 0.7587738037109375, 0.78173828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 17.0, 10.0, 25.0, 35.0, 54.0, 92.0, 183.0, 309.0, 589.0, 1342.0, 3235.0, 9808.0, 39119.0, 229742.0, 649985.0, 86234.0, 18584.0, 5380.0, 1969.0, 894.0, 375.0, 237.0, 127.0, 75.0, 44.0, 23.0, 22.0, 16.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.1531085968017578, -0.14850234985351562, -0.14389610290527344, -0.13928985595703125, -0.13468360900878906, -0.13007736206054688, -0.1254711151123047, -0.1208648681640625, -0.11625862121582031, -0.11165237426757812, -0.10704612731933594, -0.10243988037109375, -0.09783363342285156, -0.09322738647460938, -0.08862113952636719, -0.084014892578125, -0.07940864562988281, -0.07480239868164062, -0.07019615173339844, -0.06558990478515625, -0.06098365783691406, -0.056377410888671875, -0.05177116394042969, -0.0471649169921875, -0.04255867004394531, -0.037952423095703125, -0.03334617614746094, -0.02873992919921875, -0.024133682250976562, -0.019527435302734375, -0.014921188354492188, -0.01031494140625, -0.0057086944580078125, -0.001102447509765625, 0.0035037994384765625, 0.00811004638671875, 0.012716293334960938, 0.017322540283203125, 0.021928787231445312, 0.0265350341796875, 0.031141281127929688, 0.035747528076171875, 0.04035377502441406, 0.04496002197265625, 0.04956626892089844, 0.054172515869140625, 0.05877876281738281, 0.063385009765625, 0.06799125671386719, 0.07259750366210938, 0.07720375061035156, 0.08180999755859375, 0.08641624450683594, 0.09102249145507812, 0.09562873840332031, 0.1002349853515625, 0.10484123229980469, 0.10944747924804688, 0.11405372619628906, 0.11865997314453125, 0.12326622009277344, 0.12787246704101562, 0.1324787139892578, 0.1370849609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 7.0, 8.0, 12.0, 7.0, 15.0, 23.0, 23.0, 42.0, 55.0, 67.0, 102.0, 104.0, 103.0, 103.0, 74.0, 74.0, 47.0, 28.0, 25.0, 17.0, 22.0, 16.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.13060188293457e-05, -3.999192267656326e-05, -3.867782652378082e-05, -3.736373037099838e-05, -3.604963421821594e-05, -3.47355380654335e-05, -3.342144191265106e-05, -3.210734575986862e-05, -3.079324960708618e-05, -2.947915345430374e-05, -2.81650573015213e-05, -2.685096114873886e-05, -2.553686499595642e-05, -2.422276884317398e-05, -2.290867269039154e-05, -2.15945765376091e-05, -2.028048038482666e-05, -1.896638423204422e-05, -1.765228807926178e-05, -1.633819192647934e-05, -1.50240957736969e-05, -1.370999962091446e-05, -1.2395903468132019e-05, -1.1081807315349579e-05, -9.767711162567139e-06, -8.453615009784698e-06, -7.139518857002258e-06, -5.825422704219818e-06, -4.511326551437378e-06, -3.1972303986549377e-06, -1.8831342458724976e-06, -5.690380930900574e-07, 7.450580596923828e-07, 2.059154212474823e-06, 3.373250365257263e-06, 4.687346518039703e-06, 6.0014426708221436e-06, 7.315538823604584e-06, 8.629634976387024e-06, 9.943731129169464e-06, 1.1257827281951904e-05, 1.2571923434734344e-05, 1.3886019587516785e-05, 1.5200115740299225e-05, 1.6514211893081665e-05, 1.7828308045864105e-05, 1.9142404198646545e-05, 2.0456500351428986e-05, 2.1770596504211426e-05, 2.3084692656993866e-05, 2.4398788809776306e-05, 2.5712884962558746e-05, 2.7026981115341187e-05, 2.8341077268123627e-05, 2.9655173420906067e-05, 3.096926957368851e-05, 3.228336572647095e-05, 3.359746187925339e-05, 3.491155803203583e-05, 3.622565418481827e-05, 3.753975033760071e-05, 3.885384649038315e-05, 4.016794264316559e-05, 4.148203879594803e-05, 4.279613494873047e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 9.0, 20.0, 27.0, 38.0, 58.0, 102.0, 186.0, 327.0, 661.0, 1336.0, 3280.0, 10837.0, 54130.0, 529903.0, 381067.0, 50328.0, 10320.0, 3151.0, 1315.0, 625.0, 323.0, 197.0, 114.0, 69.0, 36.0, 28.0, 13.0, 12.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.1150503158569336, -0.11004447937011719, -0.10503864288330078, -0.10003280639648438, -0.09502696990966797, -0.09002113342285156, -0.08501529693603516, -0.08000946044921875, -0.07500362396240234, -0.06999778747558594, -0.06499195098876953, -0.059986114501953125, -0.05498027801513672, -0.04997444152832031, -0.044968605041503906, -0.0399627685546875, -0.034956932067871094, -0.029951095581054688, -0.02494525909423828, -0.019939422607421875, -0.014933586120605469, -0.009927749633789062, -0.004921913146972656, 8.392333984375e-05, 0.005089759826660156, 0.010095596313476562, 0.015101432800292969, 0.020107269287109375, 0.02511310577392578, 0.030118942260742188, 0.035124778747558594, 0.040130615234375, 0.045136451721191406, 0.05014228820800781, 0.05514812469482422, 0.060153961181640625, 0.06515979766845703, 0.07016563415527344, 0.07517147064208984, 0.08017730712890625, 0.08518314361572266, 0.09018898010253906, 0.09519481658935547, 0.10020065307617188, 0.10520648956298828, 0.11021232604980469, 0.1152181625366211, 0.1202239990234375, 0.1252298355102539, 0.1302356719970703, 0.13524150848388672, 0.14024734497070312, 0.14525318145751953, 0.15025901794433594, 0.15526485443115234, 0.16027069091796875, 0.16527652740478516, 0.17028236389160156, 0.17528820037841797, 0.18029403686523438, 0.18529987335205078, 0.1903057098388672, 0.1953115463256836, 0.2003173828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 18.0, 28.0, 43.0, 62.0, 77.0, 90.0, 102.0, 106.0, 97.0, 76.0, 69.0, 52.0, 46.0, 27.0, 20.0, 13.0, 12.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13680076599121094, -0.13138961791992188, -0.1259784698486328, -0.12056732177734375, -0.11515617370605469, -0.10974502563476562, -0.10433387756347656, -0.0989227294921875, -0.09351158142089844, -0.08810043334960938, -0.08268928527832031, -0.07727813720703125, -0.07186698913574219, -0.06645584106445312, -0.06104469299316406, -0.055633544921875, -0.05022239685058594, -0.044811248779296875, -0.03940010070800781, -0.03398895263671875, -0.028577804565429688, -0.023166656494140625, -0.017755508422851562, -0.0123443603515625, -0.0069332122802734375, -0.001522064208984375, 0.0038890838623046875, 0.00930023193359375, 0.014711380004882812, 0.020122528076171875, 0.025533676147460938, 0.03094482421875, 0.03635597229003906, 0.041767120361328125, 0.04717826843261719, 0.05258941650390625, 0.05800056457519531, 0.06341171264648438, 0.06882286071777344, 0.0742340087890625, 0.07964515686035156, 0.08505630493164062, 0.09046745300292969, 0.09587860107421875, 0.10128974914550781, 0.10670089721679688, 0.11211204528808594, 0.117523193359375, 0.12293434143066406, 0.12834548950195312, 0.1337566375732422, 0.13916778564453125, 0.1445789337158203, 0.14999008178710938, 0.15540122985839844, 0.1608123779296875, 0.16622352600097656, 0.17163467407226562, 0.1770458221435547, 0.18245697021484375, 0.1878681182861328, 0.19327926635742188, 0.19869041442871094, 0.2041015625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 15.0, 53.0, 138.0, 368.0, 226.0, 98.0, 42.0, 22.0, 11.0, 3.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.138543128967285, -4.003957271575928, -3.869371175765991, -3.7347850799560547, -3.6001992225646973, -3.4656131267547607, -3.331027030944824, -3.196441173553467, -3.0618550777435303, -2.9272689819335938, -2.7926831245422363, -2.6580970287323, -2.5235109329223633, -2.388925075531006, -2.2543389797210693, -2.119752883911133, -1.9851670265197754, -1.8505810499191284, -1.7159950733184814, -1.581408977508545, -1.446823000907898, -1.312237024307251, -1.1776509284973145, -1.0430649518966675, -0.9084789752960205, -0.7738929986953735, -0.6393069624900818, -0.50472092628479, -0.37013494968414307, -0.2355489730834961, -0.10096293687820435, 0.0336230993270874, 0.16820955276489258, 0.30279555916786194, 0.4373815655708313, 0.571967601776123, 0.70655357837677, 0.841139554977417, 0.9757255911827087, 1.1103116273880005, 1.2448976039886475, 1.3794835805892944, 1.5140695571899414, 1.648655652999878, 1.783241629600525, 1.9178276062011719, 2.0524137020111084, 2.186999797821045, 2.3215856552124023, 2.456171751022339, 2.5907576084136963, 2.725343704223633, 2.8599295616149902, 2.9945156574249268, 3.1291017532348633, 3.2636876106262207, 3.3982737064361572, 3.5328598022460938, 3.667445659637451, 3.8020317554473877, 3.936617851257324, 4.071203708648682, 4.205789566040039, 4.340375900268555, 4.474961757659912]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 2.0, 7.0, 11.0, 9.0, 6.0, 18.0, 18.0, 6.0, 22.0, 18.0, 15.0, 18.0, 21.0, 25.0, 27.0, 34.0, 41.0, 58.0, 57.0, 69.0, 82.0, 69.0, 38.0, 29.0, 41.0, 23.0, 36.0, 27.0, 17.0, 20.0, 25.0, 13.0, 8.0, 12.0, 14.0, 10.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6017582416534424, -1.5445072650909424, -1.4872561693191528, -1.4300051927566528, -1.3727542161941528, -1.3155031204223633, -1.2582521438598633, -1.2010011672973633, -1.1437501907348633, -1.0864992141723633, -1.0292481184005737, -0.9719971418380737, -0.9147461652755737, -0.857495129108429, -0.8002440929412842, -0.7429931163787842, -0.6857420802116394, -0.6284910440444946, -0.5712400674819946, -0.5139890313148499, -0.45673805475234985, -0.3994870185852051, -0.3422360122203827, -0.2849850058555603, -0.22773399949073792, -0.17048299312591553, -0.11323197931051254, -0.05598096549510956, 0.0012700408697128296, 0.05852106213569641, 0.1157720685005188, 0.1730230748653412, 0.23027408123016357, 0.28752508759498596, 0.34477609395980835, 0.4020271301269531, 0.4592781066894531, 0.5165291428565979, 0.5737801790237427, 0.6310311555862427, 0.6882821321487427, 0.7455331683158875, 0.8027841448783875, 0.8600351810455322, 0.9172861576080322, 0.974537193775177, 1.0317882299423218, 1.0890392065048218, 1.1462903022766113, 1.2035412788391113, 1.2607923746109009, 1.3180433511734009, 1.3752943277359009, 1.4325454235076904, 1.4897964000701904, 1.5470473766326904, 1.6042983531951904, 1.6615493297576904, 1.71880042552948, 1.77605140209198, 1.83330237865448, 1.8905534744262695, 1.9478044509887695, 2.0050554275512695, 2.0623064041137695]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 5.0, 12.0, 24.0, 31.0, 32.0, 69.0, 108.0, 172.0, 280.0, 438.0, 675.0, 1161.0, 1893.0, 3447.0, 6629.0, 13700.0, 33753.0, 103302.0, 402006.0, 1646387.0, 1482275.0, 350428.0, 91498.0, 29836.0, 12356.0, 5959.0, 3134.0, 1875.0, 1073.0, 653.0, 408.0, 267.0, 150.0, 69.0, 59.0, 35.0, 27.0, 18.0, 14.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14013671875, -0.13600921630859375, -0.1318817138671875, -0.12775421142578125, -0.123626708984375, -0.11949920654296875, -0.1153717041015625, -0.11124420166015625, -0.10711669921875, -0.10298919677734375, -0.0988616943359375, -0.09473419189453125, -0.090606689453125, -0.08647918701171875, -0.0823516845703125, -0.07822418212890625, -0.0740966796875, -0.06996917724609375, -0.0658416748046875, -0.06171417236328125, -0.057586669921875, -0.05345916748046875, -0.0493316650390625, -0.04520416259765625, -0.04107666015625, -0.03694915771484375, -0.0328216552734375, -0.02869415283203125, -0.024566650390625, -0.02043914794921875, -0.0163116455078125, -0.01218414306640625, -0.008056640625, -0.00392913818359375, 0.0001983642578125, 0.00432586669921875, 0.008453369140625, 0.01258087158203125, 0.0167083740234375, 0.02083587646484375, 0.02496337890625, 0.02909088134765625, 0.0332183837890625, 0.03734588623046875, 0.041473388671875, 0.04560089111328125, 0.0497283935546875, 0.05385589599609375, 0.0579833984375, 0.06211090087890625, 0.0662384033203125, 0.07036590576171875, 0.074493408203125, 0.07862091064453125, 0.0827484130859375, 0.08687591552734375, 0.09100341796875, 0.09513092041015625, 0.0992584228515625, 0.10338592529296875, 0.107513427734375, 0.11164093017578125, 0.1157684326171875, 0.11989593505859375, 0.1240234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 5.0, 7.0, 11.0, 14.0, 20.0, 23.0, 29.0, 22.0, 38.0, 36.0, 63.0, 51.0, 60.0, 61.0, 54.0, 53.0, 62.0, 59.0, 50.0, 51.0, 45.0, 35.0, 37.0, 22.0, 18.0, 18.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.123931884765625, -0.11895751953125, -0.113983154296875, -0.1090087890625, -0.104034423828125, -0.09906005859375, -0.094085693359375, -0.089111328125, -0.084136962890625, -0.07916259765625, -0.074188232421875, -0.0692138671875, -0.064239501953125, -0.05926513671875, -0.054290771484375, -0.04931640625, -0.044342041015625, -0.03936767578125, -0.034393310546875, -0.0294189453125, -0.024444580078125, -0.01947021484375, -0.014495849609375, -0.009521484375, -0.004547119140625, 0.00042724609375, 0.005401611328125, 0.0103759765625, 0.015350341796875, 0.02032470703125, 0.025299072265625, 0.0302734375, 0.035247802734375, 0.04022216796875, 0.045196533203125, 0.0501708984375, 0.055145263671875, 0.06011962890625, 0.065093994140625, 0.070068359375, 0.075042724609375, 0.08001708984375, 0.084991455078125, 0.0899658203125, 0.094940185546875, 0.09991455078125, 0.104888916015625, 0.10986328125, 0.114837646484375, 0.11981201171875, 0.124786376953125, 0.1297607421875, 0.134735107421875, 0.13970947265625, 0.144683837890625, 0.149658203125, 0.154632568359375, 0.15960693359375, 0.164581298828125, 0.1695556640625, 0.174530029296875, 0.17950439453125, 0.184478759765625, 0.189453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 10.0, 14.0, 15.0, 28.0, 38.0, 43.0, 70.0, 129.0, 333.0, 940.0, 3906.0, 24059.0, 455195.0, 3603635.0, 92717.0, 10125.0, 1950.0, 569.0, 226.0, 105.0, 52.0, 42.0, 16.0, 21.0, 14.0, 11.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.3677482604980469, -0.35195159912109375, -0.3361549377441406, -0.3203582763671875, -0.3045616149902344, -0.28876495361328125, -0.2729682922363281, -0.257171630859375, -0.24137496948242188, -0.22557830810546875, -0.20978164672851562, -0.1939849853515625, -0.17818832397460938, -0.16239166259765625, -0.14659500122070312, -0.13079833984375, -0.11500167846679688, -0.09920501708984375, -0.08340835571289062, -0.0676116943359375, -0.051815032958984375, -0.03601837158203125, -0.020221710205078125, -0.004425048828125, 0.011371612548828125, 0.02716827392578125, 0.042964935302734375, 0.0587615966796875, 0.07455825805664062, 0.09035491943359375, 0.10615158081054688, 0.1219482421875, 0.13774490356445312, 0.15354156494140625, 0.16933822631835938, 0.1851348876953125, 0.20093154907226562, 0.21672821044921875, 0.23252487182617188, 0.248321533203125, 0.2641181945800781, 0.27991485595703125, 0.2957115173339844, 0.3115081787109375, 0.3273048400878906, 0.34310150146484375, 0.3588981628417969, 0.37469482421875, 0.3904914855957031, 0.40628814697265625, 0.4220848083496094, 0.4378814697265625, 0.4536781311035156, 0.46947479248046875, 0.4852714538574219, 0.501068115234375, 0.5168647766113281, 0.5326614379882812, 0.5484580993652344, 0.5642547607421875, 0.5800514221191406, 0.5958480834960938, 0.6116447448730469, 0.62744140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 6.0, 12.0, 10.0, 19.0, 19.0, 32.0, 42.0, 58.0, 100.0, 171.0, 275.0, 437.0, 746.0, 810.0, 524.0, 287.0, 167.0, 104.0, 64.0, 41.0, 34.0, 33.0, 17.0, 10.0, 10.0, 13.0, 5.0, 7.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3810615539550781, -0.37052154541015625, -0.3599815368652344, -0.3494415283203125, -0.3389015197753906, -0.32836151123046875, -0.3178215026855469, -0.307281494140625, -0.2967414855957031, -0.28620147705078125, -0.2756614685058594, -0.2651214599609375, -0.2545814514160156, -0.24404144287109375, -0.23350143432617188, -0.22296142578125, -0.21242141723632812, -0.20188140869140625, -0.19134140014648438, -0.1808013916015625, -0.17026138305664062, -0.15972137451171875, -0.14918136596679688, -0.138641357421875, -0.12810134887695312, -0.11756134033203125, -0.10702133178710938, -0.0964813232421875, -0.08594131469726562, -0.07540130615234375, -0.06486129760742188, -0.0543212890625, -0.043781280517578125, -0.03324127197265625, -0.022701263427734375, -0.0121612548828125, -0.001621246337890625, 0.00891876220703125, 0.019458770751953125, 0.029998779296875, 0.040538787841796875, 0.05107879638671875, 0.061618804931640625, 0.0721588134765625, 0.08269882202148438, 0.09323883056640625, 0.10377883911132812, 0.11431884765625, 0.12485885620117188, 0.13539886474609375, 0.14593887329101562, 0.1564788818359375, 0.16701889038085938, 0.17755889892578125, 0.18809890747070312, 0.198638916015625, 0.20917892456054688, 0.21971893310546875, 0.23025894165039062, 0.2407989501953125, 0.2513389587402344, 0.26187896728515625, 0.2724189758300781, 0.282958984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 3.0, 10.0, 24.0, 64.0, 145.0, 249.0, 246.0, 146.0, 69.0, 27.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0440897941589355, -4.911666393280029, -4.779242515563965, -4.646819114685059, -4.514395236968994, -4.381971836090088, -4.249547958374023, -4.117124557495117, -3.984700918197632, -3.8522772789001465, -3.719853639602661, -3.587430000305176, -3.4550065994262695, -3.322582721710205, -3.190159320831299, -3.0577356815338135, -2.925312042236328, -2.7928884029388428, -2.6604647636413574, -2.528041124343872, -2.3956174850463867, -2.2631940841674805, -2.130770444869995, -1.9983468055725098, -1.8659231662750244, -1.733499526977539, -1.6010758876800537, -1.468652367591858, -1.3362287282943726, -1.2038050889968872, -1.0713815689086914, -0.938957929611206, -0.8065338134765625, -0.6741101741790771, -0.5416865944862366, -0.4092629849910736, -0.27683937549591064, -0.1444157361984253, -0.011992156505584717, 0.12043142318725586, 0.2528550624847412, 0.3852786719799042, 0.5177022814750671, 0.6501258611679077, 0.7825495004653931, 0.9149731397628784, 1.0473966598510742, 1.1798202991485596, 1.312243938446045, 1.4446675777435303, 1.5770912170410156, 1.7095147371292114, 1.8419383764266968, 1.9743620157241821, 2.106785535812378, 2.2392091751098633, 2.3716328144073486, 2.504056453704834, 2.6364800930023193, 2.7689037322998047, 2.901327133178711, 3.0337510108947754, 3.1661744117736816, 3.298598051071167, 3.4310216903686523]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 6.0, 8.0, 9.0, 17.0, 17.0, 15.0, 25.0, 34.0, 31.0, 37.0, 46.0, 47.0, 49.0, 33.0, 54.0, 46.0, 53.0, 44.0, 46.0, 44.0, 52.0, 53.0, 33.0, 30.0, 29.0, 30.0, 25.0, 16.0, 16.0, 13.0, 6.0, 4.0, 2.0, 4.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3673722743988037, -1.3215018510818481, -1.2756314277648926, -1.229761004447937, -1.1838905811309814, -1.1380200386047363, -1.0921496152877808, -1.0462791919708252, -1.0004087686538696, -0.9545383453369141, -0.9086679220199585, -0.8627974390983582, -0.8169270157814026, -0.771056592464447, -0.7251861095428467, -0.6793156862258911, -0.6334452629089355, -0.58757483959198, -0.5417044162750244, -0.4958339333534241, -0.4499635100364685, -0.40409308671951294, -0.358222633600235, -0.31235218048095703, -0.26648175716400146, -0.2206113189458847, -0.17474088072776794, -0.12887044250965118, -0.08300000429153442, -0.037129566073417664, 0.008740872144699097, 0.05461132526397705, 0.10048174858093262, 0.14635218679904938, 0.19222262501716614, 0.2380930632352829, 0.28396350145339966, 0.3298339247703552, 0.3757043778896332, 0.42157483100891113, 0.4674452543258667, 0.5133156776428223, 0.5591861009597778, 0.6050565838813782, 0.6509270071983337, 0.6967974305152893, 0.7426679134368896, 0.7885383367538452, 0.8344087600708008, 0.8802791833877563, 0.9261496067047119, 0.9720200896263123, 1.017890453338623, 1.0637609958648682, 1.1096314191818237, 1.1555018424987793, 1.2013722658157349, 1.2472426891326904, 1.293113112449646, 1.3389835357666016, 1.3848540782928467, 1.4307245016098022, 1.4765949249267578, 1.5224653482437134, 1.568335771560669]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 16.0, 13.0, 24.0, 38.0, 45.0, 36.0, 69.0, 129.0, 173.0, 230.0, 398.0, 610.0, 1126.0, 2025.0, 4449.0, 10884.0, 30482.0, 105444.0, 432839.0, 338181.0, 79935.0, 24216.0, 8927.0, 3840.0, 1819.0, 969.0, 542.0, 338.0, 208.0, 145.0, 92.0, 80.0, 62.0, 39.0, 29.0, 33.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.239990234375, -0.23291015625, -0.225830078125, -0.21875, -0.211669921875, -0.20458984375, -0.197509765625, -0.1904296875, -0.183349609375, -0.17626953125, -0.169189453125, -0.162109375, -0.155029296875, -0.14794921875, -0.140869140625, -0.1337890625, -0.126708984375, -0.11962890625, -0.112548828125, -0.10546875, -0.098388671875, -0.09130859375, -0.084228515625, -0.0771484375, -0.070068359375, -0.06298828125, -0.055908203125, -0.048828125, -0.041748046875, -0.03466796875, -0.027587890625, -0.0205078125, -0.013427734375, -0.00634765625, 0.000732421875, 0.0078125, 0.014892578125, 0.02197265625, 0.029052734375, 0.0361328125, 0.043212890625, 0.05029296875, 0.057373046875, 0.064453125, 0.071533203125, 0.07861328125, 0.085693359375, 0.0927734375, 0.099853515625, 0.10693359375, 0.114013671875, 0.12109375, 0.128173828125, 0.13525390625, 0.142333984375, 0.1494140625, 0.156494140625, 0.16357421875, 0.170654296875, 0.177734375, 0.184814453125, 0.19189453125, 0.198974609375, 0.2060546875, 0.213134765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 12.0, 10.0, 14.0, 27.0, 15.0, 19.0, 28.0, 33.0, 46.0, 25.0, 37.0, 36.0, 46.0, 49.0, 50.0, 50.0, 38.0, 52.0, 63.0, 38.0, 39.0, 30.0, 35.0, 27.0, 29.0, 24.0, 16.0, 13.0, 15.0, 16.0, 15.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11859130859375, -0.11428546905517578, -0.10997962951660156, -0.10567378997802734, -0.10136795043945312, -0.0970621109008789, -0.09275627136230469, -0.08845043182373047, -0.08414459228515625, -0.07983875274658203, -0.07553291320800781, -0.0712270736694336, -0.06692123413085938, -0.06261539459228516, -0.05830955505371094, -0.05400371551513672, -0.0496978759765625, -0.04539203643798828, -0.04108619689941406, -0.036780357360839844, -0.032474517822265625, -0.028168678283691406, -0.023862838745117188, -0.01955699920654297, -0.01525115966796875, -0.010945320129394531, -0.0066394805908203125, -0.0023336410522460938, 0.001972198486328125, 0.006278038024902344, 0.010583877563476562, 0.014889717102050781, 0.019195556640625, 0.02350139617919922, 0.027807235717773438, 0.032113075256347656, 0.036418914794921875, 0.040724754333496094, 0.04503059387207031, 0.04933643341064453, 0.05364227294921875, 0.05794811248779297, 0.06225395202636719, 0.0665597915649414, 0.07086563110351562, 0.07517147064208984, 0.07947731018066406, 0.08378314971923828, 0.0880889892578125, 0.09239482879638672, 0.09670066833496094, 0.10100650787353516, 0.10531234741210938, 0.1096181869506836, 0.11392402648925781, 0.11822986602783203, 0.12253570556640625, 0.12684154510498047, 0.1311473846435547, 0.1354532241821289, 0.13975906372070312, 0.14406490325927734, 0.14837074279785156, 0.15267658233642578, 0.156982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 11.0, 9.0, 18.0, 28.0, 51.0, 64.0, 101.0, 153.0, 262.0, 496.0, 1004.0, 2531.0, 8028.0, 42743.0, 671849.0, 282905.0, 28249.0, 6195.0, 1935.0, 865.0, 433.0, 221.0, 137.0, 78.0, 48.0, 42.0, 34.0, 22.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27368927001953125, -0.2617340087890625, -0.24977874755859375, -0.237823486328125, -0.22586822509765625, -0.2139129638671875, -0.20195770263671875, -0.19000244140625, -0.17804718017578125, -0.1660919189453125, -0.15413665771484375, -0.142181396484375, -0.13022613525390625, -0.1182708740234375, -0.10631561279296875, -0.0943603515625, -0.08240509033203125, -0.0704498291015625, -0.05849456787109375, -0.046539306640625, -0.03458404541015625, -0.0226287841796875, -0.01067352294921875, 0.00128173828125, 0.01323699951171875, 0.0251922607421875, 0.03714752197265625, 0.049102783203125, 0.06105804443359375, 0.0730133056640625, 0.08496856689453125, 0.096923828125, 0.10887908935546875, 0.1208343505859375, 0.13278961181640625, 0.144744873046875, 0.15670013427734375, 0.1686553955078125, 0.18061065673828125, 0.19256591796875, 0.20452117919921875, 0.2164764404296875, 0.22843170166015625, 0.240386962890625, 0.25234222412109375, 0.2642974853515625, 0.27625274658203125, 0.2882080078125, 0.30016326904296875, 0.3121185302734375, 0.32407379150390625, 0.336029052734375, 0.34798431396484375, 0.3599395751953125, 0.37189483642578125, 0.38385009765625, 0.39580535888671875, 0.4077606201171875, 0.41971588134765625, 0.431671142578125, 0.44362640380859375, 0.4555816650390625, 0.46753692626953125, 0.4794921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 3.0, 10.0, 22.0, 13.0, 19.0, 23.0, 30.0, 38.0, 50.0, 32.0, 65.0, 50.0, 62.0, 61.0, 58.0, 52.0, 59.0, 52.0, 46.0, 44.0, 38.0, 26.0, 19.0, 17.0, 24.0, 14.0, 8.0, 12.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5231170654296875, -0.504730224609375, -0.4863433837890625, -0.46795654296875, -0.4495697021484375, -0.431182861328125, -0.4127960205078125, -0.3944091796875, -0.3760223388671875, -0.357635498046875, -0.3392486572265625, -0.32086181640625, -0.3024749755859375, -0.284088134765625, -0.2657012939453125, -0.247314453125, -0.2289276123046875, -0.210540771484375, -0.1921539306640625, -0.17376708984375, -0.1553802490234375, -0.136993408203125, -0.1186065673828125, -0.1002197265625, -0.0818328857421875, -0.063446044921875, -0.0450592041015625, -0.02667236328125, -0.0082855224609375, 0.010101318359375, 0.0284881591796875, 0.046875, 0.0652618408203125, 0.083648681640625, 0.1020355224609375, 0.12042236328125, 0.1388092041015625, 0.157196044921875, 0.1755828857421875, 0.1939697265625, 0.2123565673828125, 0.230743408203125, 0.2491302490234375, 0.26751708984375, 0.2859039306640625, 0.304290771484375, 0.3226776123046875, 0.341064453125, 0.3594512939453125, 0.377838134765625, 0.3962249755859375, 0.41461181640625, 0.4329986572265625, 0.451385498046875, 0.4697723388671875, 0.4881591796875, 0.5065460205078125, 0.524932861328125, 0.5433197021484375, 0.56170654296875, 0.5800933837890625, 0.598480224609375, 0.6168670654296875, 0.63525390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 9.0, 2.0, 6.0, 11.0, 14.0, 30.0, 28.0, 33.0, 44.0, 59.0, 100.0, 145.0, 196.0, 303.0, 529.0, 829.0, 1454.0, 2780.0, 5724.0, 12783.0, 31947.0, 99060.0, 586230.0, 209806.0, 57592.0, 20768.0, 8862.0, 4106.0, 2084.0, 1148.0, 673.0, 420.0, 249.0, 160.0, 107.0, 80.0, 46.0, 32.0, 23.0, 13.0, 8.0, 10.0, 7.0, 5.0, 7.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.08319091796875, -0.08065223693847656, -0.07811355590820312, -0.07557487487792969, -0.07303619384765625, -0.07049751281738281, -0.06795883178710938, -0.06542015075683594, -0.0628814697265625, -0.06034278869628906, -0.057804107666015625, -0.05526542663574219, -0.05272674560546875, -0.05018806457519531, -0.047649383544921875, -0.04511070251464844, -0.042572021484375, -0.04003334045410156, -0.037494659423828125, -0.03495597839355469, -0.03241729736328125, -0.029878616333007812, -0.027339935302734375, -0.024801254272460938, -0.0222625732421875, -0.019723892211914062, -0.017185211181640625, -0.014646530151367188, -0.01210784912109375, -0.009569168090820312, -0.007030487060546875, -0.0044918060302734375, -0.001953125, 0.0005855560302734375, 0.003124237060546875, 0.0056629180908203125, 0.00820159912109375, 0.010740280151367188, 0.013278961181640625, 0.015817642211914062, 0.0183563232421875, 0.020895004272460938, 0.023433685302734375, 0.025972366333007812, 0.02851104736328125, 0.031049728393554688, 0.033588409423828125, 0.03612709045410156, 0.038665771484375, 0.04120445251464844, 0.043743133544921875, 0.04628181457519531, 0.04882049560546875, 0.05135917663574219, 0.053897857666015625, 0.05643653869628906, 0.0589752197265625, 0.06151390075683594, 0.06405258178710938, 0.06659126281738281, 0.06912994384765625, 0.07166862487792969, 0.07420730590820312, 0.07674598693847656, 0.07928466796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 11.0, 10.0, 22.0, 24.0, 35.0, 39.0, 73.0, 83.0, 104.0, 117.0, 117.0, 100.0, 70.0, 46.0, 36.0, 23.0, 15.0, 16.0, 15.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.148110747337341e-05, -4.016607999801636e-05, -3.88510525226593e-05, -3.7536025047302246e-05, -3.622099757194519e-05, -3.4905970096588135e-05, -3.359094262123108e-05, -3.2275915145874023e-05, -3.096088767051697e-05, -2.9645860195159912e-05, -2.8330832719802856e-05, -2.70158052444458e-05, -2.5700777769088745e-05, -2.438575029373169e-05, -2.3070722818374634e-05, -2.1755695343017578e-05, -2.0440667867660522e-05, -1.9125640392303467e-05, -1.781061291694641e-05, -1.6495585441589355e-05, -1.51805579662323e-05, -1.3865530490875244e-05, -1.2550503015518188e-05, -1.1235475540161133e-05, -9.920448064804077e-06, -8.605420589447021e-06, -7.290393114089966e-06, -5.97536563873291e-06, -4.6603381633758545e-06, -3.345310688018799e-06, -2.030283212661743e-06, -7.152557373046875e-07, 5.997717380523682e-07, 1.914799213409424e-06, 3.2298266887664795e-06, 4.544854164123535e-06, 5.859881639480591e-06, 7.1749091148376465e-06, 8.489936590194702e-06, 9.804964065551758e-06, 1.1119991540908813e-05, 1.2435019016265869e-05, 1.3750046491622925e-05, 1.506507396697998e-05, 1.6380101442337036e-05, 1.7695128917694092e-05, 1.9010156393051147e-05, 2.0325183868408203e-05, 2.164021134376526e-05, 2.2955238819122314e-05, 2.427026629447937e-05, 2.5585293769836426e-05, 2.690032124519348e-05, 2.8215348720550537e-05, 2.9530376195907593e-05, 3.084540367126465e-05, 3.2160431146621704e-05, 3.347545862197876e-05, 3.4790486097335815e-05, 3.610551357269287e-05, 3.742054104804993e-05, 3.873556852340698e-05, 4.005059599876404e-05, 4.1365623474121094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 10.0, 9.0, 11.0, 15.0, 25.0, 46.0, 51.0, 95.0, 140.0, 179.0, 314.0, 582.0, 1192.0, 2235.0, 4990.0, 12902.0, 39959.0, 177229.0, 657557.0, 106219.0, 27575.0, 9382.0, 3827.0, 1788.0, 896.0, 475.0, 317.0, 184.0, 116.0, 55.0, 51.0, 46.0, 27.0, 14.0, 15.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11260986328125, -0.10942363739013672, -0.10623741149902344, -0.10305118560791016, -0.09986495971679688, -0.0966787338256836, -0.09349250793457031, -0.09030628204345703, -0.08712005615234375, -0.08393383026123047, -0.08074760437011719, -0.0775613784790039, -0.07437515258789062, -0.07118892669677734, -0.06800270080566406, -0.06481647491455078, -0.0616302490234375, -0.05844402313232422, -0.05525779724121094, -0.052071571350097656, -0.048885345458984375, -0.045699119567871094, -0.04251289367675781, -0.03932666778564453, -0.03614044189453125, -0.03295421600341797, -0.029767990112304688, -0.026581764221191406, -0.023395538330078125, -0.020209312438964844, -0.017023086547851562, -0.013836860656738281, -0.010650634765625, -0.007464408874511719, -0.0042781829833984375, -0.0010919570922851562, 0.002094268798828125, 0.005280494689941406, 0.008466720581054688, 0.011652946472167969, 0.01483917236328125, 0.01802539825439453, 0.021211624145507812, 0.024397850036621094, 0.027584075927734375, 0.030770301818847656, 0.03395652770996094, 0.03714275360107422, 0.0403289794921875, 0.04351520538330078, 0.04670143127441406, 0.049887657165527344, 0.053073883056640625, 0.056260108947753906, 0.05944633483886719, 0.06263256072998047, 0.06581878662109375, 0.06900501251220703, 0.07219123840332031, 0.0753774642944336, 0.07856369018554688, 0.08174991607666016, 0.08493614196777344, 0.08812236785888672, 0.09130859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 14.0, 19.0, 17.0, 24.0, 39.0, 50.0, 54.0, 76.0, 89.0, 101.0, 87.0, 86.0, 60.0, 73.0, 53.0, 24.0, 22.0, 22.0, 14.0, 11.0, 8.0, 7.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112060546875, -0.10832786560058594, -0.10459518432617188, -0.10086250305175781, -0.09712982177734375, -0.09339714050292969, -0.08966445922851562, -0.08593177795410156, -0.0821990966796875, -0.07846641540527344, -0.07473373413085938, -0.07100105285644531, -0.06726837158203125, -0.06353569030761719, -0.059803009033203125, -0.05607032775878906, -0.052337646484375, -0.04860496520996094, -0.044872283935546875, -0.04113960266113281, -0.03740692138671875, -0.03367424011230469, -0.029941558837890625, -0.026208877563476562, -0.0224761962890625, -0.018743515014648438, -0.015010833740234375, -0.011278152465820312, -0.00754547119140625, -0.0038127899169921875, -8.0108642578125e-05, 0.0036525726318359375, 0.00738525390625, 0.011117935180664062, 0.014850616455078125, 0.018583297729492188, 0.02231597900390625, 0.026048660278320312, 0.029781341552734375, 0.03351402282714844, 0.0372467041015625, 0.04097938537597656, 0.044712066650390625, 0.04844474792480469, 0.05217742919921875, 0.05591011047363281, 0.059642791748046875, 0.06337547302246094, 0.067108154296875, 0.07084083557128906, 0.07457351684570312, 0.07830619812011719, 0.08203887939453125, 0.08577156066894531, 0.08950424194335938, 0.09323692321777344, 0.0969696044921875, 0.10070228576660156, 0.10443496704101562, 0.10816764831542969, 0.11190032958984375, 0.11563301086425781, 0.11936569213867188, 0.12309837341308594, 0.1268310546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 69.0, 148.0, 346.0, 197.0, 100.0, 42.0, 29.0, 11.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.927361011505127, -3.8200178146362305, -3.712674617767334, -3.6053314208984375, -3.497988224029541, -3.3906450271606445, -3.283301830291748, -3.1759586334228516, -3.068615436553955, -2.9612722396850586, -2.853929042816162, -2.7465858459472656, -2.639242649078369, -2.5318994522094727, -2.424556255340576, -2.3172130584716797, -2.209869861602783, -2.1025266647338867, -1.9951834678649902, -1.8878402709960938, -1.7804970741271973, -1.6731538772583008, -1.5658106803894043, -1.4584674835205078, -1.3511242866516113, -1.2437810897827148, -1.1364378929138184, -1.0290946960449219, -0.9217514991760254, -0.8144083023071289, -0.7070651054382324, -0.5997219085693359, -0.49237847328186035, -0.38503527641296387, -0.2776920795440674, -0.1703488826751709, -0.06300568580627441, 0.04433751106262207, 0.15168070793151855, 0.25902390480041504, 0.3663671016693115, 0.473710298538208, 0.5810534954071045, 0.688396692276001, 0.7957398891448975, 0.903083086013794, 1.0104262828826904, 1.117769479751587, 1.2251126766204834, 1.3324558734893799, 1.4397990703582764, 1.5471422672271729, 1.6544854640960693, 1.7618286609649658, 1.8691718578338623, 1.9765150547027588, 2.0838582515716553, 2.1912014484405518, 2.2985446453094482, 2.4058878421783447, 2.513231039047241, 2.6205742359161377, 2.727917432785034, 2.8352606296539307, 2.942603826522827]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 18.0, 8.0, 24.0, 12.0, 20.0, 26.0, 27.0, 32.0, 27.0, 41.0, 40.0, 88.0, 98.0, 86.0, 71.0, 51.0, 31.0, 36.0, 33.0, 30.0, 36.0, 18.0, 19.0, 17.0, 13.0, 8.0, 8.0, 12.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.4488959312438965, -2.380946159362793, -2.3129966259002686, -2.245047092437744, -2.1770973205566406, -2.109147548675537, -2.0411980152130127, -1.9732483625411987, -1.9052987098693848, -1.8373490571975708, -1.7693994045257568, -1.7014497518539429, -1.633500099182129, -1.565550446510315, -1.497600793838501, -1.429651141166687, -1.361701488494873, -1.293751835823059, -1.2258021831512451, -1.1578525304794312, -1.0899028778076172, -1.0219532251358032, -0.9540035724639893, -0.8860539197921753, -0.8181042671203613, -0.7501546144485474, -0.6822049617767334, -0.6142553091049194, -0.5463056564331055, -0.4783560037612915, -0.41040635108947754, -0.3424566984176636, -0.2745072841644287, -0.20655763149261475, -0.13860797882080078, -0.07065832614898682, -0.0027086734771728516, 0.06524097919464111, 0.13319063186645508, 0.20114028453826904, 0.269089937210083, 0.337039589881897, 0.40498924255371094, 0.4729388952255249, 0.5408885478973389, 0.6088382005691528, 0.6767878532409668, 0.7447375059127808, 0.8126871585845947, 0.8806368112564087, 0.9485864639282227, 1.0165361166000366, 1.0844857692718506, 1.1524354219436646, 1.2203850746154785, 1.2883347272872925, 1.3562843799591064, 1.4242340326309204, 1.4921836853027344, 1.5601333379745483, 1.6280829906463623, 1.6960326433181763, 1.7639822959899902, 1.8319319486618042, 1.8998816013336182]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 16.0, 4.0, 12.0, 13.0, 27.0, 38.0, 47.0, 68.0, 116.0, 162.0, 260.0, 405.0, 569.0, 1023.0, 1918.0, 3807.0, 9282.0, 26173.0, 100880.0, 550573.0, 2311126.0, 965677.0, 163309.0, 36321.0, 11928.0, 5015.0, 2350.0, 1246.0, 679.0, 424.0, 247.0, 174.0, 114.0, 97.0, 59.0, 35.0, 23.0, 23.0, 11.0, 8.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.183349609375, -0.1782073974609375, -0.173065185546875, -0.1679229736328125, -0.16278076171875, -0.1576385498046875, -0.152496337890625, -0.1473541259765625, -0.1422119140625, -0.1370697021484375, -0.131927490234375, -0.1267852783203125, -0.12164306640625, -0.1165008544921875, -0.111358642578125, -0.1062164306640625, -0.10107421875, -0.0959320068359375, -0.090789794921875, -0.0856475830078125, -0.08050537109375, -0.0753631591796875, -0.070220947265625, -0.0650787353515625, -0.0599365234375, -0.0547943115234375, -0.049652099609375, -0.0445098876953125, -0.03936767578125, -0.0342254638671875, -0.029083251953125, -0.0239410400390625, -0.018798828125, -0.0136566162109375, -0.008514404296875, -0.0033721923828125, 0.00177001953125, 0.0069122314453125, 0.012054443359375, 0.0171966552734375, 0.0223388671875, 0.0274810791015625, 0.032623291015625, 0.0377655029296875, 0.04290771484375, 0.0480499267578125, 0.053192138671875, 0.0583343505859375, 0.0634765625, 0.0686187744140625, 0.073760986328125, 0.0789031982421875, 0.08404541015625, 0.0891876220703125, 0.094329833984375, 0.0994720458984375, 0.1046142578125, 0.1097564697265625, 0.114898681640625, 0.1200408935546875, 0.12518310546875, 0.1303253173828125, 0.135467529296875, 0.1406097412109375, 0.145751953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 17.0, 16.0, 24.0, 31.0, 36.0, 40.0, 35.0, 47.0, 46.0, 49.0, 55.0, 60.0, 52.0, 50.0, 50.0, 50.0, 46.0, 41.0, 39.0, 34.0, 29.0, 19.0, 22.0, 29.0, 11.0, 14.0, 9.0, 10.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.13487815856933594, -0.13010787963867188, -0.1253376007080078, -0.12056732177734375, -0.11579704284667969, -0.11102676391601562, -0.10625648498535156, -0.1014862060546875, -0.09671592712402344, -0.09194564819335938, -0.08717536926269531, -0.08240509033203125, -0.07763481140136719, -0.07286453247070312, -0.06809425354003906, -0.063323974609375, -0.05855369567871094, -0.053783416748046875, -0.04901313781738281, -0.04424285888671875, -0.03947257995605469, -0.034702301025390625, -0.029932022094726562, -0.0251617431640625, -0.020391464233398438, -0.015621185302734375, -0.010850906372070312, -0.00608062744140625, -0.0013103485107421875, 0.003459930419921875, 0.008230209350585938, 0.01300048828125, 0.017770767211914062, 0.022541046142578125, 0.027311325073242188, 0.03208160400390625, 0.03685188293457031, 0.041622161865234375, 0.04639244079589844, 0.0511627197265625, 0.05593299865722656, 0.060703277587890625, 0.06547355651855469, 0.07024383544921875, 0.07501411437988281, 0.07978439331054688, 0.08455467224121094, 0.089324951171875, 0.09409523010253906, 0.09886550903320312, 0.10363578796386719, 0.10840606689453125, 0.11317634582519531, 0.11794662475585938, 0.12271690368652344, 0.1274871826171875, 0.13225746154785156, 0.13702774047851562, 0.1417980194091797, 0.14656829833984375, 0.1513385772705078, 0.15610885620117188, 0.16087913513183594, 0.1656494140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 15.0, 7.0, 20.0, 30.0, 28.0, 62.0, 87.0, 159.0, 379.0, 927.0, 3276.0, 15552.0, 157508.0, 3681146.0, 307217.0, 21876.0, 4076.0, 1067.0, 364.0, 176.0, 95.0, 57.0, 34.0, 24.0, 20.0, 18.0, 8.0, 6.0, 9.0, 7.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.424713134765625, -0.41168212890625, -0.398651123046875, -0.3856201171875, -0.372589111328125, -0.35955810546875, -0.346527099609375, -0.33349609375, -0.320465087890625, -0.30743408203125, -0.294403076171875, -0.2813720703125, -0.268341064453125, -0.25531005859375, -0.242279052734375, -0.229248046875, -0.216217041015625, -0.20318603515625, -0.190155029296875, -0.1771240234375, -0.164093017578125, -0.15106201171875, -0.138031005859375, -0.125, -0.111968994140625, -0.09893798828125, -0.085906982421875, -0.0728759765625, -0.059844970703125, -0.04681396484375, -0.033782958984375, -0.020751953125, -0.007720947265625, 0.00531005859375, 0.018341064453125, 0.0313720703125, 0.044403076171875, 0.05743408203125, 0.070465087890625, 0.08349609375, 0.096527099609375, 0.10955810546875, 0.122589111328125, 0.1356201171875, 0.148651123046875, 0.16168212890625, 0.174713134765625, 0.187744140625, 0.200775146484375, 0.21380615234375, 0.226837158203125, 0.2398681640625, 0.252899169921875, 0.26593017578125, 0.278961181640625, 0.2919921875, 0.305023193359375, 0.31805419921875, 0.331085205078125, 0.3441162109375, 0.357147216796875, 0.37017822265625, 0.383209228515625, 0.396240234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 8.0, 14.0, 16.0, 21.0, 24.0, 33.0, 59.0, 86.0, 141.0, 222.0, 367.0, 613.0, 753.0, 627.0, 400.0, 252.0, 143.0, 89.0, 59.0, 33.0, 27.0, 11.0, 15.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2664604187011719, -0.25679779052734375, -0.24713516235351562, -0.2374725341796875, -0.22780990600585938, -0.21814727783203125, -0.20848464965820312, -0.198822021484375, -0.18915939331054688, -0.17949676513671875, -0.16983413696289062, -0.1601715087890625, -0.15050888061523438, -0.14084625244140625, -0.13118362426757812, -0.12152099609375, -0.11185836791992188, -0.10219573974609375, -0.09253311157226562, -0.0828704833984375, -0.07320785522460938, -0.06354522705078125, -0.053882598876953125, -0.044219970703125, -0.034557342529296875, -0.02489471435546875, -0.015232086181640625, -0.0055694580078125, 0.004093170166015625, 0.01375579833984375, 0.023418426513671875, 0.0330810546875, 0.042743682861328125, 0.05240631103515625, 0.062068939208984375, 0.0717315673828125, 0.08139419555664062, 0.09105682373046875, 0.10071945190429688, 0.110382080078125, 0.12004470825195312, 0.12970733642578125, 0.13936996459960938, 0.1490325927734375, 0.15869522094726562, 0.16835784912109375, 0.17802047729492188, 0.18768310546875, 0.19734573364257812, 0.20700836181640625, 0.21667098999023438, 0.2263336181640625, 0.23599624633789062, 0.24565887451171875, 0.2553215026855469, 0.264984130859375, 0.2746467590332031, 0.28430938720703125, 0.2939720153808594, 0.3036346435546875, 0.3132972717285156, 0.32295989990234375, 0.3326225280761719, 0.34228515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 17.0, 26.0, 35.0, 80.0, 148.0, 194.0, 168.0, 143.0, 79.0, 42.0, 17.0, 6.0, 7.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.446486234664917, -3.3627686500549316, -3.2790513038635254, -3.19533371925354, -3.1116161346435547, -3.0278987884521484, -2.944181203842163, -2.8604636192321777, -2.7767462730407715, -2.693028688430786, -2.60931134223938, -2.5255937576293945, -2.4418764114379883, -2.358158826828003, -2.2744412422180176, -2.1907238960266113, -2.107006311416626, -2.0232887268066406, -1.9395713806152344, -1.855853796005249, -1.7721363306045532, -1.6884188652038574, -1.604701280593872, -1.5209838151931763, -1.4372663497924805, -1.3535488843917847, -1.2698314189910889, -1.1861138343811035, -1.1023963689804077, -1.018678903579712, -0.9349613785743713, -0.8512438535690308, -0.7675262689590454, -0.6838088035583496, -0.600091278553009, -0.5163737535476685, -0.43265628814697266, -0.34893879294395447, -0.2652212977409363, -0.1815037727355957, -0.0977863073348999, -0.014068812131881714, 0.06964868307113647, 0.15336617827415466, 0.23708367347717285, 0.32080116868019104, 0.40451866388320923, 0.4882361888885498, 0.5719536542892456, 0.6556711196899414, 0.739388644695282, 0.8231061697006226, 0.9068236351013184, 0.9905411005020142, 1.07425856590271, 1.1579761505126953, 1.2416936159133911, 1.325411081314087, 1.4091286659240723, 1.492846131324768, 1.5765635967254639, 1.6602810621261597, 1.7439985275268555, 1.8277161121368408, 1.9114335775375366]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 6.0, 9.0, 15.0, 7.0, 13.0, 23.0, 23.0, 14.0, 21.0, 25.0, 35.0, 33.0, 30.0, 38.0, 49.0, 50.0, 43.0, 60.0, 45.0, 41.0, 43.0, 35.0, 28.0, 37.0, 34.0, 34.0, 18.0, 33.0, 20.0, 16.0, 14.0, 11.0, 11.0, 13.0, 7.0, 6.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.135279655456543, -1.0982357263565063, -1.0611919164657593, -1.0241479873657227, -0.9871041774749756, -0.950060248374939, -0.9130163788795471, -0.8759725093841553, -0.8389286398887634, -0.8018847703933716, -0.7648409008979797, -0.7277970314025879, -0.6907531023025513, -0.6537092924118042, -0.6166653633117676, -0.5796214938163757, -0.5425776243209839, -0.505533754825592, -0.4684898853302002, -0.43144598603248596, -0.3944021165370941, -0.35735824704170227, -0.32031434774398804, -0.2832704782485962, -0.24622660875320435, -0.2091827392578125, -0.17213885486125946, -0.13509497046470642, -0.09805110096931458, -0.06100723147392273, -0.02396334707736969, 0.01308053731918335, 0.050124406814575195, 0.08716828376054764, 0.12421216070652008, 0.16125604510307312, 0.19829991459846497, 0.2353437840938568, 0.27238768339157104, 0.3094315528869629, 0.34647542238235474, 0.3835192918777466, 0.4205631613731384, 0.45760706067085266, 0.4946509301662445, 0.531694769859314, 0.5687386989593506, 0.6057825684547424, 0.6428264379501343, 0.6798703074455261, 0.716914176940918, 0.7539580464363098, 0.7910019159317017, 0.8280458450317383, 0.8650897145271301, 0.902133584022522, 0.9391774535179138, 0.9762213230133057, 1.0132652521133423, 1.0503090620040894, 1.087352991104126, 1.124396800994873, 1.1614407300949097, 1.1984846591949463, 1.2355284690856934]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 5.0, 5.0, 11.0, 5.0, 17.0, 28.0, 29.0, 43.0, 43.0, 69.0, 105.0, 188.0, 250.0, 439.0, 774.0, 1364.0, 2631.0, 5794.0, 13820.0, 37773.0, 131265.0, 478820.0, 268692.0, 67010.0, 22275.0, 8767.0, 3848.0, 1929.0, 928.0, 561.0, 382.0, 203.0, 140.0, 91.0, 66.0, 51.0, 29.0, 34.0, 17.0, 14.0, 8.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.2301025390625, -0.2232837677001953, -0.21646499633789062, -0.20964622497558594, -0.20282745361328125, -0.19600868225097656, -0.18918991088867188, -0.1823711395263672, -0.1755523681640625, -0.1687335968017578, -0.16191482543945312, -0.15509605407714844, -0.14827728271484375, -0.14145851135253906, -0.13463973999023438, -0.1278209686279297, -0.121002197265625, -0.11418342590332031, -0.10736465454101562, -0.10054588317871094, -0.09372711181640625, -0.08690834045410156, -0.08008956909179688, -0.07327079772949219, -0.0664520263671875, -0.05963325500488281, -0.052814483642578125, -0.04599571228027344, -0.03917694091796875, -0.03235816955566406, -0.025539398193359375, -0.018720626831054688, -0.01190185546875, -0.0050830841064453125, 0.001735687255859375, 0.008554458618164062, 0.01537322998046875, 0.022192001342773438, 0.029010772705078125, 0.03582954406738281, 0.0426483154296875, 0.04946708679199219, 0.056285858154296875, 0.06310462951660156, 0.06992340087890625, 0.07674217224121094, 0.08356094360351562, 0.09037971496582031, 0.097198486328125, 0.10401725769042969, 0.11083602905273438, 0.11765480041503906, 0.12447357177734375, 0.13129234313964844, 0.13811111450195312, 0.1449298858642578, 0.1517486572265625, 0.1585674285888672, 0.16538619995117188, 0.17220497131347656, 0.17902374267578125, 0.18584251403808594, 0.19266128540039062, 0.1994800567626953, 0.206298828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 3.0, 10.0, 21.0, 18.0, 19.0, 27.0, 32.0, 49.0, 49.0, 51.0, 59.0, 57.0, 58.0, 56.0, 64.0, 58.0, 46.0, 52.0, 55.0, 44.0, 20.0, 26.0, 31.0, 24.0, 21.0, 16.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1547107696533203, -0.14914321899414062, -0.14357566833496094, -0.13800811767578125, -0.13244056701660156, -0.12687301635742188, -0.12130546569824219, -0.1157379150390625, -0.11017036437988281, -0.10460281372070312, -0.09903526306152344, -0.09346771240234375, -0.08790016174316406, -0.08233261108398438, -0.07676506042480469, -0.071197509765625, -0.06562995910644531, -0.060062408447265625, -0.05449485778808594, -0.04892730712890625, -0.04335975646972656, -0.037792205810546875, -0.03222465515136719, -0.0266571044921875, -0.021089553833007812, -0.015522003173828125, -0.009954452514648438, -0.00438690185546875, 0.0011806488037109375, 0.006748199462890625, 0.012315750122070312, 0.01788330078125, 0.023450851440429688, 0.029018402099609375, 0.03458595275878906, 0.04015350341796875, 0.04572105407714844, 0.051288604736328125, 0.05685615539550781, 0.0624237060546875, 0.06799125671386719, 0.07355880737304688, 0.07912635803222656, 0.08469390869140625, 0.09026145935058594, 0.09582901000976562, 0.10139656066894531, 0.106964111328125, 0.11253166198730469, 0.11809921264648438, 0.12366676330566406, 0.12923431396484375, 0.13480186462402344, 0.14036941528320312, 0.1459369659423828, 0.1515045166015625, 0.1570720672607422, 0.16263961791992188, 0.16820716857910156, 0.17377471923828125, 0.17934226989746094, 0.18490982055664062, 0.1904773712158203, 0.196044921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 17.0, 27.0, 31.0, 40.0, 47.0, 92.0, 161.0, 276.0, 560.0, 1135.0, 2895.0, 10171.0, 66972.0, 845876.0, 101087.0, 13074.0, 3431.0, 1265.0, 583.0, 326.0, 167.0, 102.0, 68.0, 39.0, 39.0, 17.0, 18.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.46459197998046875, -0.4511566162109375, -0.43772125244140625, -0.424285888671875, -0.41085052490234375, -0.3974151611328125, -0.38397979736328125, -0.37054443359375, -0.35710906982421875, -0.3436737060546875, -0.33023834228515625, -0.316802978515625, -0.30336761474609375, -0.2899322509765625, -0.27649688720703125, -0.2630615234375, -0.24962615966796875, -0.2361907958984375, -0.22275543212890625, -0.209320068359375, -0.19588470458984375, -0.1824493408203125, -0.16901397705078125, -0.15557861328125, -0.14214324951171875, -0.1287078857421875, -0.11527252197265625, -0.101837158203125, -0.08840179443359375, -0.0749664306640625, -0.06153106689453125, -0.048095703125, -0.03466033935546875, -0.0212249755859375, -0.00778961181640625, 0.005645751953125, 0.01908111572265625, 0.0325164794921875, 0.04595184326171875, 0.05938720703125, 0.07282257080078125, 0.0862579345703125, 0.09969329833984375, 0.113128662109375, 0.12656402587890625, 0.1399993896484375, 0.15343475341796875, 0.1668701171875, 0.18030548095703125, 0.1937408447265625, 0.20717620849609375, 0.220611572265625, 0.23404693603515625, 0.2474822998046875, 0.26091766357421875, 0.27435302734375, 0.28778839111328125, 0.3012237548828125, 0.31465911865234375, 0.328094482421875, 0.34152984619140625, 0.3549652099609375, 0.36840057373046875, 0.3818359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 14.0, 22.0, 14.0, 20.0, 26.0, 30.0, 43.0, 39.0, 40.0, 35.0, 51.0, 56.0, 61.0, 52.0, 54.0, 63.0, 47.0, 47.0, 50.0, 37.0, 30.0, 27.0, 19.0, 19.0, 17.0, 12.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996780395507812, -0.5821685791015625, -0.5646591186523438, -0.547149658203125, -0.5296401977539062, -0.5121307373046875, -0.49462127685546875, -0.47711181640625, -0.45960235595703125, -0.4420928955078125, -0.42458343505859375, -0.407073974609375, -0.38956451416015625, -0.3720550537109375, -0.35454559326171875, -0.3370361328125, -0.31952667236328125, -0.3020172119140625, -0.28450775146484375, -0.266998291015625, -0.24948883056640625, -0.2319793701171875, -0.21446990966796875, -0.19696044921875, -0.17945098876953125, -0.1619415283203125, -0.14443206787109375, -0.126922607421875, -0.10941314697265625, -0.0919036865234375, -0.07439422607421875, -0.056884765625, -0.03937530517578125, -0.0218658447265625, -0.00435638427734375, 0.013153076171875, 0.03066253662109375, 0.0481719970703125, 0.06568145751953125, 0.08319091796875, 0.10070037841796875, 0.1182098388671875, 0.13571929931640625, 0.153228759765625, 0.17073822021484375, 0.1882476806640625, 0.20575714111328125, 0.2232666015625, 0.24077606201171875, 0.2582855224609375, 0.27579498291015625, 0.293304443359375, 0.31081390380859375, 0.3283233642578125, 0.34583282470703125, 0.36334228515625, 0.38085174560546875, 0.3983612060546875, 0.41587066650390625, 0.433380126953125, 0.45088958740234375, 0.4683990478515625, 0.48590850830078125, 0.50341796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 15.0, 15.0, 19.0, 21.0, 31.0, 48.0, 61.0, 90.0, 126.0, 219.0, 361.0, 722.0, 1392.0, 2931.0, 7089.0, 19007.0, 65566.0, 578260.0, 286714.0, 56531.0, 17409.0, 6269.0, 2716.0, 1278.0, 622.0, 356.0, 250.0, 120.0, 92.0, 68.0, 44.0, 28.0, 16.0, 19.0, 15.0, 15.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.07396507263183594, -0.07157516479492188, -0.06918525695800781, -0.06679534912109375, -0.06440544128417969, -0.062015533447265625, -0.05962562561035156, -0.0572357177734375, -0.05484580993652344, -0.052455902099609375, -0.05006599426269531, -0.04767608642578125, -0.04528617858886719, -0.042896270751953125, -0.04050636291503906, -0.038116455078125, -0.03572654724121094, -0.033336639404296875, -0.030946731567382812, -0.02855682373046875, -0.026166915893554688, -0.023777008056640625, -0.021387100219726562, -0.0189971923828125, -0.016607284545898438, -0.014217376708984375, -0.011827468872070312, -0.00943756103515625, -0.0070476531982421875, -0.004657745361328125, -0.0022678375244140625, 0.0001220703125, 0.0025119781494140625, 0.004901885986328125, 0.0072917938232421875, 0.00968170166015625, 0.012071609497070312, 0.014461517333984375, 0.016851425170898438, 0.0192413330078125, 0.021631240844726562, 0.024021148681640625, 0.026411056518554688, 0.02880096435546875, 0.031190872192382812, 0.033580780029296875, 0.03597068786621094, 0.038360595703125, 0.04075050354003906, 0.043140411376953125, 0.04553031921386719, 0.04792022705078125, 0.05031013488769531, 0.052700042724609375, 0.05508995056152344, 0.0574798583984375, 0.05986976623535156, 0.062259674072265625, 0.06464958190917969, 0.06703948974609375, 0.06942939758300781, 0.07181930541992188, 0.07420921325683594, 0.07659912109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 12.0, 16.0, 19.0, 39.0, 50.0, 91.0, 132.0, 164.0, 161.0, 114.0, 80.0, 49.0, 31.0, 17.0, 8.0, 10.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7610530853271484e-05, -3.6094337701797485e-05, -3.4578144550323486e-05, -3.306195139884949e-05, -3.154575824737549e-05, -3.002956509590149e-05, -2.851337194442749e-05, -2.699717879295349e-05, -2.5480985641479492e-05, -2.3964792490005493e-05, -2.2448599338531494e-05, -2.0932406187057495e-05, -1.9416213035583496e-05, -1.7900019884109497e-05, -1.6383826732635498e-05, -1.4867633581161499e-05, -1.33514404296875e-05, -1.1835247278213501e-05, -1.0319054126739502e-05, -8.802860975265503e-06, -7.286667823791504e-06, -5.770474672317505e-06, -4.254281520843506e-06, -2.738088369369507e-06, -1.2218952178955078e-06, 2.942979335784912e-07, 1.8104910850524902e-06, 3.3266842365264893e-06, 4.842877388000488e-06, 6.359070539474487e-06, 7.875263690948486e-06, 9.391456842422485e-06, 1.0907649993896484e-05, 1.2423843145370483e-05, 1.3940036296844482e-05, 1.545622944831848e-05, 1.697242259979248e-05, 1.848861575126648e-05, 2.000480890274048e-05, 2.1521002054214478e-05, 2.3037195205688477e-05, 2.4553388357162476e-05, 2.6069581508636475e-05, 2.7585774660110474e-05, 2.9101967811584473e-05, 3.061816096305847e-05, 3.213435411453247e-05, 3.365054726600647e-05, 3.516674041748047e-05, 3.668293356895447e-05, 3.819912672042847e-05, 3.9715319871902466e-05, 4.1231513023376465e-05, 4.2747706174850464e-05, 4.426389932632446e-05, 4.578009247779846e-05, 4.729628562927246e-05, 4.881247878074646e-05, 5.032867193222046e-05, 5.184486508369446e-05, 5.336105823516846e-05, 5.4877251386642456e-05, 5.6393444538116455e-05, 5.7909637689590454e-05, 5.942583084106445e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 5.0, 22.0, 13.0, 37.0, 46.0, 63.0, 101.0, 136.0, 216.0, 322.0, 567.0, 914.0, 1822.0, 3689.0, 8857.0, 24360.0, 77773.0, 555502.0, 270513.0, 66546.0, 21721.0, 7971.0, 3484.0, 1611.0, 865.0, 474.0, 299.0, 192.0, 140.0, 75.0, 69.0, 33.0, 24.0, 18.0, 12.0, 14.0, 12.0, 5.0, 5.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.058005332946777344, -0.05576896667480469, -0.05353260040283203, -0.051296234130859375, -0.04905986785888672, -0.04682350158691406, -0.044587135314941406, -0.04235076904296875, -0.040114402770996094, -0.03787803649902344, -0.03564167022705078, -0.033405303955078125, -0.03116893768310547, -0.028932571411132812, -0.026696205139160156, -0.0244598388671875, -0.022223472595214844, -0.019987106323242188, -0.01775074005126953, -0.015514373779296875, -0.013278007507324219, -0.011041641235351562, -0.008805274963378906, -0.00656890869140625, -0.004332542419433594, -0.0020961761474609375, 0.00014019012451171875, 0.002376556396484375, 0.004612922668457031, 0.0068492889404296875, 0.009085655212402344, 0.011322021484375, 0.013558387756347656, 0.015794754028320312, 0.01803112030029297, 0.020267486572265625, 0.02250385284423828, 0.024740219116210938, 0.026976585388183594, 0.02921295166015625, 0.031449317932128906, 0.03368568420410156, 0.03592205047607422, 0.038158416748046875, 0.04039478302001953, 0.04263114929199219, 0.044867515563964844, 0.0471038818359375, 0.049340248107910156, 0.05157661437988281, 0.05381298065185547, 0.056049346923828125, 0.05828571319580078, 0.06052207946777344, 0.0627584457397461, 0.06499481201171875, 0.0672311782836914, 0.06946754455566406, 0.07170391082763672, 0.07394027709960938, 0.07617664337158203, 0.07841300964355469, 0.08064937591552734, 0.0828857421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 2.0, 6.0, 5.0, 12.0, 27.0, 24.0, 29.0, 37.0, 58.0, 49.0, 71.0, 99.0, 96.0, 90.0, 85.0, 76.0, 55.0, 44.0, 28.0, 23.0, 20.0, 12.0, 10.0, 14.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10774707794189453, -0.10453224182128906, -0.1013174057006836, -0.09810256958007812, -0.09488773345947266, -0.09167289733886719, -0.08845806121826172, -0.08524322509765625, -0.08202838897705078, -0.07881355285644531, -0.07559871673583984, -0.07238388061523438, -0.0691690444946289, -0.06595420837402344, -0.06273937225341797, -0.0595245361328125, -0.05630970001220703, -0.05309486389160156, -0.049880027770996094, -0.046665191650390625, -0.043450355529785156, -0.04023551940917969, -0.03702068328857422, -0.03380584716796875, -0.03059101104736328, -0.027376174926757812, -0.024161338806152344, -0.020946502685546875, -0.017731666564941406, -0.014516830444335938, -0.011301994323730469, -0.008087158203125, -0.004872322082519531, -0.0016574859619140625, 0.0015573501586914062, 0.004772186279296875, 0.007987022399902344, 0.011201858520507812, 0.014416694641113281, 0.01763153076171875, 0.02084636688232422, 0.024061203002929688, 0.027276039123535156, 0.030490875244140625, 0.033705711364746094, 0.03692054748535156, 0.04013538360595703, 0.0433502197265625, 0.04656505584716797, 0.04977989196777344, 0.052994728088378906, 0.056209564208984375, 0.059424400329589844, 0.06263923645019531, 0.06585407257080078, 0.06906890869140625, 0.07228374481201172, 0.07549858093261719, 0.07871341705322266, 0.08192825317382812, 0.0851430892944336, 0.08835792541503906, 0.09157276153564453, 0.09478759765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 13.0, 30.0, 52.0, 145.0, 395.0, 190.0, 94.0, 38.0, 18.0, 8.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1198501586914062, -3.0021679401397705, -2.8844857215881348, -2.76680326461792, -2.649121046066284, -2.5314388275146484, -2.4137563705444336, -2.296074151992798, -2.178391933441162, -2.0607097148895264, -1.943027377128601, -1.8253450393676758, -1.70766282081604, -1.5899806022644043, -1.472298264503479, -1.3546159267425537, -1.236933708190918, -1.1192514896392822, -1.001569151878357, -0.8838868737220764, -0.7662045955657959, -0.6485223174095154, -0.5308400392532349, -0.41315776109695435, -0.29547548294067383, -0.1777932047843933, -0.06011092662811279, 0.057571351528167725, 0.17525362968444824, 0.29293590784072876, 0.4106181859970093, 0.5283004641532898, 0.6459827423095703, 0.7636650204658508, 0.8813472986221313, 0.9990295767784119, 1.1167118549346924, 1.2343940734863281, 1.3520764112472534, 1.4697587490081787, 1.5874409675598145, 1.7051231861114502, 1.8228055238723755, 1.9404878616333008, 2.0581700801849365, 2.1758522987365723, 2.293534755706787, 2.411216974258423, 2.5288991928100586, 2.6465814113616943, 2.76426362991333, 2.881946086883545, 2.9996283054351807, 3.1173105239868164, 3.2349929809570312, 3.352675199508667, 3.4703574180603027, 3.5880396366119385, 3.705721855163574, 3.823404312133789, 3.941086530685425, 4.0587687492370605, 4.176451206207275, 4.294133186340332, 4.411815643310547]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 1.0, 8.0, 9.0, 8.0, 7.0, 9.0, 13.0, 20.0, 24.0, 21.0, 24.0, 30.0, 33.0, 53.0, 41.0, 95.0, 111.0, 123.0, 78.0, 45.0, 36.0, 23.0, 26.0, 40.0, 24.0, 17.0, 16.0, 16.0, 7.0, 6.0, 9.0, 4.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9430243968963623, -1.8712377548217773, -1.7994511127471924, -1.7276644706726074, -1.6558778285980225, -1.5840911865234375, -1.512304425239563, -1.440517783164978, -1.368731141090393, -1.296944499015808, -1.2251578569412231, -1.1533712148666382, -1.0815844535827637, -1.0097978115081787, -0.9380111694335938, -0.8662245273590088, -0.7944378852844238, -0.7226512432098389, -0.6508646011352539, -0.5790778994560242, -0.5072912573814392, -0.43550461530685425, -0.3637179434299469, -0.29193127155303955, -0.2201446294784546, -0.14835797250270844, -0.07657131552696228, -0.0047846585512161255, 0.06700199842453003, 0.138788640499115, 0.21057531237602234, 0.2823619842529297, 0.35414886474609375, 0.4259355068206787, 0.49772217869758606, 0.5695088505744934, 0.6412954926490784, 0.7130821347236633, 0.7848688364028931, 0.856655478477478, 0.928442120552063, 1.000228762626648, 1.072015404701233, 1.1438020467758179, 1.2155888080596924, 1.2873754501342773, 1.3591620922088623, 1.4309487342834473, 1.5027353763580322, 1.5745220184326172, 1.6463086605072021, 1.718095302581787, 1.789881944656372, 1.861668586730957, 1.9334553480148315, 2.005241870880127, 2.077028751373291, 2.148815393447876, 2.220602035522461, 2.292388677597046, 2.364175319671631, 2.435961961746216, 2.507748603820801, 2.579535484313965, 2.6513218879699707]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 12.0, 18.0, 29.0, 44.0, 69.0, 109.0, 219.0, 326.0, 577.0, 931.0, 1560.0, 2929.0, 5842.0, 11608.0, 25967.0, 67381.0, 209872.0, 718566.0, 1725985.0, 977459.0, 292639.0, 88269.0, 33125.0, 14784.0, 7118.0, 3802.0, 2064.0, 1191.0, 665.0, 391.0, 267.0, 176.0, 103.0, 68.0, 47.0, 19.0, 14.0, 10.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15789222717285156, -0.15196609497070312, -0.1460399627685547, -0.14011383056640625, -0.1341876983642578, -0.12826156616210938, -0.12233543395996094, -0.1164093017578125, -0.11048316955566406, -0.10455703735351562, -0.09863090515136719, -0.09270477294921875, -0.08677864074707031, -0.08085250854492188, -0.07492637634277344, -0.069000244140625, -0.06307411193847656, -0.057147979736328125, -0.05122184753417969, -0.04529571533203125, -0.03936958312988281, -0.033443450927734375, -0.027517318725585938, -0.0215911865234375, -0.015665054321289062, -0.009738922119140625, -0.0038127899169921875, 0.00211334228515625, 0.008039474487304688, 0.013965606689453125, 0.019891738891601562, 0.02581787109375, 0.03174400329589844, 0.037670135498046875, 0.04359626770019531, 0.04952239990234375, 0.05544853210449219, 0.061374664306640625, 0.06730079650878906, 0.0732269287109375, 0.07915306091308594, 0.08507919311523438, 0.09100532531738281, 0.09693145751953125, 0.10285758972167969, 0.10878372192382812, 0.11470985412597656, 0.120635986328125, 0.12656211853027344, 0.13248825073242188, 0.1384143829345703, 0.14434051513671875, 0.1502666473388672, 0.15619277954101562, 0.16211891174316406, 0.1680450439453125, 0.17397117614746094, 0.17989730834960938, 0.1858234405517578, 0.19174957275390625, 0.1976757049560547, 0.20360183715820312, 0.20952796936035156, 0.2154541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 15.0, 27.0, 22.0, 28.0, 37.0, 45.0, 48.0, 51.0, 43.0, 64.0, 49.0, 46.0, 48.0, 54.0, 43.0, 46.0, 43.0, 32.0, 44.0, 30.0, 33.0, 27.0, 13.0, 18.0, 11.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1119384765625, -0.10716056823730469, -0.10238265991210938, -0.09760475158691406, -0.09282684326171875, -0.08804893493652344, -0.08327102661132812, -0.07849311828613281, -0.0737152099609375, -0.06893730163574219, -0.06415939331054688, -0.05938148498535156, -0.05460357666015625, -0.04982566833496094, -0.045047760009765625, -0.04026985168457031, -0.035491943359375, -0.030714035034179688, -0.025936126708984375, -0.021158218383789062, -0.01638031005859375, -0.011602401733398438, -0.006824493408203125, -0.0020465850830078125, 0.0027313232421875, 0.0075092315673828125, 0.012287139892578125, 0.017065048217773438, 0.02184295654296875, 0.026620864868164062, 0.031398773193359375, 0.03617668151855469, 0.04095458984375, 0.04573249816894531, 0.050510406494140625, 0.05528831481933594, 0.06006622314453125, 0.06484413146972656, 0.06962203979492188, 0.07439994812011719, 0.0791778564453125, 0.08395576477050781, 0.08873367309570312, 0.09351158142089844, 0.09828948974609375, 0.10306739807128906, 0.10784530639648438, 0.11262321472167969, 0.117401123046875, 0.12217903137207031, 0.12695693969726562, 0.13173484802246094, 0.13651275634765625, 0.14129066467285156, 0.14606857299804688, 0.1508464813232422, 0.1556243896484375, 0.1604022979736328, 0.16518020629882812, 0.16995811462402344, 0.17473602294921875, 0.17951393127441406, 0.18429183959960938, 0.1890697479248047, 0.19384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 11.0, 18.0, 22.0, 37.0, 63.0, 104.0, 241.0, 506.0, 1368.0, 8017.0, 2181553.0, 1992035.0, 8033.0, 1276.0, 484.0, 221.0, 131.0, 69.0, 37.0, 19.0, 15.0, 1.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8212890625, -1.7789306640625, -1.736572265625, -1.6942138671875, -1.65185546875, -1.6094970703125, -1.567138671875, -1.5247802734375, -1.482421875, -1.4400634765625, -1.397705078125, -1.3553466796875, -1.31298828125, -1.2706298828125, -1.228271484375, -1.1859130859375, -1.1435546875, -1.1011962890625, -1.058837890625, -1.0164794921875, -0.97412109375, -0.9317626953125, -0.889404296875, -0.8470458984375, -0.8046875, -0.7623291015625, -0.719970703125, -0.6776123046875, -0.63525390625, -0.5928955078125, -0.550537109375, -0.5081787109375, -0.4658203125, -0.4234619140625, -0.381103515625, -0.3387451171875, -0.29638671875, -0.2540283203125, -0.211669921875, -0.1693115234375, -0.126953125, -0.0845947265625, -0.042236328125, 0.0001220703125, 0.04248046875, 0.0848388671875, 0.127197265625, 0.1695556640625, 0.2119140625, 0.2542724609375, 0.296630859375, 0.3389892578125, 0.38134765625, 0.4237060546875, 0.466064453125, 0.5084228515625, 0.55078125, 0.5931396484375, 0.635498046875, 0.6778564453125, 0.72021484375, 0.7625732421875, 0.804931640625, 0.8472900390625, 0.8896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 13.0, 9.0, 26.0, 18.0, 33.0, 49.0, 69.0, 94.0, 131.0, 209.0, 313.0, 476.0, 700.0, 601.0, 405.0, 251.0, 200.0, 135.0, 104.0, 74.0, 47.0, 33.0, 26.0, 20.0, 15.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5709953308105469, -0.5550765991210938, -0.5391578674316406, -0.5232391357421875, -0.5073204040527344, -0.49140167236328125, -0.4754829406738281, -0.459564208984375, -0.4436454772949219, -0.42772674560546875, -0.4118080139160156, -0.3958892822265625, -0.3799705505371094, -0.36405181884765625, -0.3481330871582031, -0.33221435546875, -0.3162956237792969, -0.30037689208984375, -0.2844581604003906, -0.2685394287109375, -0.2526206970214844, -0.23670196533203125, -0.22078323364257812, -0.204864501953125, -0.18894577026367188, -0.17302703857421875, -0.15710830688476562, -0.1411895751953125, -0.12527084350585938, -0.10935211181640625, -0.09343338012695312, -0.0775146484375, -0.061595916748046875, -0.04567718505859375, -0.029758453369140625, -0.0138397216796875, 0.002079010009765625, 0.01799774169921875, 0.033916473388671875, 0.049835205078125, 0.06575393676757812, 0.08167266845703125, 0.09759140014648438, 0.1135101318359375, 0.12942886352539062, 0.14534759521484375, 0.16126632690429688, 0.17718505859375, 0.19310379028320312, 0.20902252197265625, 0.22494125366210938, 0.2408599853515625, 0.2567787170410156, 0.27269744873046875, 0.2886161804199219, 0.304534912109375, 0.3204536437988281, 0.33637237548828125, 0.3522911071777344, 0.3682098388671875, 0.3841285705566406, 0.40004730224609375, 0.4159660339355469, 0.431884765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 6.0, 6.0, 19.0, 37.0, 70.0, 166.0, 283.0, 213.0, 99.0, 51.0, 19.0, 14.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.26026725769043, -11.991594314575195, -11.722922325134277, -11.454249382019043, -11.185577392578125, -10.91690444946289, -10.648231506347656, -10.379559516906738, -10.110886573791504, -9.84221363067627, -9.573541641235352, -9.304868698120117, -9.036195755004883, -8.767523765563965, -8.49885082244873, -8.230178833007812, -7.961505889892578, -7.692833423614502, -7.424160957336426, -7.155488014221191, -6.886815547943115, -6.618143081665039, -6.349470138549805, -6.0807976722717285, -5.812125205993652, -5.543452739715576, -5.2747802734375, -5.006107330322266, -4.7374348640441895, -4.468762397766113, -4.200089454650879, -3.9314169883728027, -3.6627445220947266, -3.3940720558166504, -3.125399351119995, -2.85672664642334, -2.5880541801452637, -2.3193817138671875, -2.0507090091705322, -1.7820364236831665, -1.5133638381958008, -1.244691252708435, -0.9760186672210693, -0.7073460817337036, -0.4386734962463379, -0.17000091075897217, 0.09867167472839355, 0.3673442602157593, 0.636016845703125, 0.9046894311904907, 1.1733620166778564, 1.4420346021652222, 1.710707187652588, 1.9793797731399536, 2.2480523586273193, 2.5167250633239746, 2.785397529602051, 3.054069995880127, 3.3227427005767822, 3.5914154052734375, 3.8600878715515137, 4.12876033782959, 4.397433280944824, 4.6661057472229, 4.934778213500977]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 4.0, 8.0, 9.0, 14.0, 16.0, 24.0, 17.0, 23.0, 27.0, 31.0, 38.0, 33.0, 37.0, 62.0, 61.0, 76.0, 70.0, 66.0, 55.0, 45.0, 38.0, 46.0, 32.0, 21.0, 16.0, 19.0, 15.0, 26.0, 17.0, 12.0, 10.0, 11.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.313432455062866, -2.2276346683502197, -2.1418368816375732, -2.0560390949249268, -1.9702411890029907, -1.8844434022903442, -1.7986454963684082, -1.7128477096557617, -1.6270499229431152, -1.5412521362304688, -1.4554543495178223, -1.3696564435958862, -1.2838586568832397, -1.1980608701705933, -1.1122629642486572, -1.0264651775360107, -0.9406673908233643, -0.8548696041107178, -0.7690717577934265, -0.6832739114761353, -0.5974761247634888, -0.5116783380508423, -0.425880491733551, -0.34008264541625977, -0.2542848587036133, -0.1684870421886444, -0.08268922567367554, 0.003108590841293335, 0.08890640735626221, 0.17470422387123108, 0.26050204038619995, 0.3462998867034912, 0.4320974349975586, 0.5178952217102051, 0.6036930680274963, 0.6894909143447876, 0.7752887010574341, 0.8610864877700806, 0.9468843340873718, 1.032682180404663, 1.1184799671173096, 1.204277753829956, 1.2900755405426025, 1.3758734464645386, 1.461671233177185, 1.5474690198898315, 1.6332669258117676, 1.719064712524414, 1.8048624992370605, 1.890660285949707, 1.9764580726623535, 2.062255859375, 2.1480536460876465, 2.233851671218872, 2.3196494579315186, 2.405447244644165, 2.4912450313568115, 2.577042818069458, 2.6628406047821045, 2.748638391494751, 2.8344364166259766, 2.920234203338623, 3.0060319900512695, 3.091829776763916, 3.1776275634765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 18.0, 18.0, 47.0, 64.0, 105.0, 118.0, 228.0, 433.0, 857.0, 2091.0, 5885.0, 18699.0, 84983.0, 676636.0, 208585.0, 34354.0, 9437.0, 3298.0, 1316.0, 538.0, 326.0, 155.0, 98.0, 60.0, 34.0, 36.0, 28.0, 18.0, 12.0, 11.0, 9.0, 10.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33882904052734375, -0.3287811279296875, -0.31873321533203125, -0.308685302734375, -0.29863739013671875, -0.2885894775390625, -0.27854156494140625, -0.26849365234375, -0.25844573974609375, -0.2483978271484375, -0.23834991455078125, -0.228302001953125, -0.21825408935546875, -0.2082061767578125, -0.19815826416015625, -0.1881103515625, -0.17806243896484375, -0.1680145263671875, -0.15796661376953125, -0.147918701171875, -0.13787078857421875, -0.1278228759765625, -0.11777496337890625, -0.10772705078125, -0.09767913818359375, -0.0876312255859375, -0.07758331298828125, -0.067535400390625, -0.05748748779296875, -0.0474395751953125, -0.03739166259765625, -0.02734375, -0.01729583740234375, -0.0072479248046875, 0.00279998779296875, 0.012847900390625, 0.02289581298828125, 0.0329437255859375, 0.04299163818359375, 0.05303955078125, 0.06308746337890625, 0.0731353759765625, 0.08318328857421875, 0.093231201171875, 0.10327911376953125, 0.1133270263671875, 0.12337493896484375, 0.1334228515625, 0.14347076416015625, 0.1535186767578125, 0.16356658935546875, 0.173614501953125, 0.18366241455078125, 0.1937103271484375, 0.20375823974609375, 0.21380615234375, 0.22385406494140625, 0.2339019775390625, 0.24394989013671875, 0.253997802734375, 0.26404571533203125, 0.2740936279296875, 0.28414154052734375, 0.294189453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 10.0, 11.0, 15.0, 20.0, 18.0, 22.0, 38.0, 24.0, 28.0, 44.0, 49.0, 58.0, 67.0, 45.0, 49.0, 44.0, 49.0, 53.0, 47.0, 41.0, 35.0, 39.0, 30.0, 29.0, 25.0, 15.0, 14.0, 7.0, 11.0, 7.0, 12.0, 2.0, 7.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19921875, -0.19310760498046875, -0.1869964599609375, -0.18088531494140625, -0.174774169921875, -0.16866302490234375, -0.1625518798828125, -0.15644073486328125, -0.15032958984375, -0.14421844482421875, -0.1381072998046875, -0.13199615478515625, -0.125885009765625, -0.11977386474609375, -0.1136627197265625, -0.10755157470703125, -0.1014404296875, -0.09532928466796875, -0.0892181396484375, -0.08310699462890625, -0.076995849609375, -0.07088470458984375, -0.0647735595703125, -0.05866241455078125, -0.05255126953125, -0.04644012451171875, -0.0403289794921875, -0.03421783447265625, -0.028106689453125, -0.02199554443359375, -0.0158843994140625, -0.00977325439453125, -0.003662109375, 0.00244903564453125, 0.0085601806640625, 0.01467132568359375, 0.020782470703125, 0.02689361572265625, 0.0330047607421875, 0.03911590576171875, 0.04522705078125, 0.05133819580078125, 0.0574493408203125, 0.06356048583984375, 0.069671630859375, 0.07578277587890625, 0.0818939208984375, 0.08800506591796875, 0.0941162109375, 0.10022735595703125, 0.1063385009765625, 0.11244964599609375, 0.118560791015625, 0.12467193603515625, 0.1307830810546875, 0.13689422607421875, 0.14300537109375, 0.14911651611328125, 0.1552276611328125, 0.16133880615234375, 0.167449951171875, 0.17356109619140625, 0.1796722412109375, 0.18578338623046875, 0.19189453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 15.0, 7.0, 12.0, 22.0, 32.0, 57.0, 72.0, 126.0, 225.0, 483.0, 1171.0, 3884.0, 25038.0, 883539.0, 118919.0, 10877.0, 2361.0, 815.0, 382.0, 203.0, 117.0, 60.0, 37.0, 25.0, 16.0, 18.0, 8.0, 7.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.41927337646484375, -0.4047088623046875, -0.39014434814453125, -0.375579833984375, -0.36101531982421875, -0.3464508056640625, -0.33188629150390625, -0.31732177734375, -0.30275726318359375, -0.2881927490234375, -0.27362823486328125, -0.259063720703125, -0.24449920654296875, -0.2299346923828125, -0.21537017822265625, -0.2008056640625, -0.18624114990234375, -0.1716766357421875, -0.15711212158203125, -0.142547607421875, -0.12798309326171875, -0.1134185791015625, -0.09885406494140625, -0.08428955078125, -0.06972503662109375, -0.0551605224609375, -0.04059600830078125, -0.026031494140625, -0.01146697998046875, 0.0030975341796875, 0.01766204833984375, 0.0322265625, 0.04679107666015625, 0.0613555908203125, 0.07592010498046875, 0.090484619140625, 0.10504913330078125, 0.1196136474609375, 0.13417816162109375, 0.14874267578125, 0.16330718994140625, 0.1778717041015625, 0.19243621826171875, 0.207000732421875, 0.22156524658203125, 0.2361297607421875, 0.25069427490234375, 0.2652587890625, 0.27982330322265625, 0.2943878173828125, 0.30895233154296875, 0.323516845703125, 0.33808135986328125, 0.3526458740234375, 0.36721038818359375, 0.38177490234375, 0.39633941650390625, 0.4109039306640625, 0.42546844482421875, 0.440032958984375, 0.45459747314453125, 0.4691619873046875, 0.48372650146484375, 0.498291015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 10.0, 11.0, 18.0, 12.0, 12.0, 30.0, 25.0, 36.0, 41.0, 58.0, 73.0, 78.0, 97.0, 72.0, 56.0, 50.0, 40.0, 37.0, 35.0, 31.0, 25.0, 23.0, 14.0, 16.0, 18.0, 8.0, 5.0, 13.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7234573364257812, -0.6988677978515625, -0.6742782592773438, -0.649688720703125, -0.6250991821289062, -0.6005096435546875, -0.5759201049804688, -0.55133056640625, -0.5267410278320312, -0.5021514892578125, -0.47756195068359375, -0.452972412109375, -0.42838287353515625, -0.4037933349609375, -0.37920379638671875, -0.3546142578125, -0.33002471923828125, -0.3054351806640625, -0.28084564208984375, -0.256256103515625, -0.23166656494140625, -0.2070770263671875, -0.18248748779296875, -0.15789794921875, -0.13330841064453125, -0.1087188720703125, -0.08412933349609375, -0.059539794921875, -0.03495025634765625, -0.0103607177734375, 0.01422882080078125, 0.038818359375, 0.06340789794921875, 0.0879974365234375, 0.11258697509765625, 0.137176513671875, 0.16176605224609375, 0.1863555908203125, 0.21094512939453125, 0.23553466796875, 0.26012420654296875, 0.2847137451171875, 0.30930328369140625, 0.333892822265625, 0.35848236083984375, 0.3830718994140625, 0.40766143798828125, 0.4322509765625, 0.45684051513671875, 0.4814300537109375, 0.5060195922851562, 0.530609130859375, 0.5551986694335938, 0.5797882080078125, 0.6043777465820312, 0.62896728515625, 0.6535568237304688, 0.6781463623046875, 0.7027359008789062, 0.727325439453125, 0.7519149780273438, 0.7765045166015625, 0.8010940551757812, 0.82568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 3.0, 7.0, 4.0, 11.0, 13.0, 9.0, 15.0, 20.0, 28.0, 39.0, 45.0, 64.0, 83.0, 127.0, 167.0, 316.0, 487.0, 787.0, 1327.0, 2666.0, 5718.0, 13841.0, 42385.0, 233341.0, 673081.0, 46450.0, 14892.0, 6161.0, 2779.0, 1397.0, 832.0, 469.0, 331.0, 187.0, 118.0, 92.0, 62.0, 44.0, 22.0, 22.0, 21.0, 10.0, 12.0, 10.0, 12.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.045866966247558594, -0.04434013366699219, -0.04281330108642578, -0.041286468505859375, -0.03975963592529297, -0.03823280334472656, -0.036705970764160156, -0.03517913818359375, -0.033652305603027344, -0.03212547302246094, -0.03059864044189453, -0.029071807861328125, -0.02754497528076172, -0.026018142700195312, -0.024491310119628906, -0.0229644775390625, -0.021437644958496094, -0.019910812377929688, -0.01838397979736328, -0.016857147216796875, -0.015330314636230469, -0.013803482055664062, -0.012276649475097656, -0.01074981689453125, -0.009222984313964844, -0.0076961517333984375, -0.006169319152832031, -0.004642486572265625, -0.0031156539916992188, -0.0015888214111328125, -6.198883056640625e-05, 0.00146484375, 0.0029916763305664062, 0.0045185089111328125, 0.006045341491699219, 0.007572174072265625, 0.009099006652832031, 0.010625839233398438, 0.012152671813964844, 0.01367950439453125, 0.015206336975097656, 0.016733169555664062, 0.01826000213623047, 0.019786834716796875, 0.02131366729736328, 0.022840499877929688, 0.024367332458496094, 0.0258941650390625, 0.027420997619628906, 0.028947830200195312, 0.03047466278076172, 0.032001495361328125, 0.03352832794189453, 0.03505516052246094, 0.036581993103027344, 0.03810882568359375, 0.039635658264160156, 0.04116249084472656, 0.04268932342529297, 0.044216156005859375, 0.04574298858642578, 0.04726982116699219, 0.048796653747558594, 0.050323486328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 12.0, 14.0, 12.0, 17.0, 19.0, 38.0, 44.0, 96.0, 108.0, 115.0, 117.0, 114.0, 71.0, 55.0, 37.0, 25.0, 24.0, 18.0, 12.0, 17.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.24249267578125e-05, -3.141164779663086e-05, -3.039836883544922e-05, -2.9385089874267578e-05, -2.8371810913085938e-05, -2.7358531951904297e-05, -2.6345252990722656e-05, -2.5331974029541016e-05, -2.4318695068359375e-05, -2.3305416107177734e-05, -2.2292137145996094e-05, -2.1278858184814453e-05, -2.0265579223632812e-05, -1.9252300262451172e-05, -1.823902130126953e-05, -1.722574234008789e-05, -1.621246337890625e-05, -1.519918441772461e-05, -1.4185905456542969e-05, -1.3172626495361328e-05, -1.2159347534179688e-05, -1.1146068572998047e-05, -1.0132789611816406e-05, -9.119510650634766e-06, -8.106231689453125e-06, -7.092952728271484e-06, -6.079673767089844e-06, -5.066394805908203e-06, -4.0531158447265625e-06, -3.039836883544922e-06, -2.0265579223632812e-06, -1.0132789611816406e-06, 0.0, 1.0132789611816406e-06, 2.0265579223632812e-06, 3.039836883544922e-06, 4.0531158447265625e-06, 5.066394805908203e-06, 6.079673767089844e-06, 7.092952728271484e-06, 8.106231689453125e-06, 9.119510650634766e-06, 1.0132789611816406e-05, 1.1146068572998047e-05, 1.2159347534179688e-05, 1.3172626495361328e-05, 1.4185905456542969e-05, 1.519918441772461e-05, 1.621246337890625e-05, 1.722574234008789e-05, 1.823902130126953e-05, 1.9252300262451172e-05, 2.0265579223632812e-05, 2.1278858184814453e-05, 2.2292137145996094e-05, 2.3305416107177734e-05, 2.4318695068359375e-05, 2.5331974029541016e-05, 2.6345252990722656e-05, 2.7358531951904297e-05, 2.8371810913085938e-05, 2.9385089874267578e-05, 3.039836883544922e-05, 3.141164779663086e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 13.0, 16.0, 23.0, 61.0, 75.0, 99.0, 173.0, 277.0, 459.0, 890.0, 1632.0, 3374.0, 7893.0, 21603.0, 80445.0, 781310.0, 107366.0, 25591.0, 9090.0, 3901.0, 1879.0, 963.0, 517.0, 339.0, 177.0, 109.0, 86.0, 57.0, 35.0, 15.0, 13.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05322265625, -0.051482200622558594, -0.04974174499511719, -0.04800128936767578, -0.046260833740234375, -0.04452037811279297, -0.04277992248535156, -0.041039466857910156, -0.03929901123046875, -0.037558555603027344, -0.03581809997558594, -0.03407764434814453, -0.032337188720703125, -0.03059673309326172, -0.028856277465820312, -0.027115821838378906, -0.0253753662109375, -0.023634910583496094, -0.021894454956054688, -0.02015399932861328, -0.018413543701171875, -0.01667308807373047, -0.014932632446289062, -0.013192176818847656, -0.01145172119140625, -0.009711265563964844, -0.007970809936523438, -0.006230354309082031, -0.004489898681640625, -0.0027494430541992188, -0.0010089874267578125, 0.0007314682006835938, 0.002471923828125, 0.004212379455566406, 0.0059528350830078125, 0.007693290710449219, 0.009433746337890625, 0.011174201965332031, 0.012914657592773438, 0.014655113220214844, 0.01639556884765625, 0.018136024475097656, 0.019876480102539062, 0.02161693572998047, 0.023357391357421875, 0.02509784698486328, 0.026838302612304688, 0.028578758239746094, 0.0303192138671875, 0.032059669494628906, 0.03380012512207031, 0.03554058074951172, 0.037281036376953125, 0.03902149200439453, 0.04076194763183594, 0.042502403259277344, 0.04424285888671875, 0.045983314514160156, 0.04772377014160156, 0.04946422576904297, 0.051204681396484375, 0.05294513702392578, 0.05468559265136719, 0.056426048278808594, 0.05816650390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 7.0, 13.0, 12.0, 21.0, 28.0, 34.0, 49.0, 99.0, 169.0, 189.0, 127.0, 72.0, 51.0, 19.0, 17.0, 21.0, 19.0, 9.0, 10.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146484375, -0.14219284057617188, -0.13790130615234375, -0.13360977172851562, -0.1293182373046875, -0.12502670288085938, -0.12073516845703125, -0.11644363403320312, -0.112152099609375, -0.10786056518554688, -0.10356903076171875, -0.09927749633789062, -0.0949859619140625, -0.09069442749023438, -0.08640289306640625, -0.08211135864257812, -0.07781982421875, -0.07352828979492188, -0.06923675537109375, -0.06494522094726562, -0.0606536865234375, -0.056362152099609375, -0.05207061767578125, -0.047779083251953125, -0.043487548828125, -0.039196014404296875, -0.03490447998046875, -0.030612945556640625, -0.0263214111328125, -0.022029876708984375, -0.01773834228515625, -0.013446807861328125, -0.0091552734375, -0.004863739013671875, -0.00057220458984375, 0.003719329833984375, 0.0080108642578125, 0.012302398681640625, 0.01659393310546875, 0.020885467529296875, 0.025177001953125, 0.029468536376953125, 0.03376007080078125, 0.038051605224609375, 0.0423431396484375, 0.046634674072265625, 0.05092620849609375, 0.055217742919921875, 0.05950927734375, 0.06380081176757812, 0.06809234619140625, 0.07238388061523438, 0.0766754150390625, 0.08096694946289062, 0.08525848388671875, 0.08955001831054688, 0.093841552734375, 0.09813308715820312, 0.10242462158203125, 0.10671615600585938, 0.1110076904296875, 0.11529922485351562, 0.11959075927734375, 0.12388229370117188, 0.128173828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 11.0, 10.0, 34.0, 74.0, 316.0, 400.0, 94.0, 37.0, 14.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525306224822998, -2.3678910732269287, -2.2104761600494385, -2.053061008453369, -1.8956459760665894, -1.7382309436798096, -1.5808157920837402, -1.4234007596969604, -1.2659857273101807, -1.1085706949234009, -0.9511556029319763, -0.7937405109405518, -0.636325478553772, -0.4789104461669922, -0.3214953541755676, -0.16408026218414307, -0.006665229797363281, 0.1507498323917389, 0.30816489458084106, 0.46557995676994324, 0.6229950189590454, 0.7804100513458252, 0.9378251433372498, 1.0952402353286743, 1.252655267715454, 1.4100703001022339, 1.5674853324890137, 1.724900484085083, 1.8823155164718628, 2.0397305488586426, 2.197145700454712, 2.3545608520507812, 2.5119762420654297, 2.669391393661499, 2.8268063068389893, 2.9842214584350586, 3.141636371612549, 3.299051523208618, 3.4564666748046875, 3.6138815879821777, 3.771296739578247, 3.9287118911743164, 4.086126804351807, 4.243541717529297, 4.400957107543945, 4.5583720207214355, 4.715786933898926, 4.873202323913574, 5.0306172370910645, 5.188032150268555, 5.345447540283203, 5.502862453460693, 5.660277366638184, 5.817692756652832, 5.975107669830322, 6.1325225830078125, 6.289937973022461, 6.447352886199951, 6.6047682762146, 6.76218318939209, 6.91959810256958, 7.07701301574707, 7.234428405761719, 7.391843318939209, 7.549258232116699]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 10.0, 3.0, 2.0, 6.0, 6.0, 5.0, 12.0, 5.0, 16.0, 12.0, 14.0, 22.0, 27.0, 18.0, 37.0, 58.0, 96.0, 106.0, 97.0, 96.0, 88.0, 51.0, 24.0, 25.0, 19.0, 18.0, 18.0, 20.0, 9.0, 14.0, 6.0, 10.0, 7.0, 7.0, 7.0, 1.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-2.1506664752960205, -2.091336488723755, -2.0320067405700684, -1.9726767539978027, -1.913346767425537, -1.854016900062561, -1.794687032699585, -1.7353570461273193, -1.6760271787643433, -1.6166973114013672, -1.5573673248291016, -1.4980374574661255, -1.4387074708938599, -1.3793776035308838, -1.3200476169586182, -1.260717749595642, -1.201387882232666, -1.14205801486969, -1.0827280282974243, -1.0233981609344482, -0.9640682339668274, -0.9047383069992065, -0.8454083800315857, -0.7860784530639648, -0.7267484664916992, -0.6674185395240784, -0.6080886125564575, -0.5487587451934814, -0.4894288182258606, -0.43009889125823975, -0.3707689642906189, -0.31143906712532043, -0.252109169960022, -0.19277925789356232, -0.13344934582710266, -0.07411941885948181, -0.014789506793022156, 0.0445404052734375, 0.10387033224105835, 0.1632002294063568, 0.22253015637397766, 0.2818600833415985, 0.341189980506897, 0.4005199074745178, 0.45984983444213867, 0.5191797018051147, 0.5785096883773804, 0.6378395557403564, 0.6971694827079773, 0.7564994096755981, 0.815829336643219, 0.8751592636108398, 0.9344891309738159, 0.9938190579414368, 1.0531489849090576, 1.1124788522720337, 1.1718088388442993, 1.2311387062072754, 1.290468692779541, 1.349798560142517, 1.4091285467147827, 1.4684584140777588, 1.5277884006500244, 1.5871182680130005, 1.6464481353759766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 9.0, 9.0, 25.0, 21.0, 24.0, 24.0, 25.0, 35.0, 36.0, 36.0, 43.0, 75.0, 178.0, 122.0, 37.0, 38.0, 28.0, 35.0, 28.0, 14.0, 21.0, 18.0, 14.0, 12.0, 12.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17202186584472656, -0.16643142700195312, -0.1608409881591797, -0.15525054931640625, -0.1496601104736328, -0.14406967163085938, -0.13847923278808594, -0.1328887939453125, -0.12729835510253906, -0.12170791625976562, -0.11611747741699219, -0.11052703857421875, -0.10493659973144531, -0.09934616088867188, -0.09375572204589844, -0.088165283203125, -0.08257484436035156, -0.07698440551757812, -0.07139396667480469, -0.06580352783203125, -0.06021308898925781, -0.054622650146484375, -0.04903221130371094, -0.0434417724609375, -0.03785133361816406, -0.032260894775390625, -0.026670455932617188, -0.02108001708984375, -0.015489578247070312, -0.009899139404296875, -0.0043087005615234375, 0.00128173828125, 0.0068721771240234375, 0.012462615966796875, 0.018053054809570312, 0.02364349365234375, 0.029233932495117188, 0.034824371337890625, 0.04041481018066406, 0.0460052490234375, 0.05159568786621094, 0.057186126708984375, 0.06277656555175781, 0.06836700439453125, 0.07395744323730469, 0.07954788208007812, 0.08513832092285156, 0.090728759765625, 0.09631919860839844, 0.10190963745117188, 0.10750007629394531, 0.11309051513671875, 0.11868095397949219, 0.12427139282226562, 0.12986183166503906, 0.1354522705078125, 0.14104270935058594, 0.14663314819335938, 0.1522235870361328, 0.15781402587890625, 0.1634044647216797, 0.16899490356445312, 0.17458534240722656, 0.18017578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 6.0, 7.0, 4.0, 7.0, 3.0, 2.0, 7.0, 4.0, 9.0, 16.0, 35.0, 44.0, 46.0, 92.0, 125.0, 221.0, 619.0, 1842.0, 7046.0, 775399.0, 7592187.0, 7675.0, 1837.0, 650.0, 255.0, 160.0, 71.0, 53.0, 30.0, 41.0, 19.0, 16.0, 12.0, 10.0, 10.0, 6.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.56608247756958, -1.5213700532913208, -1.476657509803772, -1.4319450855255127, -1.3872326612472534, -1.3425201177597046, -1.2978076934814453, -1.2530951499938965, -1.2083827257156372, -1.163670301437378, -1.118957757949829, -1.0742453336715698, -1.0295329093933105, -0.9848203659057617, -0.9401079416275024, -0.8953954577445984, -0.8506830334663391, -0.8059705495834351, -0.7612581253051758, -0.7165456414222717, -0.6718331575393677, -0.6271207332611084, -0.5824082493782043, -0.5376957654953003, -0.49298331141471863, -0.44827085733413696, -0.4035583734512329, -0.35884591937065125, -0.3141334652900696, -0.2694209814071655, -0.22470852732658386, -0.1799960434436798, -0.13528358936309814, -0.09057112038135529, -0.045858658850193024, -0.0011461973190307617, 0.0435662716627121, 0.08827874064445496, 0.13299119472503662, 0.17770367860794067, 0.22241613268852234, 0.267128586769104, 0.31184107065200806, 0.3565535247325897, 0.4012659788131714, 0.44597846269607544, 0.4906909167766571, 0.5354033708572388, 0.5801158547401428, 0.6248283386230469, 0.6695407629013062, 0.7142532467842102, 0.7589657306671143, 0.8036781549453735, 0.8483906388282776, 0.8931031227111816, 0.9378155469894409, 0.982528030872345, 1.027240514755249, 1.0719529390335083, 1.1166653633117676, 1.1613779067993164, 1.2060903310775757, 1.250802755355835, 1.2955152988433838]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 4.0, 6.0, 9.0, 5.0, 4.0, 3.0, 4.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.898141384124756, -2.814516544342041, -2.730891704559326, -2.6472666263580322, -2.5636417865753174, -2.4800169467926025, -2.3963918685913086, -2.3127670288085938, -2.229142189025879, -2.145517349243164, -2.061892509460449, -1.9782674312591553, -1.8946425914764404, -1.8110177516937256, -1.7273927927017212, -1.6437678337097168, -1.560142993927002, -1.476518154144287, -1.3928931951522827, -1.3092682361602783, -1.2256433963775635, -1.1420185565948486, -1.0583935976028442, -0.9747686982154846, -0.891143798828125, -0.8075188994407654, -0.7238940000534058, -0.6402691006660461, -0.5566442012786865, -0.4730193018913269, -0.3893944025039673, -0.30576950311660767, -0.22214460372924805, -0.13851970434188843, -0.05489480495452881, 0.02873009443283081, 0.11235499382019043, 0.19597989320755005, 0.27960479259490967, 0.3632296919822693, 0.4468545913696289, 0.5304794907569885, 0.6141043901443481, 0.6977292895317078, 0.7813541889190674, 0.864979088306427, 0.9486039876937866, 1.032228946685791, 1.1158537864685059, 1.1994786262512207, 1.283103585243225, 1.3667285442352295, 1.4503533840179443, 1.5339782238006592, 1.6176031827926636, 1.701228141784668, 1.7848529815673828, 1.8684778213500977, 1.952102780342102, 2.0357277393341064, 2.1193525791168213, 2.202977418899536, 2.28660249710083, 2.370227336883545, 2.4538521766662598]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 13.0, 18.0, 14.0, 18.0, 20.0, 27.0, 30.0, 29.0, 35.0, 35.0, 42.0, 45.0, 63.0, 51.0, 59.0, 53.0, 49.0, 48.0, 43.0, 33.0, 30.0, 23.0, 16.0, 36.0, 23.0, 25.0, 18.0, 14.0, 9.0, 10.0, 9.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13158798217773438, -0.12767791748046875, -0.12376785278320312, -0.1198577880859375, -0.11594772338867188, -0.11203765869140625, -0.10812759399414062, -0.104217529296875, -0.10030746459960938, -0.09639739990234375, -0.09248733520507812, -0.0885772705078125, -0.08466720581054688, -0.08075714111328125, -0.07684707641601562, -0.07293701171875, -0.06902694702148438, -0.06511688232421875, -0.061206817626953125, -0.0572967529296875, -0.053386688232421875, -0.04947662353515625, -0.045566558837890625, -0.041656494140625, -0.037746429443359375, -0.03383636474609375, -0.029926300048828125, -0.0260162353515625, -0.022106170654296875, -0.01819610595703125, -0.014286041259765625, -0.0103759765625, -0.006465911865234375, -0.00255584716796875, 0.001354217529296875, 0.0052642822265625, 0.009174346923828125, 0.01308441162109375, 0.016994476318359375, 0.020904541015625, 0.024814605712890625, 0.02872467041015625, 0.032634735107421875, 0.0365447998046875, 0.040454864501953125, 0.04436492919921875, 0.048274993896484375, 0.05218505859375, 0.056095123291015625, 0.06000518798828125, 0.06391525268554688, 0.0678253173828125, 0.07173538208007812, 0.07564544677734375, 0.07955551147460938, 0.083465576171875, 0.08737564086914062, 0.09128570556640625, 0.09519577026367188, 0.0991058349609375, 0.10301589965820312, 0.10692596435546875, 0.11083602905273438, 0.11474609375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 10.0, 6.0, 3.0, 7.0, 4.0, 13.0, 18.0, 15.0, 31.0, 45.0, 74.0, 125.0, 224.0, 380.0, 686.0, 1298.0, 2816.0, 5900.0, 13840.0, 34008.0, 86404.0, 173172.0, 121570.0, 48901.0, 19288.0, 8168.0, 3634.0, 1723.0, 865.0, 418.0, 224.0, 126.0, 97.0, 52.0, 35.0, 24.0, 16.0, 20.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.109375, -1.0774002075195312, -1.0454254150390625, -1.0134506225585938, -0.981475830078125, -0.9495010375976562, -0.9175262451171875, -0.8855514526367188, -0.85357666015625, -0.8216018676757812, -0.7896270751953125, -0.7576522827148438, -0.725677490234375, -0.6937026977539062, -0.6617279052734375, -0.6297531127929688, -0.5977783203125, -0.5658035278320312, -0.5338287353515625, -0.5018539428710938, -0.469879150390625, -0.43790435791015625, -0.4059295654296875, -0.37395477294921875, -0.34197998046875, -0.31000518798828125, -0.2780303955078125, -0.24605560302734375, -0.214080810546875, -0.18210601806640625, -0.1501312255859375, -0.11815643310546875, -0.086181640625, -0.05420684814453125, -0.0222320556640625, 0.00974273681640625, 0.041717529296875, 0.07369232177734375, 0.1056671142578125, 0.13764190673828125, 0.16961669921875, 0.20159149169921875, 0.2335662841796875, 0.26554107666015625, 0.297515869140625, 0.32949066162109375, 0.3614654541015625, 0.39344024658203125, 0.4254150390625, 0.45738983154296875, 0.4893646240234375, 0.5213394165039062, 0.553314208984375, 0.5852890014648438, 0.6172637939453125, 0.6492385864257812, 0.68121337890625, 0.7131881713867188, 0.7451629638671875, 0.7771377563476562, 0.809112548828125, 0.8410873413085938, 0.8730621337890625, 0.9050369262695312, 0.93701171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 14.0, 16.0, 22.0, 30.0, 21.0, 32.0, 29.0, 33.0, 57.0, 44.0, 67.0, 52.0, 60.0, 52.0, 65.0, 46.0, 39.0, 32.0, 43.0, 32.0, 25.0, 22.0, 25.0, 19.0, 9.0, 12.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.182769775390625, -0.17779541015625, -0.172821044921875, -0.1678466796875, -0.162872314453125, -0.15789794921875, -0.152923583984375, -0.14794921875, -0.142974853515625, -0.13800048828125, -0.133026123046875, -0.1280517578125, -0.123077392578125, -0.11810302734375, -0.113128662109375, -0.108154296875, -0.103179931640625, -0.09820556640625, -0.093231201171875, -0.0882568359375, -0.083282470703125, -0.07830810546875, -0.073333740234375, -0.068359375, -0.063385009765625, -0.05841064453125, -0.053436279296875, -0.0484619140625, -0.043487548828125, -0.03851318359375, -0.033538818359375, -0.028564453125, -0.023590087890625, -0.01861572265625, -0.013641357421875, -0.0086669921875, -0.003692626953125, 0.00128173828125, 0.006256103515625, 0.01123046875, 0.016204833984375, 0.02117919921875, 0.026153564453125, 0.0311279296875, 0.036102294921875, 0.04107666015625, 0.046051025390625, 0.051025390625, 0.055999755859375, 0.06097412109375, 0.065948486328125, 0.0709228515625, 0.075897216796875, 0.08087158203125, 0.085845947265625, 0.0908203125, 0.095794677734375, 0.10076904296875, 0.105743408203125, 0.1107177734375, 0.115692138671875, 0.12066650390625, 0.125640869140625, 0.130615234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 6.0, 8.0, 13.0, 25.0, 53.0, 96.0, 90.0, 69.0, 49.0, 18.0, 8.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.331541895866394, -1.2872164249420166, -1.2428910732269287, -1.1985657215118408, -1.1542402505874634, -1.109914779663086, -1.065589427947998, -1.0212640762329102, -0.9769386053085327, -0.9326131939888, -0.8882877826690674, -0.8439623713493347, -0.799636960029602, -0.7553115487098694, -0.7109861373901367, -0.666660726070404, -0.6223353147506714, -0.5780099034309387, -0.533684492111206, -0.4893590807914734, -0.4450336694717407, -0.40070825815200806, -0.3563828468322754, -0.3120574355125427, -0.26773202419281006, -0.2234066128730774, -0.17908120155334473, -0.13475579023361206, -0.0904303789138794, -0.04610496759414673, -0.0017795562744140625, 0.042545855045318604, 0.08687114715576172, 0.13119655847549438, 0.17552196979522705, 0.21984738111495972, 0.2641727924346924, 0.30849820375442505, 0.3528236150741577, 0.3971490263938904, 0.44147443771362305, 0.4857998490333557, 0.5301252603530884, 0.574450671672821, 0.6187760829925537, 0.6631014943122864, 0.707426905632019, 0.7517523169517517, 0.7960777282714844, 0.840403139591217, 0.8847285509109497, 0.9290539622306824, 0.973379373550415, 1.017704725265503, 1.0620301961898804, 1.1063556671142578, 1.1506810188293457, 1.1950063705444336, 1.239331841468811, 1.2836573123931885, 1.3279826641082764, 1.3723080158233643, 1.4166334867477417, 1.4609589576721191, 1.505284309387207]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 7.0, 17.0, 22.0, 57.0, 71.0, 94.0, 70.0, 42.0, 19.0, 14.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1043403148651123, -1.0688014030456543, -1.0332624912261963, -0.9977235794067383, -0.9621846675872803, -0.9266457557678223, -0.8911067843437195, -0.8555678725242615, -0.8200289607048035, -0.7844900488853455, -0.7489511370658875, -0.7134122252464294, -0.6778732538223267, -0.6423343420028687, -0.6067954301834106, -0.5712565183639526, -0.5357176065444946, -0.5001786947250366, -0.4646397829055786, -0.4291008412837982, -0.3935619294643402, -0.3580230176448822, -0.3224840760231018, -0.2869451642036438, -0.2514062523841858, -0.21586734056472778, -0.18032841384410858, -0.14478948712348938, -0.10925057530403137, -0.07371166348457336, -0.03817273676395416, -0.002633810043334961, 0.03290510177612305, 0.06844402104616165, 0.10398294031620026, 0.13952186703681946, 0.17506077885627747, 0.21059969067573547, 0.24613861739635468, 0.2816775441169739, 0.3172164559364319, 0.3527553677558899, 0.3882942795753479, 0.4238332211971283, 0.4593721330165863, 0.4949110448360443, 0.5304499864578247, 0.5659888982772827, 0.6015278100967407, 0.6370667219161987, 0.6726056337356567, 0.7081445455551147, 0.7436834573745728, 0.7792223691940308, 0.8147613406181335, 0.8503002524375916, 0.8858391642570496, 0.9213780760765076, 0.9569169878959656, 0.9924558997154236, 1.0279948711395264, 1.0635337829589844, 1.0990726947784424, 1.1346116065979004, 1.1701505184173584]}, "eval/loss": 0.34626105427742004, "eval/wer": 0.10119000396667989, "eval/runtime": 713.9632, "eval/samples_per_second": 3.7, "eval/steps_per_second": 0.464, "train/train_runtime": 25980.5507, "train/train_samples_per_second": 5.492, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 2.498668275362574, "_wandb": {"runtime": 26988}} \ No newline at end of file